1070 lines
30 KiB
PHP
Executable File
1070 lines
30 KiB
PHP
Executable File
<?php
|
|
|
|
// Yuba
|
|
// //
|
|
//////////////////////////////////////////
|
|
$version = file_get_contents(__DIR__."/current_version.txt");
|
|
|
|
ini_set('memory_limit', '10240M');
|
|
date_default_timezone_set("America/Los_Angeles");
|
|
|
|
// Includes & Prefs
|
|
//////////////////////////////////////////
|
|
|
|
// Timestamp
|
|
|
|
$mytime = time();
|
|
$tmpdir = "/tmp/yuba/".$mytime;
|
|
if (!is_dir($tmpdir)) { mkdir($tmpdir,0777,true); }
|
|
$stamp = date("Y-m-d_H-i-s", $mytime);
|
|
if (!file_exists("/tmp/yuba/debug.log")) { touch("/tmp/yuba/debug.log"); }
|
|
|
|
// Prefs
|
|
|
|
$prefs_file = "/Users/".get_current_user()."/Library/Preferences/org.profiteroles.Yuba.php";
|
|
if (!file_exists($prefs_file)) {
|
|
if (!copy(__DIR__."/prefs.php",$prefs_file)) {
|
|
echo "Error creating preferences file";
|
|
die;
|
|
}
|
|
}
|
|
$p = unserialize(file_get_contents($prefs_file));
|
|
|
|
require("functions.php");
|
|
require("filetypes.php");
|
|
|
|
// Manual prefs
|
|
|
|
$wopt_steps = 7; // total number of steps
|
|
$wopt_currstep = 1;
|
|
if ($p['debug']) { $wopt_clear = 0; } else { $wopt_clear = 1; }
|
|
|
|
$parser = new plistParser();
|
|
|
|
// Menu options
|
|
//////////////////////////////////////////
|
|
|
|
// Preferences
|
|
|
|
if (@$argv[1] == "Preferences...") {
|
|
exec($bin_php." ".escapeshellarg(__DIR__."/YubaPrefs.php")." 2>&1");
|
|
die;
|
|
}
|
|
|
|
// Console
|
|
|
|
if (@$argv[1] == "Console") {
|
|
exec("open -n ".__DIR__."/bin/Console.app --args /tmp/yuba/debug.log");
|
|
die;
|
|
}
|
|
|
|
// Version check
|
|
|
|
if (@$argv[1] == "Check for Updates...") {
|
|
|
|
$curr_version = file_get_contents("https://www.profiteroles.org/git/p/Yuba/raw/master/current_version.txt");
|
|
if ($curr_version > $version) {
|
|
if(askMulti("Yuba ".$curr_version." is available (you have ".$version.")", array("Cancel","Download")) == 1) {
|
|
exec("open https://www.profiteroles.org/git/p/Yuba/");
|
|
echo "QUITAPP\n";
|
|
}
|
|
} else {
|
|
alert($version." is the latest version","Up-to-date");
|
|
die;
|
|
}
|
|
|
|
}
|
|
|
|
dm("Launching Yuba\n".str_repeat("-",33)."\n".print_r($p,true));
|
|
|
|
// PHP Checks
|
|
//////////////////////////////////////////
|
|
|
|
$needed = array("iconv","fileinfo","json","PDO","pdo_sqlite","SimpleXML","sqlite3","xml");
|
|
foreach ($needed as $ext) {
|
|
if (!extension_loaded($ext)) {
|
|
alert("PHP is missing the ".$ext.". Exiting.","PHP Extension Missing");
|
|
echo "QUITAPP\n";
|
|
}
|
|
}
|
|
if ($p['contents'] && !extension_loaded("zip")) {
|
|
alert("PHP is missing the zip extension. Yuba will not collect file contents.","PHP Extension Missing");
|
|
revise_prefs(array("contents" => 0));
|
|
}
|
|
|
|
// Path & application variables
|
|
//////////////////////////////////////////
|
|
|
|
if (!isset($argv[1]) || $argv[1] == "") { echo "No input"; die; }
|
|
$zpath = realpath(@$argv[1]);
|
|
if ($p['bdest']) { $bdest = realpath($p['bdest']); } else { $bdest = "/Users/".get_current_user()."/Documents/Yuba/"; }
|
|
if (!is_dir($bdest)) { if (!mkdir($bdest,0777,true)) { echo "Error creating destination directory"; die; } }
|
|
|
|
// Check for bundle
|
|
if ($zpath == "/") { $blabel = "root"; } else { $blabel = preg_replace("/[^A-Za-z0-9\.]/", "_", basename($zpath)); }
|
|
if (!$p['reuse']) { $blabel .= "-".$mytime; }
|
|
if (is_writable($zpath)) { echo "Warning: source is writeable\n"; }
|
|
|
|
$bpath = chop($bdest,"/")."/".substr(crc32($zpath),0,3)."_".$blabel.".bundle";
|
|
if (!is_dir($bpath)) { mkdir($bpath); }
|
|
if (!is_dir($bpath."/thumbs")) { mkdir($bpath."/thumbs"); }
|
|
if (!is_dir($bpath."/icons")) { mkdir($bpath."/icons"); }
|
|
if (!is_dir($bpath."/contents")) { mkdir($bpath."/contents"); }
|
|
|
|
// Logfile
|
|
$messages_log_file = $bpath."/".$stamp."_messages.log";
|
|
$error_log_file = $bpath."/".$stamp."_error.log";
|
|
error_reporting(E_ALL);
|
|
ini_set("display_errors", TRUE);
|
|
ini_set("log_errors", TRUE);
|
|
ini_set("error_log", $error_log_file);
|
|
|
|
// Bundled QlGenerators
|
|
$generators = @glob(__DIR__."/../Library/Quicklook/*.qlgenerator");
|
|
if (!empty($generators)) {
|
|
foreach ($generators as $generator) {
|
|
$p['bundled_generators'][] = basename($generator);
|
|
}
|
|
}
|
|
|
|
// Parallel check
|
|
//////////////////////////////////////////
|
|
|
|
$physicalcpu = trim(shell_exec("sysctl -n hw.physicalcpu"));
|
|
|
|
if ($p['parallel'] > $physicalcpu) {
|
|
alert("Parallel hardware mismatch");
|
|
echo "QUITAPP\n";
|
|
}
|
|
if ($p['parallel'] == 1) {
|
|
$wopt_parallelmsg = "max";
|
|
} else {
|
|
$wopt_parallelmsg = $p['parallel'];
|
|
}
|
|
|
|
// Banner
|
|
//////////////////////////////////////////
|
|
|
|
if (!is_dir($zpath) | !is_dir($bdest)) { echo "Filepath error"; die; }
|
|
|
|
$banner = "Yuba: ".$zpath." -> ".$bpath;
|
|
echo msg($banner."\n".str_repeat("-", strlen($banner)));
|
|
|
|
// System Info
|
|
//////////////////////////////////////////
|
|
|
|
echo msg("Using ".$wopt_parallelmsg." cores");
|
|
echo msg("Gathering system info...");
|
|
|
|
// Disks
|
|
|
|
if (substr($zpath, 0, 9) != "/Volumes/") {
|
|
$zbase = "/";
|
|
} else {
|
|
$zparts = explode("/", $zpath);
|
|
$zbase = "/Volumes/".$zparts[2];
|
|
}
|
|
|
|
$host = gethostname();
|
|
$disks = shell_exec("diskutil list -plist 2>&1");
|
|
$diskutil = shell_exec("diskutil info -plist ".$zbase." 2>&1");
|
|
$diskutil_parsed = $parser->parseString(utf8_for_xml($diskutil));
|
|
foreach ($diskutil_parsed['SMARTDeviceSpecificKeysMayVaryNotGuaranteed'] as $key => $value) {
|
|
$diskutil_parsed[$key] = $value;
|
|
}
|
|
unset($diskutil_parsed['SMARTDeviceSpecificKeysMayVaryNotGuaranteed']);
|
|
$vdisks = shell_exec("hdiutil info -plist 2>&1");
|
|
$vdisks_parsed = $parser->parseString(utf8_for_xml($vdisks));
|
|
$df = shell_exec("df 2>&1");
|
|
|
|
$df_volume = $diskutil_parsed['MountPoint'];
|
|
$df_device = "/dev/".$diskutil_parsed['ParentWholeDisk'];
|
|
|
|
$mdutil = shell_exec("mdutil -sv ".$df_volume);
|
|
if (strpos($mdutil,"disabled")) {
|
|
echo msg("Warning: spotlight indexing is disabled");
|
|
$p['spotlight'] = false;
|
|
}
|
|
|
|
if ($zpath == "/") {
|
|
$type = "Startup disk";
|
|
} elseif (strtolower($zpath) == strtolower("/Volumes/".$diskutil_parsed["VolumeName"])) {
|
|
if ($diskutil_parsed["BusProtocol"] == "Disk Image") {
|
|
$type = "Disk image";
|
|
} else {
|
|
$type = "External disk";
|
|
}
|
|
} else {
|
|
$type = "Folder";
|
|
}
|
|
|
|
if ($type == "Disk image") {
|
|
$hdiutil = shell_exec("hdiutil imageinfo -plist ".$df_device." 2>&1");
|
|
foreach ($vdisks_parsed['images'] as $id => $disk) {
|
|
if ($disk['system-entities'][0]['dev-entry'] == $df_device) {
|
|
$image_file = $disk['image-path'];
|
|
}
|
|
}
|
|
} else {
|
|
$hdiutil = false;
|
|
$image_file = false;
|
|
}
|
|
|
|
// System Profile
|
|
|
|
if ($p['profile']) {
|
|
echo msg("system_profiler");
|
|
$profile = shell_exec("system_profiler SPHardwareDataType SPStorageDataType SPThunderboltDataType SPUSBDataType 2>&1");
|
|
} else {
|
|
$profile = "disabled";
|
|
}
|
|
$sysvers = shell_exec("sw_vers 2>&1");
|
|
|
|
// QuickLook
|
|
|
|
foreach (explode("\n",shell_exec($bin_qlmanage." -m plugins 2>&1")) as $ql_line) {
|
|
$ql_parts = @explode(" -> ",trim($ql_line));
|
|
if (@$ql_parts[1]) {
|
|
$qlmanage['plugins'][$ql_parts[0]] = $ql_parts[1];
|
|
}
|
|
}
|
|
$qlmanage['server'] = trim(shell_exec($bin_qlmanage." -m server 2>&1"));
|
|
$qlmanage['memory'] = trim(shell_exec($bin_qlmanage." -m memory 2>&1"));
|
|
$qlmanage['burst'] = trim(shell_exec($bin_qlmanage." -m burst 2>&1"));
|
|
$qlmanage['threads'] = trim(shell_exec($bin_qlmanage." -m threads 2>&1"));
|
|
$qlmanage['other'] = trim(shell_exec($bin_qlmanage." -m other 2>&1"));
|
|
|
|
// Database
|
|
//////////////////////////////////////////
|
|
|
|
echo msg("Building database...");
|
|
|
|
$dbo = new PDO("sqlite:".$bpath."/".$stamp.".sqlite3");
|
|
$dbo->setAttribute(PDO::ATTR_ERRMODE, PDO::ERRMODE_EXCEPTION);
|
|
$dbo->setAttribute(PDO::ATTR_DEFAULT_FETCH_MODE, PDO::FETCH_ASSOC);
|
|
|
|
$dbo->query("PRAGMA page_size = 4096");
|
|
$dbo->query("PRAGMA cache_size = 10000");
|
|
$dbo->query("PRAGMA synchronous = NORMAL");
|
|
$dbo->query("PRAGMA locking_mode = NORMAL");
|
|
$dbo->query("PRAGMA journal_mode = WAL");
|
|
|
|
$dbo->exec("CREATE TABLE _skim (
|
|
version TEXT,
|
|
opts TEXT,
|
|
host TEXT,
|
|
uid INTEGER,
|
|
zpath TEXT,
|
|
bpath TEXT,
|
|
type TEXT,
|
|
passed_file INTEGER,
|
|
passed_dir INTEGER,
|
|
passed_link INTEGER,
|
|
passed_total INTEGER,
|
|
nodescended INTEGER,
|
|
ignored INTEGER,
|
|
dupes INTEGER,
|
|
qlmanage TEXT,
|
|
sysvers TEXT,
|
|
disks TEXT,
|
|
diskutil TEXT,
|
|
vdisks TEXT,
|
|
hdiutil TEXT,
|
|
image_file TEXT,
|
|
df TEXT,
|
|
df_device TEXT,
|
|
df_volume TEXT,
|
|
mdutil TEXT,
|
|
profile TEXT,
|
|
status TEXT
|
|
)");
|
|
|
|
$dbo->exec("CREATE TABLE family (
|
|
pid TEXT,
|
|
fid TEXT,
|
|
children TEXT
|
|
)");
|
|
|
|
$dbo->exec("CREATE TABLE dupes (
|
|
fid TEXT,
|
|
dupes TEXT
|
|
)");
|
|
|
|
$dbo->exec("CREATE TABLE files (
|
|
pid TEXT,
|
|
fid TEXT,
|
|
Pathname TEXT,
|
|
Path TEXT,
|
|
Filename TEXT,
|
|
Extension TEXT,
|
|
Type TEXT,
|
|
Size INTEGER,
|
|
Inode INTEGER,
|
|
Perms INTEGER,
|
|
Owner TEXT,
|
|
ATime INTEGER,
|
|
MTime INTEGER,
|
|
CTime INTEGER,
|
|
LinkTarget TEXT,
|
|
RealPath TEXT,
|
|
stat TEXT,
|
|
items INTEGER,
|
|
newest INTEGER,
|
|
fkind TEXT,
|
|
gfi_type TEXT,
|
|
gfi_attr TEXT,
|
|
gfi_created TEXT,
|
|
has_exif INTEGER,
|
|
has_mediainfo INTEGER,
|
|
has_hash INTEGER,
|
|
thumb_filename TEXT,
|
|
thumb_width INTEGER,
|
|
thumb_height INTEGER,
|
|
thumb_tool TEXT,
|
|
icon_filename TEXT,
|
|
icon_tool TEXT,
|
|
contents_filename TEXT
|
|
)");
|
|
|
|
$stmt = $dbo->prepare("INSERT INTO _skim VALUES (:version, :opts, :host, :uid, :zpath, :bpath, :type, :passed_file, :passed_dir, :passed_link, :passed_total, :nodescended, :ignored, :dupes, :qlmanage, :sysvers, :disks, :diskutil, :vdisks, :hdiutil, :image_file, :df, :df_device, :df_volume, :mdutil, :profile, :status)");
|
|
$stmt->BindValue(":version",$version);
|
|
$stmt->BindValue(":opts",serialize($p));
|
|
$stmt->BindValue(":host",$host);
|
|
$stmt->BindValue(":uid",posix_getuid());
|
|
$stmt->BindValue(":zpath",$zpath);
|
|
$stmt->BindValue(":bpath",$bpath);
|
|
$stmt->BindValue(":type",$type);
|
|
$stmt->BindValue(":qlmanage",serialize($qlmanage));
|
|
$stmt->BindValue(":sysvers",$sysvers);
|
|
$stmt->BindValue(":disks",$disks);
|
|
$stmt->BindValue(":diskutil",$diskutil);
|
|
$stmt->BindValue(":vdisks",$vdisks);
|
|
$stmt->BindValue(":hdiutil",$hdiutil);
|
|
$stmt->BindValue(":image_file",$image_file);
|
|
$stmt->BindValue(":df",$df);
|
|
$stmt->BindValue(":df_device",$df_device);
|
|
$stmt->BindValue(":df_volume",$df_volume);
|
|
$stmt->BindValue(":mdutil",$mdutil);
|
|
$stmt->BindValue(":profile",$profile);
|
|
$stmt->BindValue(":status","aborted");
|
|
$stmt->execute();
|
|
|
|
// Iterator
|
|
//////////////////////////////////////////
|
|
|
|
$first_run = 1;
|
|
$passed_file = $passed_dir = $passed_link = $passed_total = $nodescended = $ignored = 0;
|
|
$files = new RecursiveIteratorIterator(
|
|
new RecursiveCallbackFilterIterator(
|
|
new RecursiveDirectoryIterator(
|
|
$zpath,
|
|
RecursiveDirectoryIterator::SKIP_DOTS
|
|
),
|
|
function ($current, $key, $iterator) use ($p) {
|
|
global $nodescended, $ignored, $passed_file, $passed_dir, $passed_link, $passed_total, $first_run;
|
|
$clean = true;
|
|
// identify ignore files
|
|
if (is_array($p['ignore'])) {
|
|
foreach ($p['ignore'] as $wildcard) {
|
|
if (fnmatch($wildcard, $current->getFilename())) {
|
|
$clean = false;
|
|
if ($first_run) { $ignored++; }
|
|
}
|
|
}
|
|
}
|
|
// identify nodescend dirs
|
|
if (is_array($p['nodescend'])) {
|
|
foreach ($p['nodescend'] as $wildcard) {
|
|
if (fnmatch($wildcard, $current->getPath())) {
|
|
$clean = false;
|
|
if ($first_run) { $nodescended++; }
|
|
}
|
|
}
|
|
}
|
|
//tally stats
|
|
if ($clean && $first_run) {
|
|
if ($current->getType() == "file") {
|
|
$passed_file++;
|
|
} elseif ($current->getType() == "dir") {
|
|
$passed_dir++;
|
|
} elseif ($current->getType() == "link") {
|
|
$passed_link++;
|
|
}
|
|
$passed_total++;
|
|
}
|
|
return $clean;
|
|
}
|
|
),
|
|
RecursiveIteratorIterator::SELF_FIRST,
|
|
RecursiveIteratorIterator::CATCH_GET_CHILD
|
|
);
|
|
|
|
// Tally
|
|
//////////////////////////////////////////
|
|
|
|
echo msg("Counting files...");
|
|
|
|
foreach ($files as $null) { }
|
|
$first_run = 0;
|
|
|
|
if (!$passed_total) {
|
|
echo msg("Nothing was found, exiting");
|
|
die;
|
|
}
|
|
|
|
echo msg("Total files: ".$passed_total."");
|
|
|
|
// Prescan
|
|
//////////////////////////////////////////
|
|
|
|
$i = 0;
|
|
$family = array();
|
|
$fids = array();
|
|
$noread = array();
|
|
$splcount = 0;
|
|
$bline = array();
|
|
|
|
echo ProgressBar::start($passed_total,"Prescan (".stepString().")");
|
|
|
|
foreach ($files as $splFileInfo) {
|
|
|
|
$path = $splFileInfo->getPath();
|
|
$pathname = $splFileInfo->getPathname();
|
|
$shellpath = escapeshellarg($splFileInfo->getPathname());
|
|
$realpath = $splFileInfo->getRealPath();
|
|
|
|
$pid = md5($pathname);
|
|
$pkey = md5($path);
|
|
$fid = null;
|
|
|
|
if (array_key_exists($pid, $family)) {
|
|
echo msg("Duplicate key on ".$pathname.""); die;
|
|
}
|
|
|
|
$family[$pid] = array();
|
|
|
|
// Path-agnostic Unique File ID (to prevent redundant hashes and thumbs)
|
|
|
|
if ($splFileInfo->getType() != "dir" && $splFileInfo->getType() != "link") {
|
|
|
|
$fid = md5($splFileInfo->getSize().$splFileInfo->getMtime().$splFileInfo->getBasename());
|
|
$dx[$fid][] = $pathname;
|
|
$family[$pid]['fid'] = $fid;
|
|
$splcount++;
|
|
|
|
}
|
|
|
|
// Collect file stat()
|
|
|
|
if ($p['stat_mode']) {
|
|
|
|
$sty[$i] = statToArray(shell_exec("stat -s ".$shellpath." 2>&1"));
|
|
|
|
if ($p['stat_mode'] > 1 && $splFileInfo->getType() != "link") {
|
|
|
|
// capture stat values for postflight comparison
|
|
$stx[$i] = array($splFileInfo->getATime(), $splFileInfo->getMTime(), $splFileInfo->getCTime());
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
$sty[$i] = "bypass";
|
|
|
|
}
|
|
|
|
// Create batch
|
|
|
|
if ($p['thumbs'] || $p['icons'] || $p['meta'] || $p['hash'] || $p['contents'] || $p['spotlight']) {
|
|
|
|
$parts = array();
|
|
$parts[] = $bin_php;
|
|
$parts[] = escapeshellarg(realpath("helper.php"));
|
|
$parts[] = $i;
|
|
$parts[] = $passed_total;
|
|
$parts[] = $fid ?: $pid;
|
|
$parts[] = escapeshellarg($pathname);
|
|
$parts[] = $splFileInfo->getType();
|
|
$parts[] = escapeshellarg($bpath);
|
|
$parts[] = $mytime;
|
|
$parts[] = $p['spotlight'];
|
|
|
|
$tcmd = implode(" ",$parts);
|
|
$bline[] = $tcmd;
|
|
|
|
}
|
|
|
|
// Check file can be read
|
|
|
|
if ($realpath && !is_readable($realpath)) {
|
|
$noread[] = $realpath;
|
|
}
|
|
|
|
// Children
|
|
|
|
$family[$pkey]['children'][] = $i+1;
|
|
|
|
echo ProgressBar::next(true);
|
|
$i++;
|
|
|
|
}
|
|
|
|
$batchfile = $tmpdir."/batch.sh";
|
|
if (!empty($bline)) {
|
|
file_put_contents($batchfile,implode("\n", $bline));
|
|
msg("Writing batch to file");
|
|
}
|
|
|
|
echo ProgressBar::finish($wopt_clear);
|
|
|
|
// Thow permissions error
|
|
|
|
if (count($noread)) {
|
|
echo msg("Current user (".posix_getuid().") does not have read access to the following files:\n").implode("\n",$noread)."\n";
|
|
if ($p['readability']) {
|
|
echo msg("Exiting...");
|
|
die;
|
|
}
|
|
}
|
|
|
|
// Write family to DB
|
|
|
|
$dupes = array_filter($dx, function($a) { return count($a) > 1; });
|
|
$dupecount = 0;
|
|
$dupetotal = 0;
|
|
|
|
if (count($dupes)) {
|
|
$dupecount = count($dupes,COUNT_RECURSIVE) - count($dupes);
|
|
$dupetotal = floor(($dupecount/$passed_total)*100);
|
|
foreach ($dupes as $fid => $array) {
|
|
$stmt = $dbo->prepare("INSERT INTO dupes VALUES (:fid, :array)");
|
|
$stmt->BindValue(":fid",$fid);
|
|
$stmt->BindValue(":array",serialize($array));
|
|
$stmt->execute();
|
|
}
|
|
}
|
|
|
|
$message = "Writing family to DB: ";
|
|
$message .= $passed_file." files, ";
|
|
$message .= $passed_dir." dirs, ";
|
|
$message .= $nodescended." bundles, ";
|
|
$message .= $passed_link." links, ";
|
|
$message .= $ignored." ignored, ";
|
|
$message .= $dupecount." dupes (".$dupetotal."%)";
|
|
|
|
echo ProgressBar::start(count($family),$message);
|
|
|
|
foreach ($family as $key => $item) {
|
|
|
|
$stmt = $dbo->prepare("INSERT INTO family VALUES (:pid, :fid, :children)");
|
|
$stmt->BindValue(":pid",$key);
|
|
if (@$item['fid']) {
|
|
$stmt->BindValue(":fid",$item['fid']);
|
|
}
|
|
if (@$item['children'] && is_array(@$item['children'])) {
|
|
$stmt->BindValue(":children",serialize($item['children']));
|
|
}
|
|
$stmt->execute();
|
|
|
|
echo ProgressBar::next();
|
|
|
|
}
|
|
|
|
echo ProgressBar::finish($wopt_clear);
|
|
|
|
// create an index for family db
|
|
$dbo->exec("CREATE INDEX family_index ON family (pid)");
|
|
$dbo->exec("CREATE INDEX dupes_index ON dupes (fid)");
|
|
|
|
unset($dx, $dxo, $dupes);
|
|
|
|
// stats
|
|
$stmt = "UPDATE _skim SET ";
|
|
$stmt .= "passed_file=".$passed_file.", ";
|
|
$stmt .= "passed_dir=".$passed_dir.", ";
|
|
$stmt .= "passed_link=".$passed_link.", ";
|
|
$stmt .= "passed_total=".$passed_total.", ";
|
|
$stmt .= "nodescended=".$nodescended.", ";
|
|
$stmt .= "ignored=".$ignored.", ";
|
|
$stmt .= "dupes=".(@$dupecount ? $dupecount : 0);
|
|
$dbo->exec($stmt);
|
|
|
|
$wopt_currstep++;
|
|
|
|
// Init Spotlight DB
|
|
//////////////////////////////////////////
|
|
|
|
if ($p['spotlight']) { $dbo->exec("CREATE TABLE mdls (id INTEGER PRIMARY KEY,".implode(",",$cbuild).")"); }
|
|
|
|
// Pool DB
|
|
//////////////////////////////////////////
|
|
|
|
$dbp = new PDO("sqlite:".$bpath."/pool.sqlite3");
|
|
|
|
$dbp->setAttribute(PDO::ATTR_ERRMODE, PDO::ERRMODE_EXCEPTION);
|
|
|
|
$dbp->query("PRAGMA page_size = 4096");
|
|
$dbp->query("PRAGMA cache_size = 10000");
|
|
$dbp->query("PRAGMA synchronous = NORMAL");
|
|
$dbp->query("PRAGMA locking_mode = NORMAL");
|
|
$dbp->query("PRAGMA journal_mode = WAL");
|
|
|
|
$dbp->exec("CREATE TABLE IF NOT EXISTS md5 (fid TEXT, hash TEXT)");
|
|
$dbp->exec("CREATE TABLE IF NOT EXISTS exiftool (fid TEXT, tags TEXT)");
|
|
$dbp->exec("CREATE TABLE IF NOT EXISTS mediainfo (fid TEXT, info TEXT)");
|
|
$dbp->exec("CREATE TABLE IF NOT EXISTS thumbs (fid TEXT, created INTEGER, relative_path TEXT, width INTEGER, height INTEGER, tool TEXT)");
|
|
$dbp->exec("CREATE TABLE IF NOT EXISTS icons (fid TEXT, hash TEXT, created INTEGER, relative_path TEXT, tool TEXT)");
|
|
$dbp->exec("CREATE TABLE IF NOT EXISTS contents (fid TEXT, created INTEGER, relative_path TEXT)");
|
|
|
|
// Helper
|
|
//////////////////////////////////////////
|
|
|
|
if (file_exists($batchfile)) {
|
|
|
|
echo ProgressBar::start($passed_file,"Running batch (".stepString().")");
|
|
if ($p['parallel'] === 0) {
|
|
passthru("bash ".$batchfile);
|
|
} elseif ($p['parallel'] === 1) {
|
|
passthru($bin_parallel." < ".$batchfile);
|
|
} else {
|
|
passthru($bin_parallel." -j ".$p['parallel']." < ".$batchfile);
|
|
}
|
|
echo ProgressBar::finish($wopt_clear);
|
|
|
|
}
|
|
|
|
// Pool Indices
|
|
//////////////////////////////////////////
|
|
|
|
// We are done with the Pool DB, make sure there are indices
|
|
|
|
$dbp->exec("CREATE INDEX IF NOT EXISTS contents_index ON contents (fid)");
|
|
$dbp->exec("CREATE INDEX IF NOT EXISTS exiftool_index ON exiftool (fid)");
|
|
$dbp->exec("CREATE INDEX IF NOT EXISTS md5_index ON md5 (fid)");
|
|
$dbp->exec("CREATE INDEX IF NOT EXISTS mediainfo_index ON mediainfo (fid)");
|
|
$dbp->exec("CREATE INDEX IF NOT EXISTS thumbs_index ON thumbs (fid)");
|
|
$dbp->exec("CREATE INDEX IF NOT EXISTS icons_index ON icons (fid)");
|
|
|
|
// Files
|
|
//////////////////////////////////////////
|
|
|
|
$j = 0;
|
|
|
|
echo ProgressBar::start($passed_total, "Skimming");
|
|
|
|
foreach ($files as $splFileInfo) {
|
|
|
|
// DB
|
|
|
|
$stmt = $dbo->prepare("INSERT INTO files VALUES (:pid, :fid, :Pathname, :Path, :Filename, :Extension, :Type, :Size, :Inode, :Perms, :Owner, :ATime, :MTime, :CTime, :LinkTarget, :RealPath, :stat, :items, :newest, :fkind, :gfi_type, :gfi_attr, :gfi_created, :has_exif, :has_mediainfo, :has_hash, :thumb_filename, :thumb_width, :thumb_height, :thumb_tool, :icon_filename, :icon_tool, :contents_filename)");
|
|
|
|
// Identify dir, file, link or bundle dir
|
|
|
|
$type = $splFileInfo->getType();
|
|
if ($type == "dir") {
|
|
foreach ($p['bundles'] as $bundle) {
|
|
$check = ".".$bundle;
|
|
if (substr($splFileInfo->getFilename(), -(strlen($check)), strlen($check)) == $check) { $type = "bundle"; }
|
|
}
|
|
}
|
|
|
|
$stmt->BindValue(":Type",$type);
|
|
|
|
// Path basics
|
|
|
|
$pathname = $splFileInfo->getPathname();
|
|
$path = $splFileInfo->getPath();
|
|
$filename = $splFileInfo->getFilename();
|
|
$extension = $splFileInfo->getExtension();
|
|
$shellpath = escapeshellarg($pathname);
|
|
|
|
$stmt->BindValue(":Pathname",$pathname);
|
|
$stmt->BindValue(":Path",$path);
|
|
$stmt->BindValue(":Filename",$filename);
|
|
$stmt->BindValue(":Extension",$extension);
|
|
|
|
//stat
|
|
$stmt->BindValue(":stat",serialize($sty[$j]));
|
|
|
|
if ($type == "link") {
|
|
|
|
$stmt->BindValue(":LinkTarget",$splFileInfo->getLinkTarget());
|
|
$stmt->BindValue(":RealPath",$splFileInfo->getRealPath());
|
|
|
|
} else {
|
|
|
|
$stmt->BindValue(":Inode",$splFileInfo->getInode());
|
|
$stmt->BindValue(":Perms",$splFileInfo->getPerms());
|
|
$stmt->BindValue(":Owner",$splFileInfo->getOwner().":".$splFileInfo->getGroup());
|
|
|
|
$stmt->BindValue(":ATime",$splFileInfo->getATime());
|
|
$stmt->BindValue(":MTime",$splFileInfo->getMTime());
|
|
$stmt->BindValue(":CTime",$splFileInfo->getCTime());
|
|
|
|
}
|
|
|
|
// ------------------------------------------------ //
|
|
|
|
// Generate PID and FID
|
|
|
|
$pid = md5($pathname);
|
|
$stmt->BindValue(":pid",$pid);
|
|
|
|
if ($type == "file") {
|
|
$fid = md5($splFileInfo->getSize().$splFileInfo->getMtime().$splFileInfo->getBasename());
|
|
$stmt->BindValue(":fid",$fid);
|
|
}
|
|
|
|
// Size
|
|
|
|
if ($type == "dir" || $type == "bundle") {
|
|
$size = trim(shell_exec("du -ks ".$shellpath." | cut -f1"))*1024;
|
|
} elseif ($type == "file") {
|
|
$size = $splFileInfo->getSize();
|
|
} else {
|
|
$size = null;
|
|
}
|
|
$stmt->BindValue(":Size",@$size);
|
|
|
|
// ------------------------------------------------ //
|
|
|
|
// Items
|
|
|
|
if ($type == "dir" || $type == "bundle" ) {
|
|
// below commented out because it was causing -1 on dirs beginning with a dot
|
|
//$items = chop(@shell_exec("find ".$shellpath." \( ! -regex '.*/\..*' \) | wc -l 2>&1"))-1;
|
|
// below should be rewritten to use $wopt_ignore files
|
|
$items = chop(@shell_exec("find ".$shellpath." \( ! -regex '.*/\.DS_Store' \) | wc -l 2>&1"))-1;
|
|
$stmt->BindValue(":items",@$items);
|
|
}
|
|
|
|
// ------------------------------------------------ //
|
|
|
|
// Newest
|
|
|
|
if ($type == "dir") {
|
|
$newest = @filemtime(chop(shell_exec("find ".$shellpath." -type f -not -path '*/\.*' -print0 | xargs -0 stat -f \"%m %N\" | sort -rn 2>&1 | head -1 | cut -f2- -d\" \"")));
|
|
$stmt->BindValue(":newest",@$newest);
|
|
}
|
|
|
|
// ------------------------------------------------ //
|
|
|
|
// GetFileInfo
|
|
|
|
$gfiparts = explode("\n", chop(shell_exec($bin_gfi." -P ".$shellpath." 2>&1")));
|
|
if (is_array($gfiparts)) {
|
|
foreach ($gfiparts as $line) {
|
|
list($label, $value) = explode(": ", $line);
|
|
$gfi[$label] = isset($value) ? trim($value,"\"") : null;
|
|
}
|
|
}
|
|
|
|
$writegfitype = @$gfi['type'].":".@$gfi['creator'];
|
|
if ($writegfitype == "\\0\\0\\0\\0:\\0\\0\\0\\0" || $writegfitype == ":") { $writegfitype = null; }
|
|
|
|
$stmt->BindValue(":gfi_type",$writegfitype);
|
|
$stmt->BindValue(":gfi_attr",@$gfi['attributes']);
|
|
$stmt->BindValue(":gfi_created",strtotime(@$gfi['created']));
|
|
|
|
// ------------------------------------------------ //
|
|
|
|
// Kind
|
|
|
|
unset($fkind);
|
|
|
|
if ($type == "file") {
|
|
$fkind = trim(shell_exec("export LC_ALL=C; file -b -p ".$shellpath." | cut -f1 -d,"));
|
|
$stmt->BindValue(":fkind",@$fkind);
|
|
}
|
|
|
|
// ------------------------------------------------ //
|
|
|
|
// Pool
|
|
|
|
if ($type == "file") {
|
|
|
|
$fetch_icon = @$dbp->query("SELECT * FROM icons WHERE fid='".$fid."'")->fetch();
|
|
if (@$fetch_icon['relative_path']) {
|
|
$stmt->BindValue(":icon_filename",$fetch_icon['relative_path']);
|
|
$stmt->BindValue(":icon_tool",$fetch_icon['tool']);
|
|
}
|
|
|
|
unset($fetch_exif, $fetch_media, $fetch_hash, $fetch_thumb, $fetch_icon, $yes_exif, $yes_media, $yes_hash);
|
|
|
|
$yes_exif = $dbp->query("SELECT rowid FROM exiftool WHERE fid='".$fid."'")->fetch()[0];
|
|
$stmt->BindValue(":has_exif",$yes_exif);
|
|
|
|
$yes_media = $dbp->query("SELECT rowid FROM mediainfo WHERE fid='".$fid."'")->fetch()[0];
|
|
$stmt->BindValue(":has_mediainfo",$yes_media);
|
|
|
|
$yes_hash = $dbp->query("SELECT rowid FROM md5 WHERE fid='".$fid."'")->fetch()[0];
|
|
$stmt->BindValue(":has_hash",$yes_hash);
|
|
|
|
$yes_contents = $dbp->query("SELECT relative_path FROM contents WHERE fid='".$fid."'")->fetch()[0];
|
|
$stmt->BindValue(":contents_filename",$yes_contents);
|
|
|
|
$fetch_thumb = $dbp->query("SELECT * FROM thumbs WHERE fid='".$fid."'")->fetch();
|
|
|
|
if (@$fetch_thumb['relative_path']) {
|
|
$stmt->BindValue(":thumb_filename",$fetch_thumb['relative_path']);
|
|
$stmt->BindValue(":thumb_width",$fetch_thumb['width']);
|
|
$stmt->BindValue(":thumb_height",$fetch_thumb['height']);
|
|
$stmt->BindValue(":thumb_tool",$fetch_thumb['tool']);
|
|
} else {
|
|
$stmt->BindValue(":thumb_filename",null);
|
|
}
|
|
|
|
} else {
|
|
|
|
unset($fetch_icon, $fetch_thumb);
|
|
|
|
$fetch_icon = @$dbp->query("SELECT * FROM icons WHERE fid='".$pid."'")->fetch();
|
|
if (@$fetch_icon['relative_path']) {
|
|
$stmt->BindValue(":icon_filename",$fetch_icon['relative_path']);
|
|
$stmt->BindValue(":icon_tool",$fetch_icon['tool']);
|
|
}
|
|
|
|
$fetch_thumb = $dbp->query("SELECT * FROM thumbs WHERE fid='".$pid."'")->fetch();
|
|
|
|
if (@$fetch_thumb['relative_path']) {
|
|
$stmt->BindValue(":thumb_filename",$fetch_thumb['relative_path']);
|
|
$stmt->BindValue(":thumb_width",$fetch_thumb['width']);
|
|
$stmt->BindValue(":thumb_height",$fetch_thumb['height']);
|
|
$stmt->BindValue(":thumb_tool",$fetch_thumb['tool']);
|
|
} else {
|
|
$stmt->BindValue(":thumb_filename",null);
|
|
}
|
|
|
|
}
|
|
|
|
// ------------------------------------------------ //
|
|
|
|
// Write to DB
|
|
|
|
$stmt->execute();
|
|
|
|
// Double check stat for file against pre-run value
|
|
|
|
if ($p['stat_mode'] > 1 && $type != "link") {
|
|
|
|
$restat = statToArray(shell_exec("stat -s ".$shellpath." 2>&1"));
|
|
|
|
$message = array();
|
|
if ($sty[$j]['st_atime'] != $restat['st_atime']) {
|
|
if ($p['stat_mode'] == 3 && is_writable($pathname)) {
|
|
exec("touch -at `date -r ".$sty[$j]['st_atime']." +%Y%m%d%H%M.%S` ".$shellpath." 2>&1");
|
|
$message[] = "atime (fix)";
|
|
} else {
|
|
$message[] = "atime";
|
|
}
|
|
}
|
|
if ($sty[$j]['st_mtime'] != $restat['st_mtime']) {
|
|
$message[] = "mtime";
|
|
}
|
|
if ($sty[$j]['st_ctime'] != $restat['st_ctime']) {
|
|
$message[] = "ctime";
|
|
}
|
|
|
|
if (count($message)) { echo msg(" CHANGE = ".implode(", ", $message).""); }
|
|
|
|
}
|
|
|
|
echo ProgressBar::next($pathname);
|
|
$j++;
|
|
|
|
}
|
|
|
|
echo ProgressBar::finish($wopt_clear);
|
|
|
|
// Milk
|
|
//////////////////////////////////////////
|
|
|
|
$milk['t*DocTitle'] = ["e^Title","k^Title","m^Track_name"];
|
|
$milk['t*Format'] = ["m^Format","e^Compression","e^MIMEType"];
|
|
$milk['t*Dimensions'] = ["k^PixelWidth.k^PixelHeight","e^PixelWidth.e^PixelHeight","m^SkimDims","k^SkimPageDims"];
|
|
$milk['s*Seconds'] = ["k^DurationSeconds","e^Duration","m^Duration"];
|
|
$milk['d*DateTime'] = ["e^DateTimeOriginal","m^EncodedDate","e^CreateDate","e^MediaCreateDate","k^ContentCreationDate"];
|
|
$milk['t*Origin'] = ["e^CameraModelName","e^Producer","e^CreatorTool","e^WriterName","e^Software","e^Encoder","k^Creator"];
|
|
$milk['t*GPS'] = ["k^Latitude.k^Longitude","e^GPSPosition"];
|
|
$milk['t*Author'] = ["e^Author","e^Artist","e^Creator","e^By-line","k^Copyright"];
|
|
|
|
$milk['i*Tracks'] = ["m^SkimTrackCount","k^NumberOfPages"];
|
|
$milk['t*Writer'] = ["m^Writing_application.m^Writing_library"];
|
|
$milk['t*Bitrate'] = ["m^Overall_bit_rate","e^AvgBitrate","k^TotalBitRate"];
|
|
|
|
//$milk['i*Orientation'] = ["e^Orientation"];
|
|
//$milk['t*Profile'] = ["e^Profile"];
|
|
//$milk['i*BitDepth'] = ["e^BitDepth"];
|
|
//$milk['t*LensType'] = ["e^LensType"];
|
|
//$milk['t*FocalLength'] = ["e^FocalLength"];
|
|
//$milk['t*Aperture'] = ["e^Aperture"];
|
|
//$milk['t*LightSource'] = ["e^LightSource"];
|
|
//$milk['t*WhiteBalance'] = ["e^WhiteBalance"];
|
|
|
|
$delimiter = ",";
|
|
$display_delimiter = " x ";
|
|
|
|
// Build DB
|
|
|
|
$cbuild = $ibuild = array();
|
|
foreach (array_keys($milk) as $name) {
|
|
list($kind,$item) = explode("*",$name);
|
|
switch ($kind) {
|
|
case "t":
|
|
case "d":
|
|
case "s":
|
|
$cbuild[] = $item." TEXT";
|
|
break;
|
|
case "i":
|
|
$cbuild[] = $item." INTEGER";
|
|
break;
|
|
}
|
|
$ibuild[] = ":".$item;
|
|
}
|
|
|
|
$dbo->exec("CREATE TABLE milk (".implode(",",$cbuild).")");
|
|
|
|
$countrows = @reset($dbo->query("SELECT max(rowid) FROM files")->fetch());
|
|
echo msg("Milking ".$countrows." rows");
|
|
echo ProgressBar::start($countrows, "Milk");
|
|
|
|
$loop = $dbo->query("SELECT rowid, * FROM files");
|
|
while ($row_a = $loop->fetch()) {
|
|
|
|
$stmt = $dbo->prepare("INSERT INTO milk VALUES (".implode(",",$ibuild).")");
|
|
|
|
if ($dbo->query("SELECT name FROM sqlite_master WHERE name='mdls'")->fetch()) {
|
|
$row_b = @$dbo->query("SELECT * FROM mdls WHERE (rowid='".$row_a['rowid']."')")->fetch();
|
|
}
|
|
|
|
if (count(@$row_b) > 1) {
|
|
$m['k'] = $row_b;
|
|
|
|
//custom values
|
|
|
|
if ($m['k']['PageWidth'] && $m['k']['PageHeight']) {
|
|
$m['k']['SkimPageDims'] = round($m['k']['PageWidth']/72,2)."in".$display_delimiter.round($m['k']['PageHeight']/72,2)."in";
|
|
}
|
|
|
|
} else {
|
|
$m['k'] = null;
|
|
}
|
|
|
|
if (isset($row_a['has_exif'])) {
|
|
$row_c = $dbp->query("SELECT * FROM exiftool WHERE (rowid='".$row_a['has_exif']."')")->fetch();
|
|
$m['e'] = unserialize($row_c['tags']);
|
|
} else {
|
|
$m['e'] = null;
|
|
}
|
|
|
|
if (isset($row_a['has_mediainfo'])) {
|
|
|
|
$row_d = $dbp->query("SELECT * FROM mediainfo WHERE (rowid='".$row_a['has_mediainfo']."')")->fetch();
|
|
if (substr($row_d['info'],0,5) == "<?xml") {
|
|
$decoded = @json_decode(json_encode(simplexml_load_string($row_d['info'])),true);
|
|
$m_base = $decoded['File']['track'];
|
|
$m['m'] = $decoded['File']['track'][0];
|
|
} else {
|
|
$decoded = @json_decode($row_d['info'],true);
|
|
$m_base = $decoded['media']['track'];
|
|
$m['m'] = $decoded['media']['track'][0];
|
|
}
|
|
|
|
$m['m']['SkimTrackCount'] = @count($m_base);
|
|
if (is_array($m_base)) {
|
|
foreach (@$m_base as $track) {
|
|
if (!@$m['m']['SkimDims'] && @$track['Width'] && @$track['Height']) {
|
|
$m['m']['SkimDims'] = @sanitize($track['Width'],"i").$display_delimiter.@sanitize($track['Height'],"i");
|
|
}
|
|
}
|
|
}
|
|
|
|
// do seconds fix here
|
|
|
|
} else {
|
|
|
|
$m['m'] = null;
|
|
|
|
}
|
|
|
|
// M*I*L*K baby
|
|
foreach ($milk as $value => $weighted) {
|
|
|
|
list($type,$name) = explode("*",$value);
|
|
$found = 0;
|
|
|
|
foreach ($weighted as $dindex) {
|
|
|
|
// concatenante 2 values
|
|
if (!$found && strpos($dindex, ".")) {
|
|
|
|
$parts = explode(".",$dindex);
|
|
$out = array();
|
|
foreach ($parts as $part) {
|
|
list($kind,$item) = explode("^",$part);
|
|
if (@$m[$kind][$item]) {
|
|
$out[] = sanitize($m[$kind][$item],$type);
|
|
}
|
|
}
|
|
if (count($out)) {
|
|
$stmt->BindValue(":".$name,implode($delimiter,$out));
|
|
$found = 1;
|
|
}
|
|
|
|
} elseif (!$found) {
|
|
|
|
// find a single value
|
|
list($kind,$item) = @explode("^",$dindex);
|
|
if (@$m[$kind][$item]) {
|
|
$stmt->BindValue(":".$name,@sanitize($m[$kind][$item],$type));
|
|
$found = 1;
|
|
}
|
|
|
|
}
|
|
}
|
|
|
|
}
|
|
|
|
echo ProgressBar::next(true);
|
|
|
|
$stmt->execute();
|
|
|
|
}
|
|
|
|
echo ProgressBar::finish($wopt_clear);
|
|
|
|
// Cleanup
|
|
//////////////////////////////////////////
|
|
|
|
echo msg("");
|
|
|
|
if (file_exists($error_log_file)) { echo file_get_contents($error_log_file); }
|
|
|
|
$seconds = floor($time = microtime(true)-$_SERVER["REQUEST_TIME_FLOAT"]);
|
|
$dbo->exec("UPDATE _skim SET status='completed_in_".$seconds."'");
|
|
|
|
// rsync
|
|
|
|
if ($p['postflight'] == 3) {
|
|
$url = "http://localhost/rtc.php?db=data/".basename($bpath)."/".$stamp.".sqlite3";
|
|
exec("open ".$url);
|
|
} elseif ($p['postflight'] == 2 && $p['rsync_dest']) {
|
|
echo msg("rsync...");
|
|
$command = "rsync -avv -e ssh ".$bpath." ".$p['rsync_dest'];
|
|
$count = trim(shell_exec("find ".escapeshellarg($bpath)." | wc -l"));
|
|
echo ProgressBar::start($count,$p['rsync_dest']);
|
|
$pipe = popen($command, "r");
|
|
while(fgets($pipe, 2048)) { echo ProgressBar::next(true); }
|
|
pclose($pipe);
|
|
echo ProgressBar::finish();
|
|
} elseif ($p['postflight'] == 1) {
|
|
exec("open -R ".escapeshellarg($bpath));
|
|
}
|
|
|
|
$done = "Finished ".$zpath." in ".$seconds." seconds";
|
|
$done_m = "Memory usage: ".prettysize(memory_get_usage(true));
|
|
echo msg($done."\n".$done_m); notification($done);
|
|
|
|
unset($dbo, $dbp, $files, $family);
|
|
|
|
?>
|