upd to 0.2

This commit is contained in:
ivan 2023-07-27 21:34:46 +03:00
parent 8d123343a3
commit 1225caf012
3 changed files with 289 additions and 140 deletions

View File

@ -2,11 +2,11 @@
mySQL image downloader / replacer wizard mySQL image downloader / replacer wizard
v.0.1 alpha v.0.2 beta adopted for php8
DWTWL license https://soundragon.su/license/license.html DWTWL license https://soundragon.su/license/license.html
This is alpha version written for specific needs. If you want complete and expanded version of this script, then make the request. This is beta version written for specific needs. If you want complete and expanded version of this script, then make the request.
@ -21,4 +21,4 @@ Using:
/mysqlim/ /mysqlim/
3. Add write privilegies for this directory. 3. Add write privilegies for this directory.
4. Login to wizard by web-browser: 4. Login to wizard by web-browser:
http://yourserver.com/mysqlim/ http://yourserver.com/mysqlim/index.php

View File

@ -1,7 +1,8 @@
<?php <?php
/** /**
* mySQL image replacer - https://github.com/zlaxy/mysqlimagereplacer * mySQL image replacer - https://gitlab.com/zlax/mysqlimagereplacer
* v.0.1 alpha - uder DWTWL license https://soundragon.su/license/license.html * adopted for php8.2
* v.0.2 beta - uder DWTWL license https://soundragon.su/license/license.html
* exec script * exec script
* *
* !MAKE BACKUP OF YOUR SQL-TABLE BEFORE YOU TRY THIS SCRIPT! * !MAKE BACKUP OF YOUR SQL-TABLE BEFORE YOU TRY THIS SCRIPT!
@ -33,9 +34,9 @@ function DownloadFopen($URL) {
} else { } else {
if (exif_imagetype($fileprefix.rawurldecode(pathinfo($URL)['basename']))>0) $result=$fileprefix.pathinfo($URL)['basename']; if (exif_imagetype($fileprefix.rawurldecode(pathinfo($URL)['basename']))>0) $result=$fileprefix.pathinfo($URL)['basename'];
else { else {
unlink ($fileprefix.rawurldecode(pathinfo($URL)['basename'])); unlink ($fileprefix.rawurldecode(pathinfo($URL)['basename']));
$result=false; $result=false;
} }
} }
} else { } else {
file_put_contents(rawurldecode(pathinfo($URL)['basename']), file_get_contents($URL)); file_put_contents(rawurldecode(pathinfo($URL)['basename']), file_get_contents($URL));
@ -67,22 +68,40 @@ $htmlprefix=$indatacsv[11];
$fixalready=$indatacsv[12]; $fixalready=$indatacsv[12];
$fixundownload=$indatacsv[13]; $fixundownload=$indatacsv[13];
$correctimagenumber=$indatacsv[14]; $correctimagenumber=$indatacsv[14];
$filtcolumn=$indatacsv[15];
$filtvalue=$indatacsv[16];
$ahrefparents=$indatacsv[17];
$webarchived=$indatacsv[18];
unlink ("indata.csv"); unlink ("indata.csv");
if ($logmessage=="emptyindata") echo "Can't read data file, please check write pirivlegies for ",$execdir," directory"; if (isset($logmessage) && $logmessage=="emptyindata")
echo "Can't read data file, please check write pirivlegies for ",$execdir," directory";
chdir("../".$dirname); chdir("../".$dirname);
if ($subdir) chdir ($subdir); if ($subdir)
$dbconnection=mysqli_connect($dbhost,$dbuser,$dbpass,$dbname); chdir ($subdir);
mysqli_set_charset($dbconnection,'utf8'); $dbconnection=mysqli_connect($dbhost,$dbuser,$dbpass,$dbname);
$resulttable=mysqli_query($dbconnection,"SELECT * FROM ".$dbtable); mysqli_set_charset($dbconnection,'utf8');
$totalstatus="started"; $resulttable=mysqli_query($dbconnection,"SELECT * FROM ".$dbtable);
$updatedurls=0; $totalstatus="started";
$failedtoupdate=0; $updatedurls=0;
$deletedurls=0; $failedtoupdate=0;
$rawsedit=0; $deletedurls=0;
SaveStatus ($totalstatus,$rawsedit,$updatedurls,$failedtoupdate,$deletedurls,$execdir); $rawsedit=0;
while($row=mysqli_fetch_assoc($resulttable)){ SaveStatus ($totalstatus,$rawsedit,$updatedurls,$failedtoupdate,$deletedurls,$execdir);
$originalcontent=$row[$dbcolumn]; $filteredpostnumber=0;
while($row=mysqli_fetch_assoc($resulttable)){
if (!empty($filtcolumn) && !empty($filtvalue)) {
if ($row[$filtcolumn] == $filtvalue) {
if (!empty($row[$dbcolumn]))
$originalcontent=$row[$dbcolumn];
$filteredpostnumber++;
}
} else { if (!empty($row[$dbcolumn]))
$originalcontent=$row[$dbcolumn];
$filteredpostnumber++;
}
if (isset($originalcontent)) {
$newcontent=$originalcontent; $newcontent=$originalcontent;
if ($fixbroken) { if ($fixbroken) {
$contentpost=new DOMDocument(); $contentpost=new DOMDocument();
@ -106,10 +125,25 @@ if ($subdir) chdir ($subdir);
$imageTags=$contentpost->getElementsByTagName('img'); $imageTags=$contentpost->getElementsByTagName('img');
for ($i = $imageTags->length; --$i >= 0; ) { // http://php.net/manual/class.domnodelist.php#83390 for ($i = $imageTags->length; --$i >= 0; ) { // http://php.net/manual/class.domnodelist.php#83390
$tag = $imageTags->item($i); $tag = $imageTags->item($i);
$imgsrctag=$tag->getAttribute('src'); if ($ahrefparents) {
$aofimg=$contentpost->importNode($tag->parentNode, true);
if (isset($aofimg)) {
$ahreofimg=$aofimg->getAttribute('href');
if ($ahreofimg=="") $ahreofimg=$tag->getAttribute('src');
$imgsrctag=$ahreofimg;
}
} else $imgsrctag=$tag->getAttribute('src');
$parsedimgsrctag=parse_url($imgsrctag); $parsedimgsrctag=parse_url($imgsrctag);
if ((!empty($parsedimgsrctag['host'])&&!empty($parsedimgsrctag['path']))&&(($parsedimgsrctag['scheme']=="http")||($parsedimgsrctag ['scheme']=="https"))&&(!($parsedimgsrctag['host']==$servername))) { if ((!empty($parsedimgsrctag['host'])&&!empty($parsedimgsrctag['path']))&&(($parsedimgsrctag['scheme']=="http")||($parsedimgsrctag ['scheme']=="https"))&&(!($parsedimgsrctag['host']==$servername))) {
$newimgsrc=DownloadFopen($imgsrctag); if ($webarchived) {
$parsedimgsrctagarch=parse_url($tag->getAttribute('src'));
if ($parsedimgsrctagarch['host']==$webarchived) {
$webarchivelink="https://web.archive.org/web/20200101id_/".$tag->getAttribute('src');
$newimgsrc=DownloadFopen($webarchivelink);
} else
$newimgsrc=DownloadFopen($imgsrctag);
} else
$newimgsrc=DownloadFopen($imgsrctag);
if ($newimgsrc) { if ($newimgsrc) {
if ($htmlprefix=="http") { if ($htmlprefix=="http") {
$srcbase="http://".$servername."/".$dirname."/"; $srcbase="http://".$servername."/".$dirname."/";
@ -120,7 +154,7 @@ if ($subdir) chdir ($subdir);
} }
if ($subdir) $srcbase=$srcbase.rawurlencode($subdir)."/"; if ($subdir) $srcbase=$srcbase.rawurlencode($subdir)."/";
$newimgsrc=$srcbase.$newimgsrc; $newimgsrc=$srcbase.$newimgsrc;
$newcontent=str_replace($imgsrctag,$newimgsrc,$newcontent); $newcontent=str_replace($tag->getAttribute('src'),$newimgsrc,$newcontent);
unset($newimgsrc); unset($newimgsrc);
$updatedurls++; $updatedurls++;
SaveStatus ($totalstatus,$rawsedit,$updatedurls,$failedtoupdate,$deletedurls,$execdir); SaveStatus ($totalstatus,$rawsedit,$updatedurls,$failedtoupdate,$deletedurls,$execdir);
@ -138,9 +172,10 @@ if ($subdir) chdir ($subdir);
$rawsedit++; $rawsedit++;
SaveStatus ($totalstatus,$rawsedit,$updatedurls,$failedtoupdate,$deletedurls,$execdir); SaveStatus ($totalstatus,$rawsedit,$updatedurls,$failedtoupdate,$deletedurls,$execdir);
} }
$totalstatus="finished"; }
SaveStatus ($totalstatus,$rawsedit,$updatedurls,$failedtoupdate,$deletedurls,$execdir); $totalstatus="finished";
echo $updatedurls," urls was downloaded and updated, ",$failedtoupdate," urls was failed to update","<br>\n"; SaveStatus ($totalstatus,$rawsedit,$updatedurls,$failedtoupdate,$deletedurls,$execdir);
if ($fixbroken or $fixundownload) echo $deletedurls, " tags was deleted<br>\n"; echo $updatedurls," urls was downloaded and updated, ",$failedtoupdate," urls was failed to update","<br>\n";
if ($fixbroken or $fixundownload) echo $deletedurls, " tags was deleted<br>\n";
?> ?>

330
index.php
View File

@ -1,7 +1,8 @@
<?php <?php
/** /**
* mySQL image replacer - https://github.com/zlaxy/mysqlimagereplacer * mySQL image replacer - https://gitlab.com/zlax/mysqlimagereplacer
* v.0.1 alpha - uder DWTWL license https://soundragon.su/license/license.html * adopted for php8.2
* v.0.2 beta - uder DWTWL license https://soundragon.su/license/license.html
* interface script * interface script
* *
* !MAKE BACKUP OF YOUR SQL-TABLE BEFORE YOU TRY THIS SCRIPT! * !MAKE BACKUP OF YOUR SQL-TABLE BEFORE YOU TRY THIS SCRIPT!
@ -12,17 +13,18 @@
* todo: rawurlencode for non-latin domains * todo: rawurlencode for non-latin domains
*/ */
session_start(); session_start();
if (!isset($_SESSION["template"])) $_SESSION["template"]="Custom";
function PageView() { function PageView() {
// First wizard-page // First wizard-page view
if ($_SESSION["step"]==0) { if ($_SESSION["step"]==0) {
echo "STEP 1: choose database:<br>\n"; echo "STEP 1: choose database:<br>\n";
$_SESSION["subdir"]="images"; $_SESSION["subdir"]="images";
echo "<form action=index.php method=post>\n"; echo "<form action=index.php method=post>\n";
echo " database host: <input type=text name=\"dbhost\" value=\"localhost\" maxlength=255><br>\n"; echo " database host: <input type=text name=\"dbhost\" value=\"localhost\" maxlength=255><br>\n";
echo " database user: <input type=text name=\"dbuser\" value=\"",$_SESSION["dbuser"],"\" maxlength=255><br>\n"; echo " database user: <input type=text name=\"dbuser\" value=\"",$_SESSION["dbuser"] ?? null,"\" maxlength=255><br>\n";
echo " database pass: <input type=password name=\"dbpass\" maxlength=255><br>\n"; echo " database pass: <input type=password name=\"dbpass\" maxlength=255><br>\n";
echo " database name: <input type=text name=\"dbname\" value=\"",$_SESSION["dbname"],"\" maxlength=255><br>\n"; echo " database name: <input type=text name=\"dbname\" value=\"",$_SESSION["dbname"] ?? null,"\" maxlength=255><br>\n";
echo " type template: <select name=\"dbtype\">\n"; echo " type template: <select name=\"dbtype\">\n";
echo " <option value=\"Custom\""; echo " <option value=\"Custom\"";
if (($_SESSION["template"]=="Custom")||(!$_SESSION["template"])) echo " selected"; if (($_SESSION["template"]=="Custom")||(!$_SESSION["template"])) echo " selected";
@ -42,7 +44,7 @@ function PageView() {
if ($_SESSION["error"]=="dbconnection") echo " Error: ", mysqli_connect_error(),"<br>\n"; if ($_SESSION["error"]=="dbconnection") echo " Error: ", mysqli_connect_error(),"<br>\n";
if ($_SESSION["error"]=="dbconnectionname") echo " Error: enter database name.<br>\n"; if ($_SESSION["error"]=="dbconnectionname") echo " Error: enter database name.<br>\n";
} }
// Second wizard-page // Second wizard-page view
if ($_SESSION["step"]==1) { if ($_SESSION["step"]==1) {
echo "STEP 2: entries and directories:<br>\n"; echo "STEP 2: entries and directories:<br>\n";
echo "<form action=index.php method=post>\n"; echo "<form action=index.php method=post>\n";
@ -50,14 +52,19 @@ function PageView() {
echo " Table name: <input type=text name=\"dbtable\" value=\"",$_SESSION["dbtable"],"\" maxlength=255><br>\n"; echo " Table name: <input type=text name=\"dbtable\" value=\"",$_SESSION["dbtable"],"\" maxlength=255><br>\n";
echo " Column name: <input type=text name=\"dbcolumn\" value=\"",$_SESSION["dbcolumn"],"\" maxlength=255><br>\n"; echo " Column name: <input type=text name=\"dbcolumn\" value=\"",$_SESSION["dbcolumn"],"\" maxlength=255><br>\n";
echo " Content directory: ~/<input type=text name=\"dirname\" value=\"",$_SESSION["dirname"],"\" maxlength=255><br>\n"; echo " Content directory: ~/<input type=text name=\"dirname\" value=\"",$_SESSION["dirname"],"\" maxlength=255><br>\n";
echo " Filter column: <input type=text name=\"IDcolumn\" value=\"",$_SESSION["IDcolumn"],"\" maxlength=255><br>\n";
echo " Filter column: <input type=text name=\"filtcolumn\" value=\"",$_SESSION["filtcolumn"],"\" maxlength=255><br>\n";
echo " Filter column value: <input type=text name=\"filtvalue\" value=\"",$_SESSION["filtvalue"],"\" maxlength=255><br>\n";
echo " <i>(F.e. to filter posts from drafts and attachments in Wordpress6+)</i><br>\n";
echo " <input type=submit name=\"prev1\" value=\"Previous\"> <input type=submit name=\"next1\" value=\"Next\">\n"; echo " <input type=submit name=\"prev1\" value=\"Previous\"> <input type=submit name=\"next1\" value=\"Next\">\n";
echo "</form>\n"; echo "</form>\n";
if ($_SESSION["error"]) echo $_SESSION["error"],"<br>\n"; if ($_SESSION["error"]) echo $_SESSION["error"],"<br>\n";
} }
// Third wizard-page // Third wizard-page view
if ($_SESSION["step"]==2) { if ($_SESSION["step"]==2) {
echo "STEP 3: check data:<br>\n"; echo "STEP 3: check data:<br>\n";
$postnumber=0; $postnumber=0;
$filteredpostnumber=0;
$totalimagenumber=0; $totalimagenumber=0;
$_SESSION["correctimagenumber"]=0; $_SESSION["correctimagenumber"]=0;
$_SESSION["alreadyimagenumber"]=0; $_SESSION["alreadyimagenumber"]=0;
@ -66,21 +73,47 @@ function PageView() {
mysqli_set_charset($dbconnection,'utf8'); mysqli_set_charset($dbconnection,'utf8');
$resulttable=mysqli_query($dbconnection,"SELECT * FROM ".$_SESSION["dbtable"]); $resulttable=mysqli_query($dbconnection,"SELECT * FROM ".$_SESSION["dbtable"]);
$resultrows=mysqli_num_rows($resulttable); $resultrows=mysqli_num_rows($resulttable);
if (!empty($_SESSION["IDcolumn"]))
$_SESSION["imgsrcsID"]=array();
$_SESSION["imgsrcs"]=array(); $_SESSION["imgsrcs"]=array();
// Checking table $_SESSION["imgsrcahrefs"]=array();
while($row=mysqli_fetch_assoc($resulttable)){ // -- Checking table
while($row=mysqli_fetch_assoc($resulttable)) {
$contentpost=new DOMDocument(); $contentpost=new DOMDocument();
$contentpost->loadHTML($row[$_SESSION["dbcolumn"]]); if (!empty($_SESSION["filtcolumn"]) && !empty($_SESSION["filtvalue"])) {
if ($row[$_SESSION["filtcolumn"]] == $_SESSION["filtvalue"]) {
if (!empty($row[$_SESSION["dbcolumn"]]))
$contentpost->loadHTML($row[$_SESSION["dbcolumn"]]);
$filteredpostnumber++;
}
} else {
if (!empty($row[$_SESSION["dbcolumn"]]))
$contentpost->loadHTML($row[$_SESSION["dbcolumn"]]);
$filteredpostnumber++;
}
$imageTags=$contentpost->getElementsByTagName('img'); $imageTags=$contentpost->getElementsByTagName('img');
$ahrefImageTags=$imageTags;
$imagenumberinpost=0; $imagenumberinpost=0;
foreach($imageTags as $tag) { foreach($imageTags as $tag) {
$imagenumberinpost++; $imagenumberinpost++;
$totalimagenumber++; $totalimagenumber++;
if (!empty($_SESSION["IDcolumn"]))
$_SESSION["imgsrcsID"][$postnumber]=$row[$_SESSION["IDcolumn"]];
$_SESSION["imgsrcs"][$postnumber][$imagenumberinpost]=$tag->getAttribute('src'); $_SESSION["imgsrcs"][$postnumber][$imagenumberinpost]=$tag->getAttribute('src');
$aofimg=$contentpost->importNode($tag->parentNode, true);
if (isset($aofimg)) {
$ahreofimg=$aofimg->getAttribute('href');
if ($ahreofimg=="") $ahreofimg=$tag->getAttribute('src');
$_SESSION["imgsrcahrefs"][$postnumber][$imagenumberinpost]=$ahreofimg;
}
else
$_SESSION["imgsrcahrefs"][$postnumber][$imagenumberinpost]=$tag->getAttribute('src');
$testurl=parse_url($_SESSION["imgsrcs"][$postnumber][$imagenumberinpost]); $testurl=parse_url($_SESSION["imgsrcs"][$postnumber][$imagenumberinpost]);
if ((!empty($testurl['host'])&&!empty($testurl['path']))&&(($testurl['scheme']=="http")||($testurl ['scheme']=="https"))&&(!($testurl['host']==$_SERVER['SERVER_NAME']))) $_SESSION["correctimagenumber"]++; if ((!empty($testurl['host'])&&!empty($testurl['path']))&&(($testurl['scheme']=="http")||($testurl ['scheme']=="https"))&&(!($testurl['host']==$_SERVER['SERVER_NAME'])))
else if ($testurl['host']==$_SERVER['SERVER_NAME']) $_SESSION["alreadyimagenumber"]++; $_SESSION["correctimagenumber"]++;
else $_SESSION["brokenimagenumber"]++; else if (isset($testurl['host']) && ($testurl['host']==$_SERVER['SERVER_NAME']))
$_SESSION["alreadyimagenumber"]++;
else $_SESSION["brokenimagenumber"]++;
} }
$postnumber++; $postnumber++;
} }
@ -89,6 +122,7 @@ function PageView() {
echo " ",getcwd(),"/<input type=text name=\"subdir\" value=\"",$_SESSION["subdir"],"\" maxlength=63> (leave blank if you don't need subdir)<br>\n"; echo " ",getcwd(),"/<input type=text name=\"subdir\" value=\"",$_SESSION["subdir"],"\" maxlength=63> (leave blank if you don't need subdir)<br>\n";
echo " type of html-prefix:<br>\n"; echo " type of html-prefix:<br>\n";
echo " <input type=\"radio\" name=\"htmlprefix\" value=\"http\""; echo " <input type=\"radio\" name=\"htmlprefix\" value=\"http\"";
if (!isset($_SESSION["htmlprefix"])) $_SESSION["htmlprefix"]="wo";
if ($_SESSION["htmlprefix"]=="http") echo " checked"; if ($_SESSION["htmlprefix"]=="http") echo " checked";
echo ">http://<br>\n"; echo ">http://<br>\n";
echo " <input type=\"radio\" name=\"htmlprefix\" value=\"https\""; echo " <input type=\"radio\" name=\"htmlprefix\" value=\"https\"";
@ -99,32 +133,42 @@ function PageView() {
echo ">without prefix and domain name<br>\n"; echo ">without prefix and domain name<br>\n";
echo " type of download:<br>\n"; echo " type of download:<br>\n";
echo " <input type=\"radio\" name=\"dwnldtype\" value=\"put\""; echo " <input type=\"radio\" name=\"dwnldtype\" value=\"put\"";
if (!($_SESSION["downloadtype"]=="curl")) echo " checked"; if (!isset($_SESSION["downloadtype"])) $_SESSION["downloadtype"]="put";
if ($_SESSION["downloadtype"]=="put") echo " checked";
echo ">file_put_contents<br>\n"; echo ">file_put_contents<br>\n";
echo " <input type=\"radio\" name=\"dwnldtype\" value=\"curl\""; echo " <input type=\"radio\" name=\"dwnldtype\" value=\"curl\"";
if ($_SESSION["downloadtype"]=="curl") echo " checked"; if ($_SESSION["downloadtype"]=="curl") echo " checked";
echo " disabled"; // usopported in alpha version echo " disabled"; // unsupported yet
echo ">curl<br>\n"; echo ">curl <i>[unsupported yet]</i><br>\n";
echo " <input type=\"radio\" name=\"dwnldtype\" value=\"wget\""; echo " <input type=\"radio\" name=\"dwnldtype\" value=\"wget\"";
if ($_SESSION["downloadtype"]=="wget") echo " checked"; if ($_SESSION["downloadtype"]=="wget") echo " checked";
echo " disabled"; // usopported in alpha version echo " disabled"; // unsupported yet
echo ">wget<br>\n"; echo ">wget <i>[unsupported yet]</i><br>\n";
echo " number of rows in table: $resultrows<br>\n"; echo " number of rows in table: $resultrows<br>\n";
echo " filtered rows: $filteredpostnumber<br>\n";
echo " number of rows with imgsrc tags: ",count($_SESSION["imgsrcs"]),"<br>\n"; echo " number of rows with imgsrc tags: ",count($_SESSION["imgsrcs"]),"<br>\n";
echo " total number of img src tags: $totalimagenumber<br>\n"; echo " total number of img src tags: $totalimagenumber<br>\n";
echo " broken image links: ",$_SESSION["brokenimagenumber"],"<br>\n"; echo " broken image links: ",$_SESSION["brokenimagenumber"],"<br>\n";
echo " already downloaded image links: ",$_SESSION["alreadyimagenumber"],"<br>\n"; echo " already downloaded image links: ",$_SESSION["alreadyimagenumber"],"<br>\n";
echo " correct external image links for download: ",$_SESSION["correctimagenumber"],"<br>\n"; echo " correct external image links for download: ",$_SESSION["correctimagenumber"],"<br>\n";
echo " <input type=checkbox name=fixbroken value=true"; echo " <input type=checkbox name=\"ahrefparents\" value=\"yes\"";
if (!isset($_SESSION["ahrefparents"])) $_SESSION["ahrefparents"]=true;
if ($_SESSION["ahrefparents"]) echo " checked";
echo ">download parent a hrefs if exists?<br>\n";
echo "Domain for webarchive download: <input type=text name=\"webarchived\" value=\"",$_SESSION["webarchived"],"\" maxlength=127> (leave blank if you don't need to download images from webarchive)<br>\n";
echo " <input type=checkbox name=\"fixbroken\" value=\"yes\"";
if (!isset($_SESSION["fixbroken"])) $_SESSION["fixbroken"]=false;
if ($_SESSION["fixbroken"]) echo " checked"; if ($_SESSION["fixbroken"]) echo " checked";
echo ">delete broken tags?<br>\n"; echo ">delete broken tags?<br>\n";
echo " <input type=checkbox name=fixundownload value=true"; echo " <input type=checkbox name=\"fixundownload\" value=\"yes\"";
if (!isset($_SESSION["fixundownload"])) $_SESSION["fixundownload"]=false;
if ($_SESSION["fixundownload"]) echo " checked"; if ($_SESSION["fixundownload"]) echo " checked";
echo ">remove undownloadble tags?<br>\n"; echo ">remove undownloadble tags?<br>\n";
echo " <input type=checkbox name=fixalready value=true"; echo " <input type=checkbox name=\"fixalready\" value=\"yes\"";
if (!isset($_SESSION["fixalready"])) $_SESSION["fixalready"]=false;
if ($_SESSION["fixalready"]) echo " checked"; if ($_SESSION["fixalready"]) echo " checked";
echo " disabled"; // usopported in alpha version echo " disabled"; // unsupported yet
echo ">fix prefix to already downloaded tags?<br>\n"; echo ">fix prefix to already downloaded tags? <i>[unsupported yet]</i><br>\n";
echo " <input type=submit name=\"prev2\" value=\"Previous\"> <input type=submit name=\"deta2\" value=\"Details\"> <input type=submit name=\"next2\" value=\"Next\">\n"; echo " <input type=submit name=\"prev2\" value=\"Previous\"> <input type=submit name=\"deta2\" value=\"Details\"> <input type=submit name=\"next2\" value=\"Next\">\n";
echo "</form>\n"; echo "</form>\n";
if ($_SESSION["error"]) echo $_SESSION["error"],"<br>\n"; if ($_SESSION["error"]) echo $_SESSION["error"],"<br>\n";
@ -132,19 +176,31 @@ function PageView() {
if ($_SESSION["details"]=="step2") { if ($_SESSION["details"]=="step2") {
echo "green links will be try to downloaded, yellow (already downloaded) and red (broken) - not:<hr>\n"; echo "green links will be try to downloaded, yellow (already downloaded) and red (broken) - not:<hr>\n";
foreach ($_SESSION["imgsrcs"] as $postnum=>$postimgs) { foreach ($_SESSION["imgsrcs"] as $postnum=>$postimgs) {
echo ($postnum+1),":<br>\n"; echo ($postnum+1);
foreach ($postimgs as $imgs) { if (!empty($_SESSION["IDcolumn"]))
echo " (ID ", $_SESSION["imgsrcsID"][$postnum],")";
echo ":<br>\n";
foreach ($postimgs as $imgnum=>$imgs) {
$testurl=parse_url($imgs); $testurl=parse_url($imgs);
if ((!empty($testurl['host'])&&!empty($testurl['path']))&&(($testurl['scheme']=="http")||($testurl ['scheme']=="https"))&&(!($testurl['host']==$_SERVER['SERVER_NAME']))) echo " <font color=green>"; if ((!empty($testurl['host'])&&!empty($testurl['path']))&&(($testurl['scheme']=="http")||($testurl ['scheme']=="https"))&&(!($testurl['host']==$_SERVER['SERVER_NAME']))) echo " <font color=green>";
else if ($testurl['host']==$_SERVER['SERVER_NAME']) echo " <font color=yellow>"; else if (isset($testurl['host']) && ($testurl['host']==$_SERVER['SERVER_NAME']))
else echo " <font color=red>"; echo " <font color=yellow>";
echo $imgs,"</font><br>\n"; else echo " <font color=red>";
echo $imgs,"</font>, (";
if ($_SESSION["imgsrcahrefs"][$postnum][$imgnum]==$_SESSION["imgsrcs"][$postnum][$imgnum])
echo "<i>";
else echo "<b>";
echo $_SESSION["imgsrcahrefs"][$postnum][$imgnum];
if ($_SESSION["imgsrcahrefs"][$postnum][$imgnum]==$_SESSION["imgsrcs"][$postnum][$imgnum])
echo "</i>";
else echo "</b>";
echo ")<br>\n";
} }
echo "<hr>\n"; echo "<hr>\n";
} }
} }
} }
// Approve page // Approve page view
if ($_SESSION["step"]==3) { if ($_SESSION["step"]==3) {
echo "STEP 4: approve processing:<br>\n"; echo "STEP 4: approve processing:<br>\n";
echo "<form action=index.php method=post>\n"; echo "<form action=index.php method=post>\n";
@ -158,77 +214,90 @@ function PageView() {
if ($_SESSION["subdir"]) echo "/",$_SESSION["subdir"]; if ($_SESSION["subdir"]) echo "/",$_SESSION["subdir"];
echo "/<br>\n"; echo "/<br>\n";
} }
if ($_SESSION["fixbroken"]) echo $_SESSION["brokenimagenumber"]," tags will be deleted<br>\n"; if ($_SESSION["ahrefparents"])
echo "parent a hrefs will be downloaded (if exists)<br>\n";
if ($_SESSION["webarchived"])
echo "this domain will be downloaded via webarchive: ", $_SESSION["webarchived"], "<br>\n";
if ($_SESSION["fixbroken"])
echo $_SESSION["brokenimagenumber"]," tags will be deleted<br>\n";
echo " are you sure to proceed?<br>\n"; echo " are you sure to proceed?<br>\n";
echo " <input type=submit name=\"prev3\" value=\"Previous\"> <input type=submit name=\"next3\" value=\"Next\">\n"; echo " <input type=submit name=\"prev3\" value=\"Previous\"> <input type=submit name=\"next3\" value=\"Next\">\n";
echo "</form>\n"; echo "</form>\n";
} }
// Start page // Start page view
if ($_SESSION["step"]==4) { if ($_SESSION["step"]==4) {
$_SESSION["error"]=""; $_SESSION["error"]="";
echo "RESULT:<br>\n"; echo "RESULT:<br>\n";
if ($_SESSION["subdir"]) { if ($_SESSION["subdir"]) {
mkdir($_SESSION["subdir"]); if (!is_dir($_SESSION["subdir"]))
if (!chdir($_SESSION["subdir"])) $_SESSION["error"]="error to apperate with new directory"; mkdir($_SESSION["subdir"]);
if (!chdir($_SESSION["subdir"]))
$_SESSION["error"]="can't to operate with new directory";
} else { } else {
if (mkdir ("testimuploaddir")) rmdir("testimuploaddir"); if (mkdir ("testimuploaddir"))
else $_SESSION["error"]="error to apperate with directory, check privilegies"; rmdir("testimuploaddir");
else $_SESSION["error"]="can't to operate with directory, check privilegies";
}
if ($_SESSION["error"])
echo $_SESSION["error"]."<br>\n";
else {
chdir(__DIR__);
$csvsessiondata[]=$_SESSION["dbhost"];
$csvsessiondata[]=$_SESSION["dbuser"];
$csvsessiondata[]=$_SESSION["dbpass"];
$csvsessiondata[]=$_SESSION["dbname"];
$csvsessiondata[]=$_SESSION["dbtable"];
$csvsessiondata[]=$_SESSION["dbcolumn"];
$csvsessiondata[]=$_SERVER['SERVER_NAME'];
$csvsessiondata[]=$_SESSION["fixbroken"];
$csvsessiondata[]=$_SESSION["dirname"];
$csvsessiondata[]=$_SESSION["subdir"];
$csvsessiondata[]=$_SESSION["downloadtype"];
$csvsessiondata[]=$_SESSION["htmlprefix"];
$csvsessiondata[]=$_SESSION["fixalready"];
$csvsessiondata[]=$_SESSION["fixundownload"];
$csvsessiondata[]=$_SESSION["correctimagenumber"];
$csvsessiondata[]=$_SESSION["filtcolumn"];
$csvsessiondata[]=$_SESSION["filtvalue"];
$csvsessiondata[]=$_SESSION["ahrefparents"];
$csvsessiondata[]=$_SESSION["webarchived"];
$fhandle=fopen("indata.csv","w");
fputcsv($fhandle,$csvsessiondata);
fclose($fhandle);
exec("php -q exec.php < /dev/null > exec.log &");
echo "Process started, it's take some time. Please press Details for check status<br>\n";
} }
if ($_SESSION["error"]) echo $_SESSION["error"]."<br>\n";
else {
chdir(__DIR__);
$csvsessiondata[]=$_SESSION["dbhost"];
$csvsessiondata[]=$_SESSION["dbuser"];
$csvsessiondata[]=$_SESSION["dbpass"];
$csvsessiondata[]=$_SESSION["dbname"];
$csvsessiondata[]=$_SESSION["dbtable"];
$csvsessiondata[]=$_SESSION["dbcolumn"];
$csvsessiondata[]=$_SERVER['SERVER_NAME'];
$csvsessiondata[]=$_SESSION["fixbroken"];
$csvsessiondata[]=$_SESSION["dirname"];
$csvsessiondata[]=$_SESSION["subdir"];
$csvsessiondata[]=$_SESSION["downloadtype"];
$csvsessiondata[]=$_SESSION["htmlprefix"];
$csvsessiondata[]=$_SESSION["fixalready"];
$csvsessiondata[]=$_SESSION["fixundownload"];
$csvsessiondata[]=$_SESSION["correctimagenumber"];
$fhandle=fopen("indata.csv","w");
fputcsv($fhandle,$csvsessiondata);
fclose($fhandle);
exec("php -q exec.php < /dev/null > exec.log &");
echo "Process started, it's take some time. Please press Details for check status<br>\n";
}
echo "<form action=index.php method=post>\n"; echo "<form action=index.php method=post>\n";
echo " <input type=submit name=\"deta4\" value=\"Details\">\n"; echo " <input type=submit name=\"deta4\" value=\"Details\">\n";
echo "</form>\n"; echo "</form>\n";
} }
// Result page // Result page view
if ($_SESSION["step"]==5) { if ($_SESSION["step"]==5) {
echo "RESULT:<br>\n"; echo "RESULT:<br>\n";
if (file_exists("outdata.csv")) if (file_exists("outdata.csv")) {
{ $fhandle=fopen("outdata.csv","r");
$fhandle=fopen("outdata.csv","r"); $outdatacsv=fgetcsv($fhandle, 1024, ",");
$outdatacsv=fgetcsv($fhandle, 1024, ","); fclose($fhandle);
fclose($fhandle); $rawsedit=$outdatacsv[0];
$rawsedit=$outdatacsv[0]; $updatedurls=$outdatacsv[1];
$updatedurls=$outdatacsv[1]; $failedtoupdate=$outdatacsv[2];
$failedtoupdate=$outdatacsv[2]; $deletedurls=$outdatacsv[3];
$deletedurls=$outdatacsv[3]; echo "raws edited: ",$rawsedit,", urldecode downloaded: ",$updatedurls,", failed to download: ",$failedtoupdate,", deleted tags: ",$deletedurls,"<br>\n";
echo "raws edited: ",$rawsedit,", urldecode downloaded: ",$updatedurls,", failed to download: ",$failedtoupdate,", deleted tags: ",$deletedurls,"<br>\n"; } else echo "no results<br>\n";
} else { if (file_exists("exec.log")) {
$logexec=file_get_contents("exec.log"); $logexec=file_get_contents("exec.log");
echo $logexec; echo $logexec;
} } else echo "no log<br>\n";
echo "<form action=index.php method=post>\n"; echo "<form action=index.php method=post>\n";
echo " <input type=submit name=\"deta5\" value=\"Details\">\n"; echo " <input type=submit name=\"deta5\" value=\"Details\">\n";
echo "</form>\n"; echo "</form>\n";
} }
} }
// First wizard-page handler
$_SESSION["step"]=0; $_SESSION["step"]=0;
$_SESSION["error"]=""; $_SESSION["error"]="";
$_SESSION["details"]=""; $_SESSION["details"]="";
if (isset($_POST["next0"])) {
if ($_POST["next0"]) {
$_SESSION["dbhost"]=$_POST["dbhost"]; $_SESSION["dbhost"]=$_POST["dbhost"];
$_SESSION["dbuser"]=$_POST["dbuser"]; $_SESSION["dbuser"]=$_POST["dbuser"];
$_SESSION["dbpass"]=$_POST["dbpass"]; $_SESSION["dbpass"]=$_POST["dbpass"];
@ -239,33 +308,46 @@ if ($_SESSION["step"]==5) {
if (!$dbconnection) { if (!$dbconnection) {
$_SESSION["step"]=0; $_SESSION["step"]=0;
$_SESSION["error"]="dbconnection"; $_SESSION["error"]="dbconnection";
} if ($_SESSION["template"]=="Wordpress") { }
if ($_SESSION["template"]=="Wordpress") {
$_SESSION["dbtable"]="wp_posts"; $_SESSION["dbtable"]="wp_posts";
$_SESSION["dbcolumn"]="post_content"; $_SESSION["dbcolumn"]="post_content";
$_SESSION["dirname"]="wp-content/uploads"; $_SESSION["dirname"]="wp-content/uploads";
} if ($_SESSION["template"]=="Joomla") { $_SESSION["IDcolumn"]="ID";
$_SESSION["filtcolumn"]="post_type";
$_SESSION["filtvalue"]="post";
}
if ($_SESSION["template"]=="Joomla") {
$_SESSION["dbtable"]="prefix_content"; $_SESSION["dbtable"]="prefix_content";
$_SESSION["dbcolumn"]="fulltext"; $_SESSION["dbcolumn"]="fulltext";
$_SESSION["dirname"]="images/stories"; $_SESSION["dirname"]="images/stories";
} if ($_SESSION["template"]=="Drupal") { }
if ($_SESSION["template"]=="Drupal") {
$_SESSION["dbtable"]="field_data_body"; $_SESSION["dbtable"]="field_data_body";
$_SESSION["dbcolumn"]="body_value"; $_SESSION["dbcolumn"]="body_value";
$_SESSION["dirname"]="sites/default/files"; $_SESSION["dirname"]="sites/default/files";
} if (!$_POST["dbname"]) { }
if (!$_POST["dbname"]) {
$_SESSION["step"]=0; $_SESSION["step"]=0;
$_SESSION["error"]="dbconnectionname"; $_SESSION["error"]="dbconnectionname";
} }
} }
// Second wizard-page handler
if ($_POST["prev1"]) { if (isset($_POST["prev1"])) {
$_SESSION["dbtable"]=$_POST["dbtable"]; $_SESSION["dbtable"]=$_POST["dbtable"];
$_SESSION["dbcolumn"]=$_POST["dbcolumn"]; $_SESSION["dbcolumn"]=$_POST["dbcolumn"];
$_SESSION["dirname"]=$_POST["dirname"]; $_SESSION["dirname"]=$_POST["dirname"];
$_SESSION["IDcolumn"]=$_POST["IDcolumn"];
$_SESSION["filtcolumn"]=$_POST["filtcolumn"];
$_SESSION["filtvalue"]=$_POST["filtvalue"];
$_SESSION["step"]=0; $_SESSION["step"]=0;
} if ($_POST["next1"]) { } if (isset($_POST["next1"])) {
$_SESSION["dbtable"]=$_POST["dbtable"]; $_SESSION["dbtable"]=$_POST["dbtable"];
$_SESSION["dbcolumn"]=$_POST["dbcolumn"]; $_SESSION["dbcolumn"]=$_POST["dbcolumn"];
$_SESSION["dirname"]=$_POST["dirname"]; $_SESSION["dirname"]=$_POST["dirname"];
$_SESSION["IDcolumn"]=$_POST["IDcolumn"];
$_SESSION["filtcolumn"]=$_POST["filtcolumn"];
$_SESSION["filtvalue"]=$_POST["filtvalue"];
$dbconnection=mysqli_connect($_SESSION["dbhost"],$_SESSION["dbuser"],$_SESSION["dbpass"],$_SESSION["dbname"]); $dbconnection=mysqli_connect($_SESSION["dbhost"],$_SESSION["dbuser"],$_SESSION["dbpass"],$_SESSION["dbname"]);
$columns=mysqli_query($dbconnection, "SHOW COLUMNS FROM ".$_SESSION["dbtable"]); $columns=mysqli_query($dbconnection, "SHOW COLUMNS FROM ".$_SESSION["dbtable"]);
if (!$columns) { if (!$columns) {
@ -274,54 +356,86 @@ if ($_SESSION["step"]==5) {
} }
if (mysqli_num_rows($columns)>0) { if (mysqli_num_rows($columns)>0) {
$_SESSION["error"]="Column not found"; $_SESSION["error"]="Column not found";
while ($row = mysqli_fetch_assoc($columns)) if ($row[Field]==$_SESSION["dbcolumn"]) $_SESSION["error"]=""; while ($row = mysqli_fetch_assoc($columns)) if ($row['Field']==$_SESSION["dbcolumn"]) $_SESSION["error"]="";
} else $_SESSION["error"]="Table is empty or not exists"; } else $_SESSION["error"]="Table is empty or not exists";
$uploadsdir=chdir("../".$_SESSION["dirname"]); $uploadsdir=chdir("../".$_SESSION["dirname"]);
if ($uploadsdir) { if (!is_writeable(getcwd())) $_SESSION["error"]="Cant write to directory, check previlegies"; } if ($uploadsdir) {
else $_SESSION["error"]="Cant open directory"; if (!is_writeable(getcwd())) $_SESSION["error"]="Cant write to directory, check previlegies";
if (!$_SESSION["error"]) $_SESSION["step"]=2; } else $_SESSION["error"]="Cant open directory";
else $_SESSION["step"]=1; if (!$_SESSION["error"])
$_SESSION["step"]=2;
else $_SESSION["step"]=1;
} }
// Third wizard-page handler
if ($_POST["prev2"]) { if (isset($_POST["prev2"])) {
$_SESSION["step"]=1; $_SESSION["step"]=1;
$_SESSION["subdir"]=$_POST["subdir"]; $_SESSION["subdir"]=$_POST["subdir"];
} if ($_POST["deta2"]) { }
if (isset($_POST["deta2"])) {
$_SESSION["details"]="step2"; $_SESSION["details"]="step2";
$_SESSION["step"]=2; $_SESSION["step"]=2;
$_SESSION["subdir"]=$_POST["subdir"]; $_SESSION["subdir"]=$_POST["subdir"];
$_SESSION["htmlprefix"]=$_POST["htmlprefix"]; $_SESSION["htmlprefix"]=$_POST["htmlprefix"];
$_SESSION["downloadtype"]=$_POST["dwnldtype"]; $_SESSION["downloadtype"]=$_POST["dwnldtype"];
$_SESSION["fixbroken"]=$_POST["fixbroken"]; if (isset($_POST['ahrefparents']) && ($_POST['ahrefparents'] == 'yes'))
$_SESSION["fixundownload"]=$_POST["fixundownload"]; $_SESSION["ahrefparents"]=true;
$_SESSION["fixalready"]=$_POST["fixalready"]; else $_SESSION["ahrefparents"]=false;
if (isset($_POST['webarchived']))
$_SESSION["webarchived"]=$_POST["webarchived"];
else $_SESSION["webarchived"]=false;
if (isset($_POST['fixbroken']) && ($_POST['fixbroken'] == 'yes'))
$_SESSION["fixbroken"]=true;
else $_SESSION["fixbroken"]=false;
if (isset($_POST['fixundownload']) && ($_POST['fixundownload'] == 'yes'))
$_SESSION["fixundownload"]=true;
else $_SESSION["fixundownload"]=false;
if (isset($_POST['fixalready']) && ($_POST['fixalready'] == 'yes'))
$_SESSION["fixalready"]=true;
else $_SESSION["fixalready"]=false;
$uploadsdir=chdir("../".$_SESSION["dirname"]); $uploadsdir=chdir("../".$_SESSION["dirname"]);
} if ($_POST["next2"]) { }
if (isset($_POST["next2"])) {
$_SESSION["step"]=3; $_SESSION["step"]=3;
$_SESSION["subdir"]=$_POST["subdir"]; $_SESSION["subdir"]=$_POST["subdir"];
$_SESSION["htmlprefix"]=$_POST["htmlprefix"]; $_SESSION["htmlprefix"]=$_POST["htmlprefix"];
$_SESSION["downloadtype"]=$_POST["dwnldtype"]; $_SESSION["downloadtype"]=$_POST["dwnldtype"];
$_SESSION["fixbroken"]=$_POST["fixbroken"]; if (isset($_POST['ahrefparents']) && ($_POST['ahrefparents'] == 'yes'))
$_SESSION["fixundownload"]=$_POST["fixundownload"]; $_SESSION["ahrefparents"]=true;
$_SESSION["fixalready"]=$_POST["fixalready"]; else $_SESSION["ahrefparents"]=false;
if (isset($_POST['webarchived']))
$_SESSION["webarchived"]=$_POST["webarchived"];
else $_SESSION["webarchived"]=false;
if (isset($_POST['fixbroken']) && ($_POST['fixbroken'] == 'yes'))
$_SESSION["fixbroken"]=true;
else $_SESSION["fixbroken"]=false;
if (isset($_POST['fixundownload']) && ($_POST['fixundownload'] == 'yes'))
$_SESSION["fixundownload"]=true;
else $_SESSION["fixundownload"]=false;
if (isset($_POST['fixalready']) && ($_POST['fixalready'] == 'yes'))
$_SESSION["fixalready"]=true;
else $_SESSION["fixalready"]=false;
$uploadsdir=chdir("../".$_SESSION["dirname"]); $uploadsdir=chdir("../".$_SESSION["dirname"]);
if ($_POST["fixbroken"]) { if (($_SESSION["correctimagenumber"]<1)&($_SESSION["brokenimagenumber"]<1)) $_SESSION["step"]=2; } if (isset($_POST['fixbroken']) && ($_POST['fixbroken'] == 'yes')) {
else if ($_SESSION["correctimagenumber"]<1) $_SESSION["step"]=2; if (($_SESSION["correctimagenumber"]<1)&($_SESSION["brokenimagenumber"]<1))
$_SESSION["step"]=2;
} else if ($_SESSION["correctimagenumber"]<1)
$_SESSION["step"]=2;
} }
// Approve page handler
if ($_POST["prev3"]) { if (isset($_POST["prev3"])) {
$_SESSION["step"]=2; $_SESSION["step"]=2;
$uploadsdir=chdir("../".$_SESSION["dirname"]); $uploadsdir=chdir("../".$_SESSION["dirname"]);
} if ($_POST["next3"]) { }
if (isset($_POST["next3"])) {
$_SESSION["step"]=4; $_SESSION["step"]=4;
$uploadsdir=chdir("../".$_SESSION["dirname"]); $uploadsdir=chdir("../".$_SESSION["dirname"]);
} }
// Start page handler
if ($_POST["deta4"]) { if (isset($_POST["deta4"])) {
$_SESSION["step"]=5; $_SESSION["step"]=5;
} }
// Result page handler
if ($_POST["deta5"]) { if (isset($_POST["deta5"])) {
$_SESSION["step"]=5; $_SESSION["step"]=5;
} }