Super-optimized it; made it a bit more verbose and clearer
This commit is contained in:
parent
c3d5050b42
commit
83868504d7
1 changed files with 126 additions and 81 deletions
|
@ -16,7 +16,7 @@
|
||||||
along with this program. If not, see <http://www.gnu.org/licenses/>.
|
along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||||
*/
|
*/
|
||||||
|
|
||||||
define('N',"\n");
|
const N="\n";
|
||||||
define('SNAME',basename(__FILE__));
|
define('SNAME',basename(__FILE__));
|
||||||
define('BNAME',preg_replace('/\.[^.]*$/','',SNAME));
|
define('BNAME',preg_replace('/\.[^.]*$/','',SNAME));
|
||||||
|
|
||||||
|
@ -32,11 +32,11 @@ $opts=[
|
||||||
'inifp'=>__DIR__.'/../conf/mustard.ini',
|
'inifp'=>__DIR__.'/../conf/mustard.ini',
|
||||||
'startinst'=>'mastodon.social',
|
'startinst'=>'mastodon.social',
|
||||||
'gracetime'=>$gracetime,
|
'gracetime'=>$gracetime,
|
||||||
'peersfp'=>__DIR__.'/peers',
|
'peersfp'=>__DIR__.'/peers.responding',
|
||||||
'cpeersfp'=>__DIR__.'/peers.checked',
|
'ckpeersfp'=>__DIR__.'/peers.checked',
|
||||||
'excludefp'=>null,
|
'excludefp'=>null,
|
||||||
'timeout'=>8,
|
'conntimeout'=>5,
|
||||||
'curltimeout'=>15,
|
'functimeout'=>10,
|
||||||
'loop'=>false,
|
'loop'=>false,
|
||||||
'excludedead'=>true,
|
'excludedead'=>true,
|
||||||
'ignorelock'=>false,
|
'ignorelock'=>false,
|
||||||
|
@ -45,8 +45,6 @@ $opts=[
|
||||||
|
|
||||||
$msglevs=['Debug', 'Info', 'Warning', 'Error', 'None'];
|
$msglevs=['Debug', 'Info', 'Warning', 'Error', 'None'];
|
||||||
|
|
||||||
$ghtsa=[[' day',' days'],[' hour',' hours'],[' minute',' minutes'],[' second',' seconds']];
|
|
||||||
|
|
||||||
$help='SYNOPSIS
|
$help='SYNOPSIS
|
||||||
|
|
||||||
'.SNAME.' [options]
|
'.SNAME.' [options]
|
||||||
|
@ -70,7 +68,7 @@ OPTIONS
|
||||||
If an instance has not been responding for longer than this time, avoid
|
If an instance has not been responding for longer than this time, avoid
|
||||||
checking it. See section «TIME SPECIFICATION» below to see how to specify
|
checking it. See section «TIME SPECIFICATION» below to see how to specify
|
||||||
time.
|
time.
|
||||||
DEFAULT: '.ght($opts['gracetime'],$ghtsa).'
|
DEFAULT: '.ght($opts['gracetime'],null,0).'
|
||||||
-G, --graceline
|
-G, --graceline
|
||||||
Return the “graceline” (now - gracetime: see option above) in unix time and
|
Return the “graceline” (now - gracetime: see option above) in unix time and
|
||||||
local time, then exit.
|
local time, then exit.
|
||||||
|
@ -78,22 +76,22 @@ OPTIONS
|
||||||
Defines the file into which the ordered list of responding instances
|
Defines the file into which the ordered list of responding instances
|
||||||
will be saved.
|
will be saved.
|
||||||
DEFAULT: «'.$opts['peersfp'].'»
|
DEFAULT: «'.$opts['peersfp'].'»
|
||||||
-c, --cpeersfp <file>
|
-c, --ckpeersfp <file>
|
||||||
Defines the file into which the ordered list of all checked instances will
|
Defines the file into which the ordered list of all checked instances will
|
||||||
be saved.
|
be saved.
|
||||||
DEFAULT: «'.$opts['cpeersfp'].'»
|
DEFAULT: «'.$opts['ckpeersfp'].'»
|
||||||
-I, --ignorelock
|
-I, --ignorelock
|
||||||
Normally, if its lockfile exists, the program exits with an error before
|
Normally, if its lockfile exists, the program exits with an error before
|
||||||
doing anything. With this option the lockfile is ignored. Please verify
|
doing anything. With this option the lockfile is ignored. Please verify
|
||||||
that the program is not already running before using it.
|
that the program is not already running before using it.
|
||||||
-t, --timeout <time>
|
-t, --conntimeout <time>
|
||||||
Defines the timeout in seconds for every connection attempt. See section
|
Defines the timeout in seconds for every connection attempt. See section
|
||||||
«TIME SPECIFICATION» below to see how to specify time.
|
«TIME SPECIFICATION» below to see how to specify time.
|
||||||
DEFAULT: '.ght($opts['timeout'],$ghtsa).'
|
DEFAULT: '.ght($opts['conntimeout'],null,0).'
|
||||||
-T, --curltimeout <time>
|
-T, --functimeout <time>
|
||||||
Defines the timeout in seconds for every download. See section «TIME
|
Defines the timeout in seconds for every download. See section «TIME
|
||||||
SPECIFICATION» below to see how to specify time.
|
SPECIFICATION» below to see how to specify time.
|
||||||
DEFAULT: '.ght($opts['curltimeout'],$ghtsa).'
|
DEFAULT: '.ght($opts['functimeout'],null,0).'
|
||||||
-m, --minmsgimplev <«debug»|«info»|«warning»|«error»|«none»>
|
-m, --minmsgimplev <«debug»|«info»|«warning»|«error»|«none»>
|
||||||
Defines the minimum “importance level” of messages to be written to the text
|
Defines the minimum “importance level” of messages to be written to the text
|
||||||
user interface. There are 4 “importance levels”, in this order of
|
user interface. There are 4 “importance levels”, in this order of
|
||||||
|
@ -132,11 +130,11 @@ for ($i=1; $i<$argc; $i++) {
|
||||||
mexit(3,'option «'.$argv[$i].'» has to be followed by a file’s path (use «-h» for more info).'.N,1,false);
|
mexit(3,'option «'.$argv[$i].'» has to be followed by a file’s path (use «-h» for more info).'.N,1,false);
|
||||||
$i++;
|
$i++;
|
||||||
$opts['peersfp']=$argv[$i];
|
$opts['peersfp']=$argv[$i];
|
||||||
} elseif ($argv[$i]=='-c' || $argv[$i]=='--cpeersfp') {
|
} elseif ($argv[$i]=='-c' || $argv[$i]=='--ckpeersfp') {
|
||||||
if ($i+1>=$argc)
|
if ($i+1>=$argc)
|
||||||
mexit(3,'option «'.$argv[$i].'» has to be followed by a file’s path (use «-h» for more info).'.N,1,false);
|
mexit(3,'option «'.$argv[$i].'» has to be followed by a file’s path (use «-h» for more info).'.N,1,false);
|
||||||
$i++;
|
$i++;
|
||||||
$opts['cpeersfp']=$argv[$i];
|
$opts['ckpeersfp']=$argv[$i];
|
||||||
} elseif ($argv[$i]=='-I' || $argv[$i]=='--ignorelock') {
|
} elseif ($argv[$i]=='-I' || $argv[$i]=='--ignorelock') {
|
||||||
$opts['ignorelock']=true;
|
$opts['ignorelock']=true;
|
||||||
} elseif ($argv[$i]=='-e' || $argv[$i]=='--excludefp') {
|
} elseif ($argv[$i]=='-e' || $argv[$i]=='--excludefp') {
|
||||||
|
@ -144,16 +142,16 @@ for ($i=1; $i<$argc; $i++) {
|
||||||
mexit(3,'option «'.$argv[$i].'» has to be followed by a file’s path (use «-h» for more info).'.N,1,false);
|
mexit(3,'option «'.$argv[$i].'» has to be followed by a file’s path (use «-h» for more info).'.N,1,false);
|
||||||
$i++;
|
$i++;
|
||||||
$opts['excludefp']=$argv[$i];
|
$opts['excludefp']=$argv[$i];
|
||||||
} elseif ($argv[$i]=='-t' || $argv[$i]=='--timeout') {
|
} elseif ($argv[$i]=='-t' || $argv[$i]=='--conntimeout') {
|
||||||
if ($i+1>=$argc || ($time=parsetime($argv[$i+1]))===false)
|
if ($i+1>=$argc || ($time=parsetime($argv[$i+1]))===false)
|
||||||
mexit(3,'option «'.$argv[$i].'» requires a valid time specification as an argument (use «-h» to read help).'.N,1,false);
|
mexit(3,'option «'.$argv[$i].'» requires a valid time specification as an argument (use «-h» to read help).'.N,1,false);
|
||||||
$i++;
|
$i++;
|
||||||
$opts['timeout']=$time;
|
$opts['conntimeout']=$time;
|
||||||
} elseif ($argv[$i]=='-T' || $argv[$i]=='--curltimeout') {
|
} elseif ($argv[$i]=='-T' || $argv[$i]=='--functimeout') {
|
||||||
if ($i+1>=$argc || ($time=parsetime($argv[$i+1]))===false)
|
if ($i+1>=$argc || ($time=parsetime($argv[$i+1]))===false)
|
||||||
mexit(3,'option «'.$argv[$i].'» requires a valid time specification as an argument (use «-h» to read help).'.N,1,false);
|
mexit(3,'option «'.$argv[$i].'» requires a valid time specification as an argument (use «-h» to read help).'.N,1,false);
|
||||||
$i++;
|
$i++;
|
||||||
$opts['curltimeout']=$time;
|
$opts['functimeout']=$time;
|
||||||
} elseif ($argv[$i]=='-i' || $argv[$i]=='--includedead') {
|
} elseif ($argv[$i]=='-i' || $argv[$i]=='--includedead') {
|
||||||
$opts['excludedead']=false;
|
$opts['excludedead']=false;
|
||||||
} elseif ($argv[$i]=='-m' || $argv[$i]=='--minmsgimplev') {
|
} elseif ($argv[$i]=='-m' || $argv[$i]=='--minmsgimplev') {
|
||||||
|
@ -183,6 +181,8 @@ pcntl_signal(SIGTERM,'sighandler');// Termination ('kill' was called)
|
||||||
pcntl_signal(SIGHUP,'sighandler');// Terminal log-out
|
pcntl_signal(SIGHUP,'sighandler');// Terminal log-out
|
||||||
pcntl_signal(SIGINT,'sighandler');// Interrupted (Ctrl-C is pressed)
|
pcntl_signal(SIGINT,'sighandler');// Interrupted (Ctrl-C is pressed)
|
||||||
|
|
||||||
|
lecho(1,'###### Starting '.BNAME.' ######'.N);
|
||||||
|
|
||||||
$iniarr=@parse_ini_file($opts['inifp']);
|
$iniarr=@parse_ini_file($opts['inifp']);
|
||||||
if ($iniarr===false) mexit(3,'couldn’t open «'.$opts['inifp'].'».'.N,1,true);
|
if ($iniarr===false) mexit(3,'couldn’t open «'.$opts['inifp'].'».'.N,1,true);
|
||||||
try { $link=@mysqli_connect($iniarr['db_host'],$iniarr['db_admin_name'],$iniarr['db_admin_password'],$iniarr['db_name'],$iniarr['db_port'],$iniarr['db_socket']); }
|
try { $link=@mysqli_connect($iniarr['db_host'],$iniarr['db_admin_name'],$iniarr['db_admin_password'],$iniarr['db_name'],$iniarr['db_port'],$iniarr['db_socket']); }
|
||||||
|
@ -197,13 +197,14 @@ if ($res===false) mexit(3,'couldn’t set «utf8mb4» charset for MySQL: '.mysql
|
||||||
$deadinsts=[];
|
$deadinsts=[];
|
||||||
if ($opts['excludedead']) {
|
if ($opts['excludedead']) {
|
||||||
$graceline=time()-$opts['gracetime'];
|
$graceline=time()-$opts['gracetime'];
|
||||||
|
lecho(1,'loading dead instances from “Instances” and “Peers” table (gracetime: '.ght($opts['gracetime'],null,0).'; graceline: '.date('Y-m-d H:i:s',$graceline).').'.N);
|
||||||
$res=myq($link,'SELECT URI FROM Instances WHERE LastOkCheckTS<'.$graceline.' OR (LastOkCheckTS IS NULL AND InsertTS<'.$graceline.')');
|
$res=myq($link,'SELECT URI FROM Instances WHERE LastOkCheckTS<'.$graceline.' OR (LastOkCheckTS IS NULL AND InsertTS<'.$graceline.')');
|
||||||
lecho(0,'got '.mysqli_num_rows($res).' dead instances from Instances table.'.N);
|
lecho(1,'got '.mysqli_num_rows($res).' dead instances from “Instances” table.'.N);
|
||||||
while ($row=mysqli_fetch_assoc($res))
|
while ($row=mysqli_fetch_assoc($res))
|
||||||
if (!in_array($row['URI'],$deadinsts))
|
if (!in_array($row['URI'],$deadinsts))
|
||||||
$deadinsts[]=$row['URI'];
|
$deadinsts[]=$row['URI'];
|
||||||
$res=myq($link,'SELECT Hostname FROM Peers WHERE LastOkCheckTS<'.$graceline.' OR (LastOkCheckTS IS NULL AND FirstCheckTS<'.$graceline.')');
|
$res=myq($link,'SELECT Hostname FROM Peers WHERE LastOkCheckTS<'.$graceline.' OR (LastOkCheckTS IS NULL AND FirstCheckTS<'.$graceline.')');
|
||||||
lecho(0,'got '.mysqli_num_rows($res).' dead instances from Peers table.'.N);
|
lecho(1,'got '.mysqli_num_rows($res).' dead instances from “Peers” table.'.N);
|
||||||
while ($row=mysqli_fetch_assoc($res))
|
while ($row=mysqli_fetch_assoc($res))
|
||||||
if (!in_array($row['Hostname'],$deadinsts))
|
if (!in_array($row['Hostname'],$deadinsts))
|
||||||
$deadinsts[]=$row['Hostname'];
|
$deadinsts[]=$row['Hostname'];
|
||||||
|
@ -213,21 +214,20 @@ if ($opts['excludedead']) {
|
||||||
//mexit(0,'bau!'.N,0,true);
|
//mexit(0,'bau!'.N,0,true);
|
||||||
|
|
||||||
$insts=[];
|
$insts=[];
|
||||||
$cinsts=[];
|
$ckinsts=[];
|
||||||
$exarr=[];
|
$exarr=[];
|
||||||
$notifs=[];
|
|
||||||
|
|
||||||
$maxround=1;
|
$maxround=1;
|
||||||
$newc=0;
|
$totnewc=0;
|
||||||
$tini=time();
|
$tini=time();
|
||||||
$list=[$opts['startinst']];
|
$list=[$opts['startinst']];
|
||||||
// go
|
// go
|
||||||
crawl($list,1);
|
crawl($list,1);
|
||||||
lecho(1,'done crawling! :-)'.N);
|
lecho(1,'done crawling! :-)'.N);
|
||||||
$now=time();
|
$now=time();
|
||||||
lecho(1,'crawl started on '.date('Y-m-d H:i:s',$tini).' and ended on '.date('Y-m-d H:i:s',$now).'; took '.ght($now-$tini).' in '.$maxround.' rounds; '.count($insts).' instance(s) responded; '.$newc.' new instances where found; max. memory usage: '.ghs(memory_get_peak_usage(true)).'.'.N);
|
lecho(1,'crawl started on '.date('Y-m-d H:i:s',$tini).' and ended on '.date('Y-m-d H:i:s',$now).'; took '.ght($now-$tini,null,0).' in '.$maxround.' rounds; '.count($insts).' instances responded; '.count($ckinsts).' instances were considered; '.$totnewc.' new instances were found; max. memory usage: '.ghs(memory_get_peak_usage(true)).'.'.N);
|
||||||
sortcheckandsave($insts,'list of responding instances',$opts['peersfp']);
|
sortcheckandsave($insts,'list of responding instances',$opts['peersfp']);
|
||||||
sortcheckandsave($cinsts,'list of checked instances',$opts['cpeersfp']);
|
sortcheckandsave($ckinsts,'list of checked instances',$opts['ckpeersfp']);
|
||||||
mysqli_close($link);
|
mysqli_close($link);
|
||||||
unlink($lockfp);
|
unlink($lockfp);
|
||||||
lecho(1,'done :-)'.N);
|
lecho(1,'done :-)'.N);
|
||||||
|
@ -237,51 +237,80 @@ exit(0);
|
||||||
// functions
|
// functions
|
||||||
|
|
||||||
function crawl(&$list,$id) {
|
function crawl(&$list,$id) {
|
||||||
global $insts, $deadinsts, $cinsts, $tini, $opts, $maxround, $newc, $link;
|
global $insts, $ckinsts, $deadinsts, $tini, $opts, $maxround, $totnewc, $link;
|
||||||
|
$newc=0;
|
||||||
lecho(1,'###### START OF ROUND '.$id.' ######'.N);
|
lecho(1,'###### START OF ROUND '.$id.' ######'.N);
|
||||||
|
$clist=count($list);
|
||||||
|
lecho(1,'will check '.$clist.' instance(s).'.N);
|
||||||
$nlist=[];
|
$nlist=[];
|
||||||
$c=count($list);
|
$i=0;
|
||||||
|
$buf=[];
|
||||||
|
foreach ($list as $inst) {
|
||||||
|
$i++;
|
||||||
|
$whynot=[];
|
||||||
|
if (in_array($inst,$ckinsts)) {
|
||||||
|
$whynot[]='it has already been checked';
|
||||||
|
$inckinsts=true;
|
||||||
|
} else {
|
||||||
|
$inckinsts=false;
|
||||||
|
}
|
||||||
|
if (!validhostname($inst)) $whynot[]='its hostname is not valid';
|
||||||
|
if (ckexarr($inst)) $whynot[]='its hostname matches an exclusion regexp';
|
||||||
|
if ($opts['excludedead'] && in_array($inst,$deadinsts)) $whynot[]='it’s dead';
|
||||||
|
if (count($whynot)>0) {
|
||||||
|
lecho(0,'excluding instance «'.$inst.'» ('.$i.'/'.$clist.'): '.implode(', ',$whynot).'.'.N);
|
||||||
|
} else {
|
||||||
|
lecho(0,'including instance «'.$inst.'» ('.$i.'/'.$clist.').'.N);
|
||||||
|
$buf[]=$inst;
|
||||||
|
if (!$inckinsts) $ckinsts[]=$inst;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
$cbuf=count($buf);
|
||||||
|
$list=$buf;
|
||||||
|
unset($buf);
|
||||||
|
if ($clist-$cbuf>0)
|
||||||
|
lecho(1,'excluded '.($clist-$cbuf).' instances; '.$cbuf.' instances remaining.'.N);
|
||||||
|
$clist=$cbuf;
|
||||||
$i=0;
|
$i=0;
|
||||||
$rtini=time();
|
$rtini=time();
|
||||||
foreach ($list as $inst) {
|
foreach ($list as $inst) {
|
||||||
|
$responded=false;
|
||||||
$i++;
|
$i++;
|
||||||
$now=time();
|
lecho(1,'round '.$id.': working on instance «'.$inst.'» ('.$i.'/'.$clist.').'.N);
|
||||||
$rtela=$now-$rtini;
|
|
||||||
lecho(1,'working on «'.$inst.'»: round '.$id.', '.$i.'/'.$c.'; TET: '.ght($now-$tini,null,0).'; ETR of this round: '.ght($rtela/$i*$c-$rtela,null,0).'; using '.ghs(memory_get_usage(true)).' mem. (peak: '.ghs(memory_get_peak_usage(true)).'); '.count($insts).' instances responded; '.count($nlist).' instances in next round list; '.$newc.' new instance(s) found.'.N);
|
|
||||||
waituntilonline();
|
|
||||||
updexarr();
|
updexarr();
|
||||||
lecho(1,'trying to load «'.$inst.'»’s peers...'.N);
|
waituntilonline();
|
||||||
$peers=gurl('https://'.$inst.'/api/v1/instance/peers',$opts['timeout'],$opts['curltimeout']);
|
lecho(1,'trying to load instance «'.$inst.'»’s peers...'.N);
|
||||||
$cinsts[]=$inst;// don't need to check if in_array
|
$peers=gurl('https://'.$inst.'/api/v1/instance/peers',$opts['conntimeout'],$opts['functimeout']);
|
||||||
if ($peers['cont']===false) {
|
if ($peers['cont']===false) {
|
||||||
lecho(2,'could not load «'.$inst.'»’s peers: '.$peers['emsg'].'.'.N);
|
lecho(2,'could not load instance «'.$inst.'»’s peers: '.$peers['emsg'].'.'.N);
|
||||||
} else {
|
} else {
|
||||||
$peers=@json_decode($peers['cont'],true);
|
$peers=@json_decode($peers['cont'],true);
|
||||||
if (!is_array($peers)) {
|
if (!is_array($peers)) {
|
||||||
lecho(2,'loading «'.$inst.'»’s peers, got bad JSON.'.N);
|
lecho(2,'expecting instance «'.$inst.'»’s peers, got bad JSON instead.'.N);
|
||||||
} else {
|
} else {
|
||||||
$cp=count($peers);
|
$responded=true;
|
||||||
lecho(1,'successfully loaded «'.$inst.'»’s peers ('.$cp.') :-)'.N);
|
$cpeers=count($peers);
|
||||||
|
lecho(1,'successfully loaded instance «'.$inst.'»’s peers ('.$cpeers.') :-)'.N);
|
||||||
$pi=1;
|
$pi=1;
|
||||||
foreach ($peers as $key=>$peer) {
|
foreach ($peers as $key=>$peer) {
|
||||||
if ($key!=$pi-1) {
|
if ($key!=$pi-1) {
|
||||||
lecho(2,'«'.$inst.'»’s peers: entity '.$pi.'/'.$cp.'’s key is not sequential; not checking further.'.N);
|
lecho(2,'instance «'.$inst.'»’s peers: entity '.$pi.'/'.$cpeers.'’s key is not sequential: not checking further.'.N);
|
||||||
break;
|
break;
|
||||||
} elseif (!is_string($peer)) {
|
} elseif (!is_string($peer)) {
|
||||||
lecho(2,'«'.$inst.'»’s peers: entity '.$pi.'/'.$cp.' is not a string; not checking further.'.N);
|
lecho(2,'instance «'.$inst.'»’s peers: entity '.$pi.'/'.$cpeers.' is not a string: not checking further.'.N);
|
||||||
break;
|
break;
|
||||||
} else {
|
} else {
|
||||||
$whynot=[];
|
$whynot=[];
|
||||||
if (in_array($peer,$cinsts)) $whynot[]='it has already been checked';
|
if (in_array($peer,$ckinsts)) $whynot[]='it has already been checked or excluded';
|
||||||
if (!validhostname($peer)) $whynot[]='its name is not a valid hostname';
|
if (!validhostname($peer)) $whynot[]='its hostname is not valid';
|
||||||
if (ckexarr($peer)) $whynot[]='its name matches an exclusion regexp';
|
if (ckexarr($peer)) $whynot[]='its hostname matches an exclusion regexp';
|
||||||
if (in_array($peer,$list)) $whynot[]='it is already present in current list';
|
if (in_array($peer,$list)) $whynot[]='it is already present in current list';
|
||||||
if (in_array($peer,$nlist)) $whynot[]='it has already been added to next round list';
|
if (in_array($peer,$nlist)) $whynot[]='it is already present in next round list';// this should never happen, but.
|
||||||
if ($opts['excludedead'] && in_array($peer,$deadinsts)) $whynot[]='it’s dead';
|
if ($opts['excludedead'] && in_array($peer,$deadinsts)) $whynot[]='it’s dead';
|
||||||
if (count($whynot)>0) {
|
if (count($whynot)>0) {
|
||||||
lecho(0,'«'.$inst.'»: not adding peer «'.$peer.'» ('.$pi.'/'.$cp.') to next round list because '.implode(', ',$whynot).'.'.N);
|
lecho(0,'instance «'.$inst.'»: not adding peer «'.$peer.'» ('.$pi.'/'.$cpeers.') to next round list: '.implode(', ',$whynot).'.'.N);
|
||||||
} else {
|
} else {
|
||||||
lecho(1,'«'.$inst.'»: adding peer «'.$peer.'» ('.$pi.'/'.$cp.') to next round list :-)'.N);
|
lecho(1,'instance «'.$inst.'»: adding peer «'.$peer.'» ('.$pi.'/'.$cpeers.') to next round list :-)'.N);
|
||||||
$nlist[]=$peer;
|
$nlist[]=$peer;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -289,58 +318,74 @@ function crawl(&$list,$id) {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
if (!ckexarr($inst)) {
|
if (!$responded) {
|
||||||
$responded=false;
|
lecho(1,'instance «'.$inst.'» didn’t respond at its “peers” endpoint; trying to load its info from “instance” endpoint...'.N);
|
||||||
lecho(1,'trying to load «'.$inst.'»’s instance info...'.N);
|
$instinfo=gurl('https://'.$inst.'/api/v1/instance',$opts['conntimeout'],$opts['functimeout']);
|
||||||
$instinfo=gurl('https://'.$inst.'/api/v1/instance',$opts['timeout'],$opts['curltimeout']);
|
|
||||||
if ($instinfo['cont']===false) {
|
if ($instinfo['cont']===false) {
|
||||||
lecho(2,'could not load «'.$inst.'»’s instance info: '.$instinfo['emsg'].'.'.N);
|
lecho(2,'could not load instance «'.$inst.'»’s info: '.$instinfo['emsg'].'.'.N);
|
||||||
} else {
|
} else {
|
||||||
$instinfo=@json_decode($instinfo['cont'],true);
|
$instinfo=@json_decode($instinfo['cont'],true);
|
||||||
if (is_array($instinfo))
|
if (is_array($instinfo))
|
||||||
$responded=true;
|
$responded=true;
|
||||||
else
|
else
|
||||||
lecho(2,'loading «'.$inst.'»’s instance info, got bad JSON.'.N);
|
lecho(2,'expecting instance «'.$inst.'»’s info, got bad JSON instead.'.N);
|
||||||
}
|
}
|
||||||
if ($responded && !in_array($inst,$insts)) {
|
}
|
||||||
lecho(1,'instance «'.$inst.'» responded :-)'.N);
|
$now=time();
|
||||||
$insts[]=$inst;
|
if ($responded) {
|
||||||
$res=myq($link,'SELECT ID FROM Instances WHERE URI=\''.myesc($link,$inst).'\'');
|
lecho(1,'instance «'.$inst.'» responded :-)'.N);
|
||||||
if (mysqli_num_rows($res)==0) {
|
$insts[]=$inst;
|
||||||
lecho(1,'instance «'.$inst.'» is new :-)'.N);
|
$res=myq($link,'SELECT ID FROM Instances WHERE URI=\''.myesc($link,$inst).'\'');
|
||||||
myq($link,'INSERT INTO Instances SET URI=\''.myesc($link,$inst).'\', InsertTS='.$now);
|
$cres=mysqli_num_rows($res);
|
||||||
$newc++;
|
if ($cres<1) {
|
||||||
}
|
lecho(1,'instance «'.$inst.'» is new to “Instances” table, adding it :-)'.N);
|
||||||
}
|
myq($link,'INSERT INTO Instances SET URI=\''.myesc($link,$inst).'\', InsertTS='.$now);
|
||||||
$res=myq($link,'SELECT * FROM Peers WHERE Hostname=\''.myesc($link,$inst).'\'');
|
$totnewc++;
|
||||||
$nrows=mysqli_num_rows($res);
|
$newc++;
|
||||||
if ($nrows>0) {
|
} elseif ($cres>1) {
|
||||||
if ($nrows>1) lecho(2,'«'.$inst.'» has '.$nrows.' records in “Peers” table! :-('.N);
|
lecho(2,'instance «'.$inst.'» has '.$cres.' records in “Instances” table! :-('.N);
|
||||||
$row=mysqli_fetch_assoc($res);
|
|
||||||
if ($responded) myq($link,'UPDATE Peers SET LastOkCheckTS='.$now.' WHERE ID='.$row['ID']);
|
|
||||||
} else {
|
} else {
|
||||||
$query='INSERT INTO Peers SET Hostname=\''.myesc($link,$inst).'\', FirstCheckTS='.$now;
|
lecho(1,'instance «'.$inst.'» is already present in “Instances” table.'.N);//+++
|
||||||
if ($responded) $query.=', LastOkCheckTS='.$now;
|
|
||||||
myq($link,$query);
|
|
||||||
}
|
}
|
||||||
} else {
|
} else {
|
||||||
lecho(2,'ignoring instance «'.$inst.'» because it matches an exclusion regexp: won’t add it to «Instances» and «Peers» tables.'.N);
|
lecho(1,'instance «'.$inst.'» didn’t respond :-('.N);
|
||||||
}
|
}
|
||||||
|
$res=myq($link,'SELECT * FROM Peers WHERE Hostname=\''.myesc($link,$inst).'\'');
|
||||||
|
$cres=mysqli_num_rows($res);
|
||||||
|
if ($cres<1) {
|
||||||
|
lecho(1,'instance «'.$inst.'» is new to “Peers” table, adding it :-)'.N);
|
||||||
|
$query='INSERT INTO Peers SET Hostname=\''.myesc($link,$inst).'\', FirstCheckTS='.$now;
|
||||||
|
if ($responded) $query.=', LastOkCheckTS='.$now;
|
||||||
|
myq($link,$query);
|
||||||
|
} elseif ($cres>0) {
|
||||||
|
if ($cres>1) lecho(2,'«'.$inst.'» has '.$cres.' records in “Peers” table! :-('.N);
|
||||||
|
if ($responded) {
|
||||||
|
lecho(1,'instance «'.$inst.'» is already present in “Peers” table, but it responded: updating its record’s “LastOkCheckTS” value...'.N);
|
||||||
|
$row=mysqli_fetch_assoc($res);
|
||||||
|
myq($link,'UPDATE Peers SET LastOkCheckTS='.$now.' WHERE ID='.$row['ID']);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
$now=time();
|
||||||
|
$rtela=$now-$rtini;
|
||||||
|
lecho(1,'round '.$id.': finished working on instance «'.$inst.'» ('.$i.'/'.$clist.'); RoundElapsedTime: '.ght($rtela,null,0).'; RoundEstimatedTimeRemaining: '.ght($rtela/$i*$clist-$rtela,null,0).'; RoundNewInsts: '.$newc.'; NextRoundInsts: '.count($nlist).'; TotElapsedTime: '.ght($now-$tini,null,0).'; TotConsideredInsts: '.count($ckinsts).'; TotRespondingInsts: '.count($insts).'; TotNewInsts: '.$totnewc.'; using '.ghs(memory_get_usage(true)).' mem. (peak: '.ghs(memory_get_peak_usage(true)).').'.N);
|
||||||
}
|
}
|
||||||
unset($list);
|
unset($list);
|
||||||
if (count($nlist)>0) {
|
$now=time();
|
||||||
|
$rtela=$now-$rtini;
|
||||||
|
$cnlist=count($nlist);
|
||||||
|
lecho(1,'END OF ROUND STATS: RoundCheckedInsts: '.$clist.'; RoundElapsedTime: '.ght($rtela,null,0).'; RoundNewInsts: '.$newc.'; NextRoundInsts: '.$cnlist.'; TotElapsedTime: '.ght($now-$tini,null,0).'; TotConsideredInsts: '.count($ckinsts).'; TotRespondingInsts: '.count($insts).'; TotNewInsts: '.$totnewc.'; using '.ghs(memory_get_usage(true)).' mem. (peak: '.ghs(memory_get_peak_usage(true)).').'.N);
|
||||||
|
if ($cnlist<1) lecho(1,'next round list is empty.'.N);
|
||||||
|
lecho(1,'###### END OF ROUND '.$id.' ######'.N);
|
||||||
|
if ($cnlist>0) {
|
||||||
crawl($nlist,$id+1);
|
crawl($nlist,$id+1);
|
||||||
if ($id+1>$maxround) $maxround=$id+1;
|
if ($id+1>$maxround) $maxround=$id+1;
|
||||||
} else {
|
|
||||||
lecho(1,'next round list is empty.'.N);
|
|
||||||
}
|
}
|
||||||
lecho(1,'###### END OF ROUND '.$id.' ######'.N);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
function mexit($lev,$msg,$code,$remlock) {
|
function mexit($lev,$msg,$code,$remlock) {
|
||||||
global $link, $insts, $cinsts, $lockfp, $opts;
|
global $link, $insts, $ckinsts, $lockfp, $opts;
|
||||||
if (isset($insts) && is_array($insts)) sortcheckandsave($insts,'list of responding instances',$opts['peersfp']);
|
if (isset($insts) && is_array($insts)) sortcheckandsave($insts,'list of responding instances',$opts['peersfp']);
|
||||||
if (isset($cinsts) && is_array($cinsts)) sortcheckandsave($cinsts,'list of checked instances',$opts['cpeersfp']);
|
if (isset($ckinsts) && is_array($ckinsts)) sortcheckandsave($ckinsts,'list of checked instances',$opts['ckpeersfp']);
|
||||||
if ($remlock && isset($lockfp) && is_file($lockfp)) unlink($lockfp);
|
if ($remlock && isset($lockfp) && is_file($lockfp)) unlink($lockfp);
|
||||||
lecho($lev,$msg);
|
lecho($lev,$msg);
|
||||||
exit($code);
|
exit($code);
|
||||||
|
@ -369,7 +414,7 @@ function myq(&$link,$query) {
|
||||||
function microdate($time=null) {
|
function microdate($time=null) {
|
||||||
if (is_null($time)) $time=microtime(false);
|
if (is_null($time)) $time=microtime(false);
|
||||||
$time=explode(' ',$time);
|
$time=explode(' ',$time);
|
||||||
return(date('Y-m-d H:i:s',$time[1]).'.'.substr($time[0],2));
|
return(date('Y-m-d H:i:s',$time[1]).'.'.substr($time[0],2,-2));
|
||||||
}
|
}
|
||||||
|
|
||||||
function sortcheckandsave(&$arr,$arrdesc,&$fp) {
|
function sortcheckandsave(&$arr,$arrdesc,&$fp) {
|
||||||
|
|
Loading…
Reference in a new issue