update.php 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409
  1. #!/usr/bin/env php
  2. <?php
  // Bootstrap: make the bundled "include" directory resolvable, run from the
  // script's own directory, and load the application libraries.
  $base_dir = dirname(__FILE__);

  set_include_path($base_dir . "/include" . PATH_SEPARATOR . get_include_path());

  // Must be defined before the libraries below are loaded.
  define('DISABLE_SESSIONS', true);

  chdir($base_dir);

  require_once "autoload.php";
  require_once "functions.php";
  require_once "rssfuncs.php";
  require_once "config.php";
  require_once "sanity_check.php";
  require_once "db.php";
  require_once "db-prefs.php";

  // Fall back to a default interpreter path when none has been defined by the
  // files loaded above.
  if (!defined('PHP_EXECUTABLE')) {
      define('PHP_EXECUTABLE', '/usr/bin/php');
  }

  init_plugins();
  // Long options understood by this script. A trailing ":" marks an option
  // that requires a value (getopt() convention).
  $longopts = array(
      "feeds",
      "feedbrowser",
      "daemon",
      "daemon-loop",
      "task:",
      "cleanup-tags",
      "quiet",
      "log:",
      "indexes",
      "pidlock:",
      "update-schema",
      "convert-filters",
      "force-update",
      "gen-search-idx",
      "list-plugins",
      "debug-feed:",
      "force-refetch",
      "force-rehash",
      "help"
  );

  // Plugins may register additional commands; each supplies its own getopt
  // suffix.
  foreach (PluginHost::getInstance()->get_commands() as $command => $data) {
      $longopts[] = $command . $data["suffix"];
  }

  $options = getopt("", $longopts);

  // getopt() yields a non-array on failure.
  if (!is_array($options)) {
      die("error: getopt() failed. " .
          "Most probably you are using PHP CGI to run this script " .
          "instead of required PHP CLI. Check tt-rss wiki page on updating feeds for " .
          "additional information.\n");
  }
  // No options and no STDIN constant: the script is not running under the CLI
  // SAPI, so emit an HTML page asking the user to run it from the command line.
  // The hint names "--help" because only the long option is registered with
  // getopt(); a single-dash "-help" is not recognised.
  if (count($options) == 0 && !defined('STDIN')) {
  ?> <html>
  <head>
  <title>Tiny Tiny RSS data update script.</title>
  <meta http-equiv="Content-Type" content="text/html; charset=utf-8">
  <link rel="stylesheet" type="text/css" href="css/utility.css">
  </head>
  <body>
  <div class="floatingLogo"><img src="images/logo_small.png"></div>
  <h1><?php echo __("Tiny Tiny RSS data update script.") ?></h1>
  <?php print_error("Please run this script from the command line. Use option \"--help\" to display command help if this error is displayed erroneously."); ?>
  </body></html>
  <?php
      exit;
  }
  // Print usage when no option was given or --help was requested, then stop
  // processing this file.
  if (isset($options["help"]) || count($options) == 0) {
      $usage = array(
          "Tiny Tiny RSS data update script.\n\n",
          "Options:\n",
          " --feeds - update feeds\n",
          " --feedbrowser - update feedbrowser\n",
          " --daemon - start single-process update daemon\n",
          " --task N - create lockfile using this task id\n",
          " --cleanup-tags - perform tags table maintenance\n",
          " --quiet - don't output messages to stdout\n",
          " --log FILE - log messages to FILE\n",
          " --indexes - recreate missing schema indexes\n",
          " --update-schema - update database schema\n",
          " --gen-search-idx - generate basic PostgreSQL fulltext search index\n",
          " --convert-filters - convert type1 filters to type2\n",
          " --force-update - force update of all feeds\n",
          " --list-plugins - list all available plugins\n",
          " --debug-feed N - perform debug update of feed N\n",
          " --force-refetch - debug update: force refetch feed data\n",
          " --force-rehash - debug update: force rehash articles\n",
          " --help - show this help\n",
          "Plugin options:\n"
      );

      print implode("", $usage);

      // One line per plugin-registered command: name, argument hint, description.
      foreach (PluginHost::getInstance()->get_commands() as $command => $data) {
          $args = $data['arghelp'];
          printf(" --%-19s - %s\n", $command . " " . $args, $data["description"]);
      }

      return;
  }
  // The custom error handler is loaded for every mode except --daemon.
  $is_daemon_mode = isset($options['daemon']);
  if (!$is_daemon_mode) {
      require_once "errorhandler.php";
  }

  // Every mode except --update-schema requires the database to already be at
  // the schema version this code expects.
  $is_schema_update = isset($options['update-schema']);
  if (!$is_schema_update) {
      $schema_version = get_schema_version();

      if ($schema_version != SCHEMA_VERSION) {
          die("Schema version is wrong, please upgrade the database.\n");
      }
  }

  // QUIET is true when --quiet was passed.
  define('QUIET', isset($options['quiet']));

  // --log FILE: announce the log target, then publish it as LOGFILE.
  if (isset($options["log"])) {
      $log_target = $options["log"];
      _debug("Logging to " . $log_target);
      define('LOGFILE', $log_target);
  }
  // Choose the lockfile name: daemon and one-shot runs use different base
  // names, --task appends a suffix, and --pidlock replaces the name entirely.
  $lock_filename = isset($options["daemon"]) ? "update_daemon.lock" : "update.lock";

  if (isset($options["task"])) {
      _debug("Using task id " . $options["task"]);
      $lock_filename = $lock_filename . "-task_" . $options["task"];
  }

  if (isset($options["pidlock"])) {
      $my_pid = $options["pidlock"];
      $lock_filename = "update_daemon-$my_pid.lock";
  }

  _debug("Lock: $lock_filename");

  $lock_handle = make_lockfile($lock_filename);
  $must_exit = false;

  // Try to lock a file in order to avoid concurrent update. Checked right
  // after the attempt so that a failed lock aborts immediately instead of
  // first sitting through the staggered start-up delay below.
  if (!$lock_handle) {
      die("error: Can't create lockfile ($lock_filename). " .
          "Maybe another update process is already running.\n");
  }

  // With both --task and --pidlock, delay start-up by 5 seconds per task id.
  // The id is cast to int and the delay clamped at zero so a non-numeric or
  // negative --task value cannot raise an arithmetic/sleep() error.
  if (isset($options["task"]) && isset($options["pidlock"])) {
      $waits = max(0, (int) $options["task"] * 5);
      _debug("Waiting before update ($waits)");
      sleep($waits);
  }
  // --force-update: reset both update timestamps on every feed to the epoch
  // so that all feeds are treated as needing an update.
  if (isset($options["force-update"])) {
      _debug("marking all feeds as needing update...");
      db_query("UPDATE ttrss_feeds SET last_update_started = '1970-01-01',
          last_updated = '1970-01-01'");
  }

  // --feeds: one-shot feed update followed by housekeeping and plugin hooks.
  if (isset($options["feeds"])) {
      update_daemon_common();
      housekeeping_common(true);

      // $op is never assigned in this script; initialise it explicitly so the
      // hook call does not read an undefined variable. Any value set by an
      // included file is left untouched.
      if (!isset($op)) {
          $op = null;
      }

      PluginHost::getInstance()->run_hooks(PluginHost::HOOK_UPDATE_TASK, "hook_update_task", $op);
  }

  // --feedbrowser: refresh the feed browser cache and report the count.
  if (isset($options["feedbrowser"])) {
      $count = update_feedbrowser_cache();
      print "Finished, $count feeds processed.\n";
  }
  // --daemon: run forever, spawning this same script with --daemon-loop and
  // sleeping DAEMON_SLEEP_INTERVAL seconds between runs.
  if (isset($options["daemon"])) {
      // The child command line never changes, so build it once. The script
      // path and the log file name are shell-escaped so that spaces or shell
      // metacharacters in them cannot split or alter the command.
      // PHP_EXECUTABLE is left as configured.
      $daemon_cmd = PHP_EXECUTABLE . " " . escapeshellarg($argv[0]) . " --daemon-loop";

      if (isset($options["quiet"])) {
          $daemon_cmd .= " --quiet";
      }

      if (isset($options['log'])) {
          $daemon_cmd .= " --log " . escapeshellarg($options['log']);
      }

      while (true) {
          passthru($daemon_cmd);

          _debug("Sleeping for " . DAEMON_SLEEP_INTERVAL . " seconds...");
          sleep(DAEMON_SLEEP_INTERVAL);
      }
  }
  // --daemon-loop: a single daemon iteration (spawned by --daemon above).
  if (isset($options["daemon-loop"])) {
      if (!make_stampfile('update_daemon.stamp')) {
          _debug("warning: unable to create stampfile\n");
      }

      $has_pidlock = isset($options["pidlock"]);

      // A --pidlock run uses a fixed limit of 50; otherwise the configured
      // DAEMON_FEED_LIMIT applies.
      update_daemon_common($has_pidlock ? 50 : DAEMON_FEED_LIMIT);

      // Housekeeping runs when there is no pidlock, or for task 0. A missing
      // --task is treated as task 0 (as the original loose comparison did)
      // without reading an undefined array index.
      $task_id = isset($options["task"]) ? (int) $options["task"] : 0;

      if (!$has_pidlock || $task_id === 0) {
          housekeeping_common(true);
      }

      // $op is never assigned in this script; initialise it explicitly so the
      // hook call does not read an undefined variable. Any value set by an
      // included file is left untouched.
      if (!isset($op)) {
          $op = null;
      }

      PluginHost::getInstance()->run_hooks(PluginHost::HOOK_UPDATE_TASK, "hook_update_task", $op);
  }
  // --cleanup-tags: run tag maintenance and report how many tags were removed.
  // NOTE(review): the meaning of the two numeric arguments is defined by
  // cleanup_tags(), which is not visible here.
  $wants_tag_cleanup = isset($options["cleanup-tags"]);

  if ($wants_tag_cleanup) {
      $rc = cleanup_tags(14, 50000);
      _debug($rc . " tags deleted.\n");
  }
  // --indexes: after interactive confirmation, drop the existing ttrss_*
  // indexes and recreate the single-line "create index" statements found in
  // the schema file for the configured database type.
  if (isset($options["indexes"])) {
      _debug("PLEASE BACKUP YOUR DATABASE BEFORE PROCEEDING!");
      _debug("Type 'yes' to continue.");

      if (read_stdin() != 'yes')
          exit;

      _debug("clearing existing indexes...");

      if (DB_TYPE == "pgsql") {
          $result = db_query("SELECT relname FROM
              pg_catalog.pg_class WHERE relname LIKE 'ttrss_%'
                  AND relname NOT LIKE '%_pkey'
              AND relkind = 'i'");
      } else {
          // information_schema.statistics covers every schema on the server
          // and holds one row per indexed column, so:
          //  - restrict to the current database, otherwise ttrss_* indexes of
          //    an unrelated database would be listed and dropped against the
          //    current one;
          //  - use DISTINCT so a multi-column index is dropped only once;
          //  - alias the columns so the result keys are lowercase on MySQL 8,
          //    which otherwise reports information_schema columns in uppercase.
          $result = db_query("SELECT DISTINCT index_name AS index_name, table_name AS table_name FROM
              information_schema.statistics WHERE index_name LIKE 'ttrss_%'
              AND table_schema = DATABASE()");
      }

      while ($line = db_fetch_assoc($result)) {
          if (DB_TYPE == "pgsql") {
              $statement = "DROP INDEX " . $line["relname"];
          } else {
              $statement = "ALTER TABLE " .
                  $line['table_name'] . " DROP INDEX " . $line['index_name'];
          }

          _debug($statement);

          // NOTE(review): the second argument presumably keeps a failed DROP
          // from aborting the run; confirm against db_query().
          db_query($statement, false);
      }

      _debug("reading indexes from schema for: " . DB_TYPE);

      $fp = fopen("schema/ttrss_schema_" . DB_TYPE . ".sql", "r");

      if ($fp) {
          while ($line = fgets($fp)) {
              $matches = array();

              // Only statements of the form "create index NAME on TARGET"
              // written on a single line, with no spaces inside TARGET, match.
              if (preg_match("/^create index ([^ ]+) on ([^ ]+)$/i", $line, $matches)) {
                  $index = $matches[1];
                  $table = $matches[2];

                  $statement = "CREATE INDEX $index ON $table";
                  _debug($statement);
                  db_query($statement);
              }
          }

          fclose($fp);
      } else {
          _debug("unable to open schema file.");
      }

      _debug("all done.");
  }
  // --convert-filters: after interactive confirmation, wipe ttrss_filters2 and
  // re-create each row of ttrss_filters through Pref_Filters::add().
  if (isset($options["convert-filters"])) {
      _debug("WARNING: this will remove all existing type2 filters.");
      _debug("Type 'yes' to continue.");

      if (read_stdin() != 'yes')
          exit;

      _debug("converting filters...");

      db_query("DELETE FROM ttrss_filters2");

      $result = db_query("SELECT * FROM ttrss_filters ORDER BY id");

      while ($line = db_fetch_assoc($result)) {
          $owner_uid = $line["owner_uid"];

          // date filters are removed
          if ($line["filter_type"] != 5) {
              $filter = array();

              if (sql_bool_to_bool($line["cat_filter"])) {
                  $feed_id = "CAT:" . (int)$line["cat_id"];
              } else {
                  $feed_id = (int)$line["feed_id"];
              }

              // Decode the boolean column the same way as cat_filter above.
              // A plain truthiness test treats the non-empty string 'f'
              // (PostgreSQL's textual false) as true, which would turn every
              // disabled filter into an enabled one.
              $filter["enabled"] = sql_bool_to_bool($line["enabled"]) ? "on" : "off";

              $filter["rule"] = array(
                  json_encode(array(
                      "reg_exp" => $line["reg_exp"],
                      "feed_id" => $feed_id,
                      "filter_type" => $line["filter_type"])));

              $filter["action"] = array(
                  json_encode(array(
                      "action_id" => $line["action_id"],
                      "action_param_label" => $line["action_param"],
                      "action_param" => $line["action_param"])));

              // Oh god it's full of hacks: the filter is injected through the
              // request/session superglobals for Pref_Filters to pick up.
              $_REQUEST = $filter;
              $_SESSION["uid"] = $owner_uid;

              $filters = new Pref_Filters($_REQUEST);
              $filters->add();
          }
      }
  }
  // --update-schema: after interactive confirmation, migrate the database one
  // schema version at a time up to SCHEMA_VERSION, stopping at the first
  // failed step.
  if (isset($options["update-schema"])) {
      _debug("checking for updates (" . DB_TYPE . ")...");

      $updater = new DbUpdater(Db::get(), DB_TYPE, SCHEMA_VERSION);

      if (!$updater->isUpdateRequired()) {
          _debug("update not required.");
      } else {
          _debug("schema update required, version " . $updater->getSchemaVersion() . " to " . SCHEMA_VERSION);
          _debug("WARNING: please backup your database before continuing.");
          _debug("Type 'yes' to continue.");

          if (read_stdin() != 'yes') {
              exit;
          }

          $i = $updater->getSchemaVersion() + 1;

          while ($i <= SCHEMA_VERSION) {
              _debug("performing update up to version $i...");

              $result = $updater->performUpdateTo($i, false);

              if ($result) {
                  _debug("OK!");
              } else {
                  _debug("FAILED!");
                  return;
              }

              $i++;
          }
      }
  }
  // --gen-search-idx: fill tsvector_combined for every entry where it is still
  // NULL, working through the table in batches of $limit rows.
  if (isset($options["gen-search-idx"])) {
      echo "Generating search index (stemming set to English)...\n";

      $result = db_query("SELECT COUNT(id) AS count FROM ttrss_entries WHERE tsvector_combined IS NULL");
      $count = db_fetch_result($result, 0, "count");

      print "Articles to process: $count.\n";

      $limit = 500;
      $processed = 0;

      do {
          $result = db_query("SELECT id, title, content FROM ttrss_entries WHERE tsvector_combined IS NULL ORDER BY id LIMIT $limit");

          while ($line = db_fetch_assoc($result)) {
              // A space is inserted before every "<" before the tags are
              // stripped; the combined text is capped at 1000000 characters.
              $plain_content = strip_tags(str_replace('<', ' <', $line['content']));
              $combined_text = mb_substr($line['title'] . ' ' . $plain_content, 0, 1000000);
              $tsvector_combined = db_escape_string($combined_text);

              db_query("UPDATE ttrss_entries SET tsvector_combined = to_tsvector('english', '$tsvector_combined') WHERE id = " . $line["id"]);
          }

          $batch_rows = db_num_rows($result);
          $processed += $batch_rows;

          print "Processed $processed articles...\n";

          // A batch shorter than the limit means nothing is left to process.
      } while ($batch_rows == $limit);

      echo "All done.\n";
  }
  // --list-plugins: load every available plugin into a throw-away host and
  // print name, kind, version, author and description for each one.
  if (isset($options["list-plugins"])) {
      $tmppluginhost = new PluginHost();
      // Class constant referenced through the class name, not an instance.
      $tmppluginhost->load_all(PluginHost::KIND_ALL, false);

      // PLUGINS is a comma-separated list of plugin names.
      $enabled = array_map("trim", explode(",", PLUGINS));

      echo "List of all available plugins:\n";

      foreach ($tmppluginhost->get_plugins() as $name => $plugin) {
          $about = $plugin->about();

          // Element 3 is read as a "system plugin" flag. Guard the lookup so
          // an about() array without it is listed as a user plugin instead of
          // raising an undefined-offset notice.
          $status = !empty($about[3]) ? "system" : "user";

          if (in_array($name, $enabled)) $name .= "*";

          printf("%-50s %-10s v%.2f (by %s)\n%s\n\n",
              $name, $status, $about[0], $about[2], $about[1]);
      }

      echo "Plugins marked by * are currently enabled for all users.\n";
  }
  // --debug-feed N: update a single feed with debugging switched on. The
  // optional force flags are handed over through $_REQUEST.
  if (isset($options["debug-feed"])) {
      $feed = $options["debug-feed"];

      if (isset($options["force-refetch"])) {
          $_REQUEST["force_refetch"] = true;
      }

      if (isset($options["force-rehash"])) {
          $_REQUEST["force_rehash"] = true;
      }

      $_REQUEST['xdebug'] = 1;

      update_rss_feed($feed);
  }
  // Let plugins handle any of their own command-line options, then remove this
  // run's lockfile if it is still present.
  PluginHost::getInstance()->run_commands($options);

  $lock_path = LOCK_DIRECTORY . "/$lock_filename";

  if (file_exists($lock_path)) {
      unlink($lock_path);
  }
  311. ?>