2009-04-22 03:09:27 +01:00
|
|
|
#!/usr/bin/env php
|
|
|
|
<?php
|
2019-11-01 12:27:36 +00:00
|
|
|
// This file is part of GNU social - https://www.gnu.org/software/social
//
// GNU social is free software: you can redistribute it and/or modify
// it under the terms of the GNU Affero General Public License as published by
// the Free Software Foundation, either version 3 of the License, or
// (at your option) any later version.
//
// GNU social is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU Affero General Public License for more details.
//
// You should have received a copy of the GNU Affero General Public License
// along with GNU social. If not, see <http://www.gnu.org/licenses/>.

/**
 * @copyright 2008-2010 StatusNet, Inc
 * @license   https://www.gnu.org/licenses/agpl.html GNU AGPL v3 or later
 */
|
|
|
|
|
2009-08-26 01:59:06 +01:00
|
|
|
// Installation root: three directory levels above this script, canonicalised
// by realpath(). PUBLICDIR is the "public" directory directly beneath it.
define('INSTALLDIR', realpath(__DIR__ . '/../../..'));
define('PUBLICDIR', INSTALLDIR . DIRECTORY_SEPARATOR . 'public');

// Tune number of processes and how often to poll Twitter
// XXX: Should these things be in config.php?
define('MAXCHILDREN', 2);
define('POLL_INTERVAL', 70); // in seconds, Twitter API v1.1 says 15 calls every 15 mins

// getopt-style option specs: -d / --debug is a flag, -i / --id takes an
// optional value ("::").
$shortoptions = 'di::';
$longoptions = array('id::', 'debug');

// NOTE(review): the column alignment of the option lines below could not be
// recovered from the reviewed copy of this file - confirm against upstream.
$helptext = <<<END_OF_TRIM_HELP
Batch script for retrieving Twitter messages from foreign service.

-i --id Identity (default 'generic')
-d --debug Debug (lots of log output)

END_OF_TRIM_HELP;

// The core includes live under INSTALLDIR; twitter.php sits one directory
// above this script.
require_once INSTALLDIR . '/scripts/commandline.inc';
require_once INSTALLDIR . '/lib/util/common.php';
require_once INSTALLDIR . '/lib/util/daemon.php';
require_once dirname(__DIR__) . '/twitter.php';
|
2009-06-17 20:31:35 +01:00
|
|
|
|
|
|
|
/**
 * Fetch statuses from Twitter
 *
 * Fetches statuses from Twitter and hands them to the 'tweetin' queue so
 * they can be inserted as notices.
 *
 * NOTE: an Avatar path MUST be set in config.php for this
 * script to work, e.g.:
 *     $config['avatar']['path'] = $config['site']['path'] . '/avatar/';
 *
 * @todo @fixme @gar Fix the above. For some reason $_path is always empty when
 * this script is run, so the default avatar path is always set wrong in
 * default.php. Therefore it must be set explicitly in config.php. --Z
 *
 * @category Twitter
 * @package  StatusNet
 * @author   Zach Copley <zach@status.net>
 * @author   Evan Prodromou <evan@status.net>
 * @license  http://www.fsf.org/licensing/licenses/agpl-3.0.html GNU Affero General Public License version 3.0
 * @link     http://status.net/
 */
class TwitterStatusFetcher extends ParallelizingDaemon
{
    /**
     * Constructor
     *
     * All arguments are forwarded unchanged to the parent daemon.
     *
     * @param string  $id           the name/id of this daemon
     * @param int     $interval     sleep this long before doing everything again
     * @param int     $max_children maximum number of child processes at a time
     * @param boolean $debug        debug output flag
     */
    public function __construct(
        $id = null,
        $interval = 60,
        $max_children = 2,
        $debug = null
    ) {
        parent::__construct($id, $interval, $max_children, $debug);
    }

    /**
     * Name of this daemon
     *
     * @return string 'twitterstatusfetcher.' followed by the daemon id.
     */
    public function name()
    {
        return 'twitterstatusfetcher.' . $this->_id;
    }

    /**
     * Find all the Twitter foreign links for users who have requested
     * importing of their friends' timelines
     *
     * Links are read ordered by last_noticesync and kept only when their
     * noticesync bitmask has FOREIGN_NOTICE_RECV set. The database
     * connection used for the lookup is closed and dropped from the
     * DB_DataObject connection cache before returning.
     *
     * @return array flinks an array of Foreign_link objects
     */
    public function getObjects()
    {
        global $_DB_DATAOBJECT;

        $flink = new Foreign_link();
        $conn = &$flink->getDatabaseConnection();

        $flink->service = TWITTER_SERVICE;
        $flink->orderBy('last_noticesync');
        $flink->find();

        $flinks = array();

        while ($flink->fetch()) {
            if (($flink->noticesync & FOREIGN_NOTICE_RECV) == FOREIGN_NOTICE_RECV) {
                // $flink is reused as the fetch cursor, so keep a copy.
                $flinks[] = clone $flink;
                common_log(LOG_INFO, "sync: foreign id $flink->foreign_id");
            } else {
                common_log(LOG_INFO, "nothing to sync");
            }
        }

        $flink->free();
        unset($flink);

        $conn->disconnect();
        unset($_DB_DATAOBJECT['CONNECTIONS']);

        return $flinks;
    }

    /**
     * Fetch the home and mentions timelines for one foreign link
     *
     * FIXME: make it so we can force a Foreign_link here without colliding with parent
     *
     * @param Foreign_link $flink the Twitter link to synchronise
     *
     * @return void
     */
    public function childTask($flink)
    {
        // Each child ps needs its own DB connection

        // Note: DataObject::getDatabaseConnection() creates
        // a new connection if there isn't one already
        $conn = &$flink->getDatabaseConnection();

        $this->getTimeline($flink, 'home_timeline');
        $this->getTimeline($flink, 'mentions_timeline');

        // NOTE(review): this stamps last_friendsync although the task fetches
        // notices (getTimeline() maintains last_noticesync) - confirm intent.
        $flink->last_friendsync = common_sql_now();
        $flink->update();

        $conn->disconnect();

        // XXX: Couldn't find a less brutal way to blow
        // away a cached connection
        global $_DB_DATAOBJECT;
        unset($_DB_DATAOBJECT['CONNECTIONS']);
    }

    /**
     * Fetch one timeline for a foreign link and enqueue its statuses
     *
     * Links whose credentials are not a packed OAuth token are skipped.
     * Otherwise statuses newer than the stored last id are requested, each
     * one is enqueued on the 'tweetin' queue, the stored last id is advanced
     * and last_noticesync is updated. When nothing is retrieved (including
     * when the request throws) the method returns without touching the
     * stored last id or last_noticesync.
     *
     * @param Foreign_link $flink       the Twitter link to fetch for
     * @param string       $timelineUri timeline name, e.g. 'home_timeline'
     *
     * @return void
     */
    public function getTimeline(Foreign_link $flink, $timelineUri = 'home_timeline')
    {
        common_log(LOG_DEBUG, $this->name() . ' - Trying to get ' . $timelineUri .
                   ' timeline for Twitter user ' . $flink->foreign_id);

        if (!TwitterOAuthClient::isPackedToken($flink->credentials)) {
            common_log(LOG_ERR, "Skipping " . $timelineUri . " timeline for " .
                       $flink->foreign_id . " since not OAuth.");
            // Without a token there is no client to query. Falling through
            // would call a method on null, which the Exception handler below
            // does not catch.
            return;
        }

        $token = TwitterOAuthClient::unpackToken($flink->credentials);
        $client = new TwitterOAuthClient($token->key, $token->secret);
        common_log(LOG_DEBUG, $this->name() . ' - Grabbing ' . $timelineUri . ' timeline with OAuth.');

        $lastId = Twitter_synch_status::getLastId($flink->foreign_id, $timelineUri);

        common_log(LOG_DEBUG, "Got lastId value '" . $lastId . "' for foreign id '" .
                   $flink->foreign_id . "' and timeline '" . $timelineUri. "'");

        $timeline = null;

        try {
            $timeline = $client->statusesTimeline($lastId, $timelineUri);
        } catch (Exception $e) {
            // Best effort: log and fall through to the empty-timeline exit.
            common_log(LOG_ERR, $this->name() .
                       ' - Unable to get ' . $timelineUri . ' timeline for user ' . $flink->user_id .
                       ' - code: ' . $e->getCode() . ' msg: ' . $e->getMessage());
        }

        if (empty($timeline)) {
            common_log(LOG_DEBUG, $this->name() . " - Empty '" . $timelineUri . "' timeline.");
            return;
        }

        common_log(LOG_INFO, $this->name() .
                   ' - Retrieved ' . count($timeline) . ' statuses from ' . $timelineUri . ' timeline' .
                   ' - for user ' . $flink->user_id);

        $qm = QueueManager::get();

        // Reverse to preserve order (presumably the timeline arrives newest
        // first: its first element supplies the new last id below).
        foreach (array_reverse($timeline) as $status) {
            $data = array(
                'status'   => $status,
                'for_user' => $flink->foreign_id,
            );
            $qm->enqueue($data, 'tweetin');
        }

        $lastId = twitter_id($timeline[0]);
        Twitter_synch_status::setLastId($flink->foreign_id, $timelineUri, $lastId);
        common_debug("Set lastId value '$lastId' for foreign id '{$flink->foreign_id}' and timeline '" .
                     $timelineUri . "'");

        // Okay, record the time we synced with Twitter for posterity
        $flink->last_noticesync = common_sql_now();
        $flink->update();
    }
}
|
2009-04-24 22:27:31 +01:00
|
|
|
|
2009-08-06 23:52:58 +01:00
|
|
|
// Daemon identity: -i wins, then --id, then the first positional argument;
// otherwise it stays null.
$id = null;

if (have_option('i')) {
    $id = get_option_value('i');
} elseif (have_option('--id')) {
    $id = get_option_value('--id');
} elseif (count($args) > 0) {
    $id = $args[0];
}

// Long options are looked up with their leading dashes, exactly like '--id'
// above; the bare name 'debug' never matched, so --debug was ignored.
$debug = null;

if (have_option('d') || have_option('--debug')) {
    $debug = true;
}

$fetcher = new TwitterStatusFetcher($id, POLL_INTERVAL, MAXCHILDREN, $debug);
$fetcher->runOnce();
|