forked from GNUsocial/gnu-social
Initial stub code for pulling data from Twitter's User Streams and Site Streams interfaces. This should allow us to make a much more efficient background importer which can use a relatively small number of connections getting push data for either a single user or for many users with credentials on the site.
This commit is contained in:
parent
949ede654b
commit
3b304fc0ef
224
plugins/TwitterBridge/jsonstreamreader.php
Normal file
224
plugins/TwitterBridge/jsonstreamreader.php
Normal file
@ -0,0 +1,224 @@
|
|||||||
|
<?php
|
||||||
|
/**
|
||||||
|
* StatusNet, the distributed open-source microblogging tool
|
||||||
|
*
|
||||||
|
* PHP version 5
|
||||||
|
*
|
||||||
|
* LICENCE: This program is free software: you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU Affero General Public License as published by
|
||||||
|
* the Free Software Foundation, either version 3 of the License, or
|
||||||
|
* (at your option) any later version.
|
||||||
|
*
|
||||||
|
* This program is distributed in the hope that it will be useful,
|
||||||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
* GNU Affero General Public License for more details.
|
||||||
|
*
|
||||||
|
* You should have received a copy of the GNU Affero General Public License
|
||||||
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
*
|
||||||
|
* @category Plugin
|
||||||
|
* @package StatusNet
|
||||||
|
* @author Brion Vibber <brion@status.net>
|
||||||
|
* @copyright 2010 StatusNet, Inc.
|
||||||
|
* @license http://www.fsf.org/licensing/licenses/agpl-3.0.html GNU Affero General Public License version 3.0
|
||||||
|
* @link http://status.net/
|
||||||
|
*/
|
||||||
|
|
||||||
|
/**
 * Plain value holder for the four strings making up a set of OAuth
 * credentials. All fields start out as null.
 */
class OAuthData
{
    public $consumer_key;
    public $consumer_secret;
    public $token;
    public $token_secret;
}
|
||||||
|
|
||||||
|
/**
 * Base class for reading a stream of newline-delimited JSON messages over a
 * long-lived HTTP connection.
 *
 * Usage: call connect() to open the socket and send the HTTP request, hand
 * the result of getSockets() to an I/O loop, and pass any readable socket
 * back to handleInput(). Every decoded JSON message is delivered to
 * handleJson(), which subclasses must implement.
 */
abstract class JsonStreamReader
{
    const CRLF = "\r\n";

    public $id;
    protected $socket = null;
    protected $state = 'init'; // 'init', 'connecting', 'waiting', 'headers', 'active'

    /** @var array raw HTTP response header lines, in order of arrival */
    protected $responseHeaders = array();

    /** @var string received bytes that do not yet form a complete line */
    protected $pending = '';

    public function __construct()
    {
        $this->id = get_class($this) . '.' . substr(md5(mt_rand()), 0, 8);
    }

    /**
     * Open the connection and send the HTTP request.
     *
     * The connect itself is currently synchronous; the socket is switched
     * to non-blocking mode once the request has been written.
     *
     * @param string $url http:// or https:// URL of the stream
     *
     * @throws ServerException on unsupported URL scheme or connect failure
     */
    public function connect($url)
    {
        common_log(LOG_DEBUG, "$this->id opening connection to $url");

        $scheme = parse_url($url, PHP_URL_SCHEME);
        if ($scheme == 'http') {
            $rawScheme = 'tcp';
        } else if ($scheme == 'https') {
            $rawScheme = 'ssl';
        } else {
            throw new ServerException('Invalid URL scheme for HTTP stream reader');
        }

        $host = parse_url($url, PHP_URL_HOST);
        $port = parse_url($url, PHP_URL_PORT);
        if (!$port) {
            $port = ($scheme == 'https') ? 443 : 80;
        }

        $path = parse_url($url, PHP_URL_PATH);
        if (!$path) {
            // A URL without a path would otherwise give "GET  HTTP/1.1".
            $path = '/';
        }
        $query = parse_url($url, PHP_URL_QUERY);
        if ($query) {
            $path .= '?' . $query;
        }

        $errno = $errstr = null;
        $timeout = 5;
        // @fixme use STREAM_CLIENT_ASYNC_CONNECT for a truly async connect
        $flags = STREAM_CLIENT_CONNECT;
        // @fixme add SSL params
        $socket = stream_socket_client("$rawScheme://$host:$port", $errno, $errstr, $timeout, $flags);
        if (!$socket) {
            // stream_socket_client() returns false on failure; without this
            // check the request below would be written to a non-resource.
            throw new ServerException("Could not connect to $host:$port: $errstr ($errno)");
        }

        $this->socket = $socket;
        // Start from a clean slate in case this reader is being reconnected.
        $this->responseHeaders = array();
        $this->pending = '';

        $this->send($this->httpOpen($host, $path));

        stream_set_blocking($this->socket, false);
        $this->state = 'waiting';
    }

    /**
     * Write raw bytes to the connection.
     *
     * @param string $buffer
     */
    function send($buffer)
    {
        if (fwrite($this->socket, $buffer) === false) {
            common_log(LOG_ERR, "$this->id failed writing to socket.");
        }
    }

    /**
     * Read up to 64 KiB of whatever is currently available on the connection.
     *
     * @return mixed string of data (possibly empty), or false on read error
     */
    function read()
    {
        return fread($this->socket, 65536);
    }

    /**
     * Build the HTTP request that opens the stream.
     *
     * @param string $host value for the Host header
     * @param string $path request target, including any query string
     *
     * @return string complete request, terminated by a blank line
     */
    protected function httpOpen($host, $path)
    {
        $lines = array(
            "GET $path HTTP/1.1",
            "Host: $host",
            "User-Agent: StatusNet/" . STATUSNET_VERSION . " (TwitterBridgePlugin)",
            "Connection: close",
            "",
            ""
        );
        return implode(self::CRLF, $lines);
    }

    /**
     * Close the current connection, if open.
     */
    public function close()
    {
        if ($this->isConnected()) {
            common_log(LOG_DEBUG, "$this->id closing connection.");
            fclose($this->socket);
            $this->socket = null;
        }
    }

    /**
     * Are we currently connected?
     *
     * @return boolean
     */
    public function isConnected()
    {
        return $this->socket !== null;
    }

    /**
     * Send any sockets we're listening on to the IO manager
     * to wait for input.
     *
     * @return array of resources
     */
    public function getSockets()
    {
        if ($this->isConnected()) {
            return array($this->socket);
        }
        return array();
    }

    /**
     * Read whatever is available on the given socket and feed it to the
     * handler for the current connection state.
     *
     * If the remote end has closed the connection, the socket is closed
     * here so that it drops out of getSockets().
     *
     * @param resource $socket must be this reader's own socket
     *
     * @throws Exception on a foreign socket or an unexpected state
     */
    function handleInput($socket)
    {
        if ($this->socket !== $socket) {
            throw new Exception('Got input from unexpected socket!');
        }

        $buffer = $this->read();
        if ($buffer === false || ($buffer === '' && feof($this->socket))) {
            common_log(LOG_INFO, "$this->id connection closed by remote end.");
            $this->close();
            return;
        }

        switch ($this->state)
        {
        case 'waiting':
            $this->handleInputWaiting($buffer);
            break;
        case 'headers':
            $this->handleInputHeaders($buffer);
            break;
        case 'active':
            $this->handleInputActive($buffer);
            break;
        default:
            throw new Exception('Invalid state in handleInput: ' . $this->state);
        }
    }

    /**
     * First data after sending the request: start parsing response headers.
     *
     * @param string $buffer
     */
    function handleInputWaiting($buffer)
    {
        $this->state = 'headers';
        $this->handleInputHeaders($buffer);
    }

    /**
     * Consume HTTP response header lines.
     *
     * Only complete CRLF-terminated lines are processed; a partial line is
     * kept until the rest of it arrives. The blank line ending the headers
     * switches the reader to 'active', and anything following it in the
     * same chunk is handed to handleInputActive().
     *
     * @param string $buffer
     */
    function handleInputHeaders($buffer)
    {
        $this->pending .= $buffer;

        while (($pos = strpos($this->pending, self::CRLF)) !== false) {
            $line = substr($this->pending, 0, $pos);
            // Cast: substr() returns false instead of '' on older PHP
            // versions when nothing is left after the line terminator.
            $this->pending = (string)substr($this->pending, $pos + strlen(self::CRLF));

            if ($line == '') {
                $this->state = 'active';
                common_log(LOG_DEBUG, "$this->id connection is active!");

                $body = $this->pending;
                $this->pending = '';
                if ($body !== '') {
                    $this->handleInputActive($body);
                }
                return;
            }

            common_log(LOG_DEBUG, "$this->id read HTTP header: $line");
            $this->responseHeaders[] = $line;
        }
    }

    /**
     * Consume stream data: one JSON object per line.
     *
     * Reads are not guaranteed to end on a line boundary, so the trailing
     * partial line is kept until its newline arrives. Blank lines are
     * skipped silently. Anything that does not decode to a non-empty array
     * is logged and dropped rather than passed to handleJson().
     *
     * @param string $buffer
     */
    function handleInputActive($buffer)
    {
        $this->pending .= $buffer;

        $lines = explode("\n", $this->pending);
        // The last element is either '' (data ended on a newline) or the
        // start of a line we have not fully received yet.
        $this->pending = array_pop($lines);

        foreach ($lines as $line) {
            $line = rtrim($line, "\r");
            if ($line === '') {
                continue;
            }
            $data = json_decode($line, true);
            if (is_array($data) && $data) {
                $this->handleJson($data);
            } else {
                common_log(LOG_ERR, "$this->id received bogus JSON data: " . $line);
            }
        }
    }

    /**
     * Process one decoded JSON message from the stream.
     *
     * @param array $data
     */
    abstract function handleJson(array $data);
}
|
142
plugins/TwitterBridge/scripts/streamtest.php
Normal file
142
plugins/TwitterBridge/scripts/streamtest.php
Normal file
@ -0,0 +1,142 @@
|
|||||||
|
<?php
|
||||||
|
/**
|
||||||
|
* StatusNet, the distributed open-source microblogging tool
|
||||||
|
*
|
||||||
|
* PHP version 5
|
||||||
|
*
|
||||||
|
* LICENCE: This program is free software: you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU Affero General Public License as published by
|
||||||
|
* the Free Software Foundation, either version 3 of the License, or
|
||||||
|
* (at your option) any later version.
|
||||||
|
*
|
||||||
|
* This program is distributed in the hope that it will be useful,
|
||||||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
* GNU Affero General Public License for more details.
|
||||||
|
*
|
||||||
|
* You should have received a copy of the GNU Affero General Public License
|
||||||
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
*
|
||||||
|
* @category Plugin
|
||||||
|
* @package StatusNet
|
||||||
|
* @author Brion Vibber <brion@status.net>
|
||||||
|
* @copyright 2010 StatusNet, Inc.
|
||||||
|
* @license http://www.fsf.org/licensing/licenses/agpl-3.0.html GNU Affero General Public License version 3.0
|
||||||
|
* @link http://status.net/
|
||||||
|
*/
|
||||||
|
|
||||||
|
define('INSTALLDIR', realpath(dirname(__FILE__) . '/../../..'));

$shortoptions = 'n:';
$longoptions = array('nick=');

$helptext = <<<ENDOFHELP
USAGE: streamtest.php -n <username>

Attempts a User Stream connection to Twitter as the given user, dumping
data as it comes.

ENDOFHELP;

require_once INSTALLDIR.'/scripts/commandline.inc';
require_once dirname(dirname(__FILE__)) . '/jsonstreamreader.php';
require_once dirname(dirname(__FILE__)) . '/twitterstreamreader.php';

// The nickname may be given as -n <nick> or --nick=<nick>; without either
// there is nothing to do, so show the usage text and stop.
if (have_option('n')) {
    $nickname = get_option_value('n');
} else if (have_option('nick')) {
    // Must be looked up under the same name it was declared and tested
    // with ('nick' in $longoptions), not 'nickname'.
    $nickname = get_option_value('nick');
} else {
    show_help($helptext);
    exit(0);
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
*
|
||||||
|
* @param User $user
|
||||||
|
* @return TwitterOAuthClient
|
||||||
|
*/
|
||||||
|
function twitterAuthForUser(User $user)
{
    // Look up the user's link to the Twitter service.
    $link = Foreign_link::getByUserID($user->id, TWITTER_SERVICE);
    if (empty($link)) {
        throw new ServerException("No Twitter config for this user.");
    }

    // The link stores the OAuth access token in packed form.
    $accessToken = TwitterOAuthClient::unpackToken($link->credentials);
    if (empty($accessToken)) {
        throw new ServerException("No Twitter OAuth credentials for this user.");
    }

    $client = new TwitterOAuthClient($accessToken->key, $accessToken->secret);
    return $client;
}
|
||||||
|
|
||||||
|
/**
 * Build a user stream reader authenticated as the given user.
 *
 * @param User $user
 * @return TwitterUserStream
 */
function homeStreamForUser(User $user)
{
    return new TwitterUserStream(twitterAuthForUser($user));
}
|
||||||
|
|
||||||
|
$user = User::staticGet('nickname', $nickname);
if (!$user) {
    // homeStreamForUser() requires a User instance; stop with a readable
    // message instead of a type error when the nickname does not exist.
    print "No such user '$nickname'.\n";
    exit(1);
}

$stream = homeStreamForUser($user);

// Dump every message received on the stream as it arrives.
$stream->hookEvent('raw', function($data) {
    var_dump($data);
});
|
||||||
|
|
||||||
|
/**
 * I/O manager that wraps a single TwitterStreamReader, forwarding the
 * manager callbacks to the stream.
 */
class TwitterManager extends IoManager
{
    /**
     * The wrapped stream. Declared explicitly rather than created on first
     * assignment; kept public so existing access keeps working.
     *
     * @var TwitterStreamReader
     */
    public $stream;

    function __construct(TwitterStreamReader $stream)
    {
        $this->stream = $stream;
    }

    /**
     * @return array sockets the stream is currently listening on
     */
    function getSockets()
    {
        return $this->stream->getSockets();
    }

    /**
     * Pass the argument straight through to the stream's handleInput(),
     * which expects the socket that has input available.
     *
     * @param mixed $data
     * @return boolean always true
     */
    function handleInput($data)
    {
        $this->stream->handleInput($data);
        return true;
    }

    /**
     * Open the stream connection using the stream's default method.
     *
     * @return boolean always true
     */
    function start()
    {
        $this->stream->connect();
        return true;
    }

    /**
     * Close the stream connection.
     *
     * @return boolean always true
     */
    function finish()
    {
        $this->stream->close();
        return true;
    }

    /**
     * Instances are always built around a specific stream, so there is no
     * shared instance to hand out.
     *
     * @throws Exception always
     */
    public static function get()
    {
        throw new Exception('not a singleton');
    }
}
|
||||||
|
|
||||||
|
/**
 * I/O master that runs exactly one pre-built manager.
 */
class TwitterStreamMaster extends IoMaster
{
    /**
     * The manager to run. Declared explicitly rather than created on first
     * assignment; kept public so existing access keeps working.
     */
    public $ioManager;

    /**
     * @param string $id        identifier passed on to the parent constructor
     * @param mixed  $ioManager manager handed to instantiate() in initManagers()
     */
    function __construct($id, $ioManager)
    {
        parent::__construct($id);
        $this->ioManager = $ioManager;
    }

    /**
     * Initialize IoManagers which are appropriate to this instance.
     */
    function initManagers()
    {
        $this->instantiate($this->ioManager);
    }
}
|
||||||
|
|
||||||
|
// Wrap the stream in a manager, hand that to the master, and run it.
$manager = new TwitterManager($stream);
$master = new TwitterStreamMaster('TwitterStream', $manager);
$master->init();
$master->service();
|
161
plugins/TwitterBridge/twitterstreamreader.php
Normal file
161
plugins/TwitterBridge/twitterstreamreader.php
Normal file
@ -0,0 +1,161 @@
|
|||||||
|
<?php
|
||||||
|
/**
|
||||||
|
* StatusNet, the distributed open-source microblogging tool
|
||||||
|
*
|
||||||
|
* PHP version 5
|
||||||
|
*
|
||||||
|
* LICENCE: This program is free software: you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU Affero General Public License as published by
|
||||||
|
* the Free Software Foundation, either version 3 of the License, or
|
||||||
|
* (at your option) any later version.
|
||||||
|
*
|
||||||
|
* This program is distributed in the hope that it will be useful,
|
||||||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
* GNU Affero General Public License for more details.
|
||||||
|
*
|
||||||
|
* You should have received a copy of the GNU Affero General Public License
|
||||||
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
*
|
||||||
|
* @category Plugin
|
||||||
|
* @package StatusNet
|
||||||
|
* @author Brion Vibber <brion@status.net>
|
||||||
|
* @copyright 2010 StatusNet, Inc.
|
||||||
|
* @license http://www.fsf.org/licensing/licenses/agpl-3.0.html GNU Affero General Public License version 3.0
|
||||||
|
* @link http://status.net/
|
||||||
|
*/
|
||||||
|
|
||||||
|
/**
 * A single stream connection.
 *
 * Signs the stream URL with OAuth, and dispatches decoded messages to
 * callbacks registered with hookEvent(). Subclasses decide via
 * routeMessage() how an incoming message maps onto handleMessage().
 */
abstract class TwitterStreamReader extends JsonStreamReader
{
    protected $callbacks = array();

    // Declared explicitly rather than created on first assignment; kept
    // public so existing access keeps working.
    public $baseUrl;
    public $oauth;

    /**
     * @param TwitterOAuthClient $auth    credentials used to sign the request
     * @param string             $baseUrl scheme and host, without trailing slash
     */
    function __construct(TwitterOAuthClient $auth, $baseUrl)
    {
        // The parent constructor assigns $this->id, which prefixes every
        // log message written by the reader.
        parent::__construct();

        $this->baseUrl = $baseUrl;
        $this->oauth = $auth;
    }

    /**
     * Connect to the given method under the base URL.
     *
     * @param string $method path relative to the base URL
     */
    public function connect($method)
    {
        $url = $this->oAuthUrl($this->baseUrl . '/' . $method);
        return parent::connect($url);
    }

    /**
     * Sign our target URL with OAuth auth stuff.
     *
     * @param string $url
     * @param array $params
     * @return string
     */
    function oAuthUrl($url, $params=array())
    {
        // In an ideal world this would be better encapsulated. :)
        $request = OAuthRequest::from_consumer_and_token($this->oauth->consumer,
            $this->oauth->token, 'GET', $url, $params);
        $request->sign_request($this->oauth->sha1_method,
            $this->oauth->consumer, $this->oauth->token);

        return $request->to_url();
    }

    /**
     * Add an event callback. Available event names include
     * 'raw' (all data), 'friends', 'delete', 'scrubgeo', etc
     *
     * @param string $event
     * @param callable $callback
     */
    public function hookEvent($event, $callback)
    {
        $this->callbacks[$event][] = $callback;
    }

    /**
     * Call event handler callbacks for the given event.
     *
     * @param string $event
     * @param mixed $arg1 ... one or more params to pass on
     */
    public function fireEvent($event, $arg1)
    {
        if (array_key_exists($event, $this->callbacks)) {
            // Everything after the event name is passed to the callbacks.
            $args = array_slice(func_get_args(), 1);
            foreach ($this->callbacks[$event] as $callback) {
                call_user_func_array($callback, $args);
            }
        }
    }

    /**
     * Entry point for decoded JSON messages; hands them to routeMessage().
     *
     * @param array $data
     */
    function handleJson(array $data)
    {
        $this->routeMessage($data);
    }

    /**
     * Map one decoded message onto a handleMessage() call.
     *
     * @param array $data
     */
    abstract function routeMessage($data);

    /**
     * Fire the 'raw' event for the message, then one event for each known
     * top-level key present in it (currently only 'friends').
     *
     * @param array $data
     * @param mixed $forUserId passed to callbacks as their second argument
     */
    function handleMessage($data, $forUserId=null)
    {
        $this->fireEvent('raw', $data, $forUserId);
        $known = array('friends');
        foreach ($known as $key) {
            if (isset($data[$key])) {
                $this->fireEvent($key, $data[$key], $forUserId);
            }
        }
    }
}
|
||||||
|
|
||||||
|
/**
 * Stream reader for the multi-user site stream.
 */
class TwitterSiteStream extends TwitterStreamReader
{
    protected $userIds;

    public function __construct(TwitterOAuthClient $auth, $baseUrl='https://stream.twitter.com')
    {
        parent::__construct($auth, $baseUrl);
    }

    public function connect($method='2b/site.json')
    {
        return parent::connect($method);
    }

    /**
     * Remember the set of user IDs to follow.
     *
     * Note: the stored value is not used anywhere else in this class yet.
     *
     * @param mixed $userIds
     */
    function followUsers($userIds)
    {
        $this->userIds = $userIds;
    }

    /**
     * Each message in the site stream tells us which user ID it should be
     * routed to; we'll need that to let the caller know what to do.
     *
     * Data without a 'message' key is not wrapped that way; it is passed
     * on unchanged with no user ID instead of triggering undefined-index
     * notices and delivering null to the callbacks.
     *
     * @param array $data
     */
    function routeMessage($data)
    {
        if (isset($data['message'])) {
            $forUser = isset($data['for_user']) ? $data['for_user'] : null;
            parent::handleMessage($data['message'], $forUser);
        } else {
            parent::handleMessage($data, null);
        }
    }
}
|
||||||
|
|
||||||
|
/**
 * Stream reader for a single user's stream.
 */
class TwitterUserStream extends TwitterStreamReader
{
    /**
     * User ID reported to callbacks for every message on this stream.
     * Nothing in this class assigns it, so it stays null unless set by the
     * caller; declaring it avoids an undefined-property notice on every
     * message. Public so that callers can still assign it from outside.
     */
    public $userId = null;

    public function __construct(TwitterOAuthClient $auth, $baseUrl='https://userstream.twitter.com')
    {
        parent::__construct($auth, $baseUrl);
    }

    public function connect($method='2/user.json')
    {
        return parent::connect($method);
    }

    /**
     * Each message in the user stream is just ready to go.
     *
     * @param array $data
     */
    function routeMessage($data)
    {
        parent::handleMessage($data, $this->userId);
    }
}
|
Loading…
Reference in New Issue
Block a user