123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313 |
- #!/usr/bin/env php
- <?php
- /*
- * StatusNet - the distributed open-source microblogging tool
- * Copyright (C) 2008-2010, StatusNet, Inc.
- *
- * This program is free software: you can redistribute it and/or modify
- * it under the terms of the GNU Affero General Public License as published by
- * the Free Software Foundation, either version 3 of the License, or
- * (at your option) any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU Affero General Public License for more details.
- *
- * You should have received a copy of the GNU Affero General Public License
- * along with this program. If not, see <http://www.gnu.org/licenses/>.
- */
// Installation root: three directory levels above the directory holding this script.
define('INSTALLDIR', realpath(dirname(__FILE__) . '/../../..'));

// Command-line option specs and usage text. They are set before the include
// below; presumably commandline.inc reads them -- confirm against that file.
$longoptions = array('id::', 'foreground', 'all');
$shortoptions = 'fi::a';

$helptext = <<<END_OF_TWITTERDAEMON_HELP
Daemon script for receiving new notices from Twitter users.
-i --id Identity (default none)
-a --all Handle Twitter for all local sites
(requires Stomp queue handler, status_network setup)
-f --foreground Stay in the foreground (default background)
END_OF_TWITTERDAEMON_HELP;

require_once INSTALLDIR . '/scripts/commandline.inc';
/**
 * Daemon wrapper around a single TwitterMaster i/o loop.
 *
 * Only single-threaded operation is accepted; any other thread count is
 * rejected at construction time.
 */
class TwitterDaemon extends SpawningDaemon
{
    /** Flag forwarded to TwitterMaster::init() when the thread runs. */
    protected $allsites = false;

    /**
     * @param mixed   $id        passed through to the parent constructor
     * @param boolean $daemonize passed through to the parent constructor
     * @param int     $threads   must equal 1
     * @param boolean $allsites  stored and later handed to TwitterMaster::init()
     *
     * @throws Exception when $threads is not 1
     */
    public function __construct($id=null, $daemonize=true, $threads=1, $allsites=false)
    {
        $singleThreaded = ($threads == 1);
        if (!$singleThreaded) {
            // Not expected to happen: the launcher always asks for one thread.
            throw new Exception("TwitterDaemon must run single-threaded");
        }

        parent::__construct($id, $daemonize, $threads);
        $this->allsites = $allsites;
    }

    /**
     * Build a TwitterMaster, initialize it, and run its service loop.
     *
     * @return mixed self::EXIT_RESTART when the master's respawn flag is set,
     *               otherwise self::EXIT_SHUTDOWN
     */
    public function runThread()
    {
        common_log(LOG_INFO, 'Waiting to listen to Twitter and queues');

        $ioMaster = new TwitterMaster($this->get_id(), $this->processManager());
        $ioMaster->init($this->allsites);
        $ioMaster->service();

        common_log(LOG_INFO, 'terminating normally');

        if ($ioMaster->respawn) {
            return self::EXIT_RESTART;
        }
        return self::EXIT_SHUTDOWN;
    }
}
/**
 * IoMaster that wires up the managers this daemon needs: the queue manager
 * (restricted to the 'twitter' group), a TwitterManager, and the process
 * manager handed in by the daemon.
 */
class TwitterMaster extends IoMaster
{
    /** Process manager supplied by the owning daemon. */
    protected $processManager;

    /**
     * @param mixed $id             passed through to the parent constructor
     * @param mixed $processManager manager registered last in initManagers()
     */
    public function __construct($id, $processManager)
    {
        parent::__construct($id);
        $this->processManager = $processManager;
    }

    /**
     * Register the IoManagers for the currently configured site
     * that apply to this instance.
     */
    public function initManagers()
    {
        // Queue manager first, limited to the 'twitter' group.
        $queueManager = QueueManager::get();
        $queueManager->setActiveGroup('twitter');
        $this->instantiate($queueManager);

        // Then the stream manager, created only after the queue manager is registered.
        $twitterManager = new TwitterManager();
        $this->instantiate($twitterManager);

        // Finally the daemon's process manager.
        $this->instantiate($this->processManager);
    }
}
/**
 * I/O manager for Twitter Site Streams connections.
 *
 * Builds one stream per chunk of importing users, exposes the streams'
 * sockets for i/o monitoring, hands readable sockets back to the owning
 * stream, and pushes incoming statuses onto the 'tweetin' queue.
 */
class TwitterManager extends IoManager
{
    // Recommended resource limits from http://dev.twitter.com/pages/site_streams
    // Only USERS_PER_STREAM is referenced in this class; the other two are not
    // enforced here.
    const MAX_STREAMS = 1000;
    const USERS_PER_STREAM = 100;
    const STREAMS_PER_SECOND = 20;

    /**
     * Active stream objects. Initialized to an empty array so the foreach
     * loops below are safe even when no stream has been spawned.
     */
    protected $streams = array();

    /** Map of Twitter-side user ID => stream object following that user. */
    protected $users = array();

    /**
     * Pull the site's active Twitter-importing users and prepare data
     * streams for them, at most USERS_PER_STREAM users per stream.
     *
     * Users are the Foreign_link rows for TWITTER_SERVICE whose noticesync
     * field has the FOREIGN_NOTICE_RECV bits set.
     *
     * @fixme check their last-id and check whether we'll need to do a manual pull.
     * @fixme abstract out the fetching so we can work over multiple sites.
     */
    protected function initStreams()
    {
        common_log(LOG_INFO, 'init...');

        // Pull Twitter user IDs for all users we want to pull data for
        $flink = new Foreign_link();
        $flink->service = TWITTER_SERVICE;
        // @fixme probably should do the bitfield check in a whereAdd but it's ugly :D
        $flink->find();

        $userIds = array();
        while ($flink->fetch()) {
            $wantsImport = (($flink->noticesync & FOREIGN_NOTICE_RECV) == FOREIGN_NOTICE_RECV);
            if (!$wantsImport) {
                continue;
            }

            $userIds[] = $flink->foreign_id;
            if (count($userIds) >= self::USERS_PER_STREAM) {
                // Chunk is full: hand it to a stream and start a new chunk.
                $this->spawnStream($userIds);
                $userIds = array();
            }
        }

        // Leftover partial chunk, if any.
        if (count($userIds)) {
            $this->spawnStream($userIds);
        }
    }

    /**
     * Prepare a Site Stream connection for the given chunk of users.
     * The actual connection will be opened later.
     *
     * @param array $userIds Twitter-side user IDs
     */
    protected function spawnStream($userIds)
    {
        $stream = $this->initSiteStream();
        $stream->followUsers($userIds);

        // Slip the stream reader into our list of active streams.
        // We'll manage its actual connection on the next go-around.
        $this->streams[] = $stream;

        // Record the user->stream mappings; this makes it easier for us to know
        // later if we need to kill something.
        foreach ($userIds as $id) {
            $this->users[$id] = $stream;
        }
    }

    /**
     * Initialize a generic site streams connection object with our event
     * handlers attached. Users are added to it by the caller.
     *
     * @return TwitterSiteStream
     */
    protected function initSiteStream()
    {
        $auth = $this->siteStreamAuth();
        $stream = new TwitterSiteStream($auth);

        // Add our event handler callbacks.
        $this->setupEvents($stream);
        return $stream;
    }

    /**
     * Fetch the Twitter OAuth credentials to use to connect to the Site Streams API.
     *
     * This will use the locally-stored credentials for the application's owner account
     * from the site configuration ('twitter' section, 'stream_token' and
     * 'stream_secret'). These should be configured through the administration
     * panels or manually in the config file.
     *
     * Will throw an exception if no credentials can be found -- but beware that invalid
     * credentials won't cause breakage until later.
     *
     * @return TwitterOAuthClient
     * @throws ServerException if either credential is empty
     */
    protected function siteStreamAuth()
    {
        $token = common_config('twitter', 'stream_token');
        $secret = common_config('twitter', 'stream_secret');
        if (empty($token) || empty($secret)) {
            throw new ServerException('Twitter site streams have not been correctly configured. Configure the app owner account via the admin panel.');
        }
        return new TwitterOAuthClient($token, $secret);
    }

    /**
     * Collect the sockets for all active connections for i/o monitoring.
     *
     * @return array of resources (empty when there are no streams)
     */
    public function getSockets()
    {
        $sockets = array();
        foreach ($this->streams as $stream) {
            foreach ($stream->getSockets() as $socket) {
                $sockets[] = $socket;
            }
        }
        return $sockets;
    }

    /**
     * Input is ready on one of our sockets: pass it to the stream that owns it.
     * @fixme is there an easier way to map from socket back to owning module? :(
     *
     * @param resource $socket
     * @return boolean always true
     */
    public function handleInput($socket)
    {
        foreach ($this->streams as $stream) {
            // Strict comparison so the socket is matched by identity, not by loose equality.
            if (in_array($socket, $stream->getSockets(), true)) {
                $stream->handleInput($socket);
            }
        }
        return true;
    }

    /**
     * Start the i/o system up! Prepare our connections and start opening them.
     *
     * @fixme do some rate-limiting on the stream setup
     * @fixme do some sensible backoff on failure etc
     *
     * @return boolean always true
     */
    public function start()
    {
        $this->initStreams();
        foreach ($this->streams as $stream) {
            $stream->connect();
        }
        return true;
    }

    /**
     * Close down our connections when the daemon wraps up for business.
     *
     * @return boolean always true
     */
    public function finish()
    {
        foreach ($this->streams as $index => $stream) {
            $stream->close();
            unset($this->streams[$index]);
        }
        // Drop the user->stream map too, so it does not keep closed streams alive.
        $this->users = array();
        return true;
    }

    /**
     * This manager is created directly with new, not fetched as a singleton.
     *
     * @throws Exception always
     */
    public static function get()
    {
        throw new Exception('not a singleton');
    }

    /**
     * Set up event handlers on the streaming interface. Each event name maps
     * to the method 'onTwitter' + ucfirst(event) on this object.
     *
     * @fixme add more event types as we add handling for them
     *
     * @param TwitterStreamReader $stream
     */
    protected function setupEvents(TwitterStreamReader $stream)
    {
        $handlers = array(
            'status',
        );
        foreach ($handlers as $event) {
            $stream->hookEvent($event, array($this, 'onTwitter' . ucfirst($event)));
        }
    }

    /**
     * Event callback notifying that a user has a new message in their home timeline.
     * We store the incoming message into the queues for processing, keeping our own
     * daemon running as fast as possible.
     *
     * Public because it is registered in setupEvents() as a callback on the
     * stream object; a callback invoked from another class cannot reach a
     * protected method.
     *
     * @param object $status  JSON data: Twitter status update
     * @param object $context event context; its for_user property is queued
     *                        alongside the status
     * @fixme in all-sites mode we may need to route queue items into another site's
     * destination queues, or multiple sites.
     */
    public function onTwitterStatus($status, $context)
    {
        $data = array(
            'status' => $status,
            'for_user' => $context->for_user,
        );
        $qm = QueueManager::get();
        $qm->enqueue($data, 'tweetin');
    }
}
// Daemon identity: an explicit -i/--id option wins, then the first positional
// argument, otherwise none.
$id = null;
if (have_option('i', 'id')) {
    $id = get_option_value('i', 'id');
} elseif (count($args) > 0) {
    $id = $args[0];
}

// NOTE(review): the long form is passed here as a separate call with its
// leading dashes, unlike the ('f', 'foreground') form below -- confirm that
// have_option() accepts both spellings.
$all = have_option('a') || have_option('--all');
$foreground = have_option('f', 'foreground');

// Run in the background unless -f/--foreground was given; always one thread.
$daemonize = !$foreground;
$daemon = new TwitterDaemon($id, $daemonize, 1, $all);
$daemon->runOnce();
|