123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241 |
- #!/usr/bin/env php
- <?php
- /**
- * StatusNet - the distributed open-source microblogging tool
- * Copyright (C) 2008-2010, StatusNet, Inc.
- *
- * This program is free software: you can redistribute it and/or modify
- * it under the terms of the GNU Affero General Public License as published by
- * the Free Software Foundation, either version 3 of the License, or
- * (at your option) any later version.
- *
- * This program is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- * GNU Affero General Public License for more details.
- *
- * You should have received a copy of the GNU Affero General Public License
- * along with this program. If not, see <http://www.gnu.org/licenses/>.
- */
// Command-line option specification consumed by scripts/commandline.inc.
$shortoptions = 'di::';
$longoptions = array('id::', 'debug');

$helptext = <<<END_OF_TRIM_HELP
Batch script for retrieving Twitter messages from foreign service.
-i --id Identity (default 'generic')
-d --debug Debug (lots of log output)
END_OF_TRIM_HELP;

// Installation root: three directory levels above the directory of this script.
define('INSTALLDIR', realpath(__DIR__ . '/../../..'));

// Tune number of processes and how often to poll Twitter
// XXX: Should these things be in config.php?
define('MAXCHILDREN', 2);
define('POLL_INTERVAL', 70); // in seconds, Twitter API v1.1 says 15 calls every 15 mins
- require_once INSTALLDIR . '/scripts/commandline.inc';
- require_once INSTALLDIR . '/lib/common.php';
- require_once INSTALLDIR . '/lib/daemon.php';
- require_once dirname(__DIR__) . '/twitter.php';
/**
 * Fetch statuses from Twitter
 *
 * Fetches statuses from Twitter for every Twitter Foreign_link that has
 * notice receiving enabled, and hands each status to the 'tweetin' queue.
 *
 * NOTE: an Avatar path MUST be set in config.php for this
 * script to work, e.g.:
 *     $config['avatar']['path'] = $config['site']['path'] . '/avatar/';
 *
 * @todo @fixme @gar Fix the above. For some reason $_path is always empty when
 * this script is run, so the default avatar path is always set wrong in
 * default.php. Therefore it must be set explicitly in config.php. --Z
 *
 * @category Twitter
 * @package  StatusNet
 * @author   Zach Copley <zach@status.net>
 * @author   Evan Prodromou <evan@status.net>
 * @license  http://www.fsf.org/licensing/licenses/agpl-3.0.html GNU Affero General Public License version 3.0
 * @link     http://status.net/
 */
class TwitterStatusFetcher extends ParallelizingDaemon
{
    /**
     * Constructor
     *
     * Passes every argument straight through to the parent daemon.
     *
     * @param string  $id           the name/id of this daemon
     * @param int     $interval     sleep this long before doing everything again
     * @param int     $max_children maximum number of child processes at a time
     * @param boolean $debug        debug output flag
     *
     * @return void
     */
    public function __construct($id = null, $interval = 60,
                                $max_children = 2, $debug = null)
    {
        parent::__construct($id, $interval, $max_children, $debug);
    }

    /**
     * Name of this daemon
     *
     * @return string Name of the daemon: 'twitterstatusfetcher.' followed by its id.
     */
    public function name()
    {
        return ('twitterstatusfetcher.'.$this->_id);
    }

    /**
     * Find all the Twitter foreign links for users who have requested
     * importing of their friends' timelines
     *
     * Links are read ordered by last_noticesync; only those whose noticesync
     * field has the FOREIGN_NOTICE_RECV bit set are returned. The database
     * connection used for the query is disconnected and the DB_DataObject
     * connection cache is cleared before returning.
     *
     * @return array flinks an array of Foreign_link objects
     */
    public function getObjects()
    {
        global $_DB_DATAOBJECT;

        $flink = new Foreign_link();
        $conn = &$flink->getDatabaseConnection();

        $flink->service = TWITTER_SERVICE;
        $flink->orderBy('last_noticesync');
        $flink->find();

        $flinks = array();

        while ($flink->fetch()) {
            if (($flink->noticesync & FOREIGN_NOTICE_RECV) ==
                FOREIGN_NOTICE_RECV) {
                // fetch() reuses the same object for every row, so keep a copy
                $flinks[] = clone $flink;
                common_log(LOG_INFO, "sync: foreign id $flink->foreign_id");
            } else {
                common_log(LOG_INFO, "nothing to sync");
            }
        }

        $flink->free();
        unset($flink);

        $conn->disconnect();
        unset($_DB_DATAOBJECT['CONNECTIONS']);

        return $flinks;
    }

    /**
     * Work done for a single Foreign_link
     *
     * Fetches the home and mentions timelines for the link, stamps the
     * link with the current time and tears down the database connection.
     *
     * @param Foreign_link $flink the Twitter foreign link to process
     *
     * @return void
     */
    public function childTask($flink)
    {
        // Each child ps needs its own DB connection

        // Note: DataObject::getDatabaseConnection() creates
        // a new connection if there isn't one already
        $conn = &$flink->getDatabaseConnection();

        $this->getTimeline($flink, 'home_timeline');
        $this->getTimeline($flink, 'mentions_timeline');

        // NOTE(review): this stamps last_friendsync, while getTimeline()
        // stamps last_noticesync - confirm that last_friendsync is intended.
        $flink->last_friendsync = common_sql_now();
        $flink->update();

        $conn->disconnect();

        // XXX: Couldn't find a less brutal way to blow
        // away a cached connection
        global $_DB_DATAOBJECT;
        unset($_DB_DATAOBJECT['CONNECTIONS']);
    }

    /**
     * Fetch one timeline for a foreign link and enqueue its statuses
     *
     * Statuses newer than the last recorded ID for this foreign ID and
     * timeline are requested, enqueued oldest-first on the 'tweetin' queue,
     * and the ID of the first status in the response is then recorded as
     * the new last ID. Links whose credentials are not a packed OAuth token
     * are skipped. Request failures are logged and treated like an empty
     * timeline.
     *
     * @param Foreign_link $flink       the Twitter foreign link to fetch for
     * @param string       $timelineUri timeline name, e.g. 'home_timeline'
     *                                  or 'mentions_timeline'
     *
     * @return void
     */
    public function getTimeline($flink, $timelineUri = 'home_timeline')
    {
        if (empty($flink)) {
            common_log(LOG_ERR, $this->name() .
                       " - Can't retrieve Foreign_link; skipping " . $timelineUri . " timeline");
            return;
        }

        common_log(LOG_DEBUG, $this->name() . ' - Trying to get ' . $timelineUri .
                   ' timeline for Twitter user ' . $flink->foreign_id);

        if (!TwitterOAuthClient::isPackedToken($flink->credentials)) {
            common_log(LOG_ERR, "Skipping " . $timelineUri . " timeline for " .
                       $flink->foreign_id . " since not OAuth.");
            // Without OAuth credentials there is no client to query with
            return;
        }

        $token = TwitterOAuthClient::unpackToken($flink->credentials);
        $client = new TwitterOAuthClient($token->key, $token->secret);
        common_log(LOG_DEBUG, $this->name() . ' - Grabbing ' . $timelineUri . ' timeline with OAuth.');

        $lastId = Twitter_synch_status::getLastId($flink->foreign_id, $timelineUri);

        common_log(LOG_DEBUG, "Got lastId value '" . $lastId . "' for foreign id '" .
                   $flink->foreign_id . "' and timeline '" . $timelineUri. "'");

        $timeline = null;

        try {
            $timeline = $client->statusesTimeline($lastId, $timelineUri);
        } catch (Exception $e) {
            // Leave $timeline empty so the check below ends this run
            common_log(LOG_ERR, $this->name() .
                       ' - Unable to get ' . $timelineUri . ' timeline for user ' . $flink->user_id .
                       ' - code: ' . $e->getCode() . ' msg: ' . $e->getMessage());
        }

        if (empty($timeline)) {
            common_log(LOG_DEBUG, $this->name() . " - Empty '" . $timelineUri . "' timeline.");
            return;
        }

        common_log(LOG_INFO, $this->name() .
                   ' - Retrieved ' . count($timeline) . ' statuses from ' . $timelineUri . ' timeline' .
                   ' - for user ' . $flink->user_id);

        $qm = QueueManager::get();

        // Reverse to preserve order
        foreach (array_reverse($timeline) as $status) {
            $data = array(
                'status' => $status,
                'for_user' => $flink->foreign_id,
            );
            $qm->enqueue($data, 'tweetin');
        }

        // The first element of the response becomes the new high-water mark
        $lastId = twitter_id($timeline[0]);
        Twitter_synch_status::setLastId($flink->foreign_id, $timelineUri, $lastId);
        common_debug("Set lastId value '$lastId' for foreign id '{$flink->foreign_id}' and timeline '" .
                     $timelineUri . "'");

        // Okay, record the time we synced with Twitter for posterity
        $flink->last_noticesync = common_sql_now();
        $flink->update();
    }
}
// Resolve the daemon identity: -i, then --id, then the first positional
// argument; otherwise it stays null.
$id = null;
$debug = null;

if (have_option('i')) {
    $id = get_option_value('i');
} elseif (have_option('--id')) {
    $id = get_option_value('--id');
} elseif (count($args) > 0) {
    $id = $args[0];
}

// The long id option above is looked up with its leading dashes ('--id'),
// so look the long debug option up the same way. The bare 'debug' lookup
// is kept so anything that matched before still matches.
if (have_option('d') || have_option('debug') || have_option('--debug')) {
    $debug = true;
}

// Run a single fetch pass using the tuning constants defined in this script.
$fetcher = new TwitterStatusFetcher($id, POLL_INTERVAL, MAXCHILDREN, $debug);
$fetcher->runOnce();
|