2009-04-22 11:09:27 +09:00
|
|
|
#!/usr/bin/env php
|
|
|
|
<?php
|
2009-06-18 04:31:35 +09:00
|
|
|
/**
|
2009-08-26 07:14:12 +09:00
|
|
|
* StatusNet - the distributed open-source microblogging tool
|
2010-02-04 10:53:08 +09:00
|
|
|
* Copyright (C) 2008-2010, StatusNet, Inc.
|
2009-04-22 11:09:27 +09:00
|
|
|
*
|
|
|
|
* This program is free software: you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU Affero General Public License as published by
|
|
|
|
* the Free Software Foundation, either version 3 of the License, or
|
|
|
|
* (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU Affero General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Affero General Public License
|
|
|
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
*/
|
|
|
|
|
2009-08-26 09:59:06 +09:00
|
|
|
// Root of the installation: three directory levels above this script.
define('INSTALLDIR', realpath(dirname(__FILE__) . '/../../..'));

// Tune number of processes and how often to poll Twitter
// XXX: Should these things be in config.php?
define('MAXCHILDREN', 2);    // passed to the daemon as its max_children
define('POLL_INTERVAL', 60); // in seconds

// Command line option specs and help text. These are presumably picked up
// by scripts/commandline.inc, which is required right after they are set
// -- confirm against that file.
$shortoptions = 'di::';
$longoptions = array('id::', 'debug');

$helptext = <<<END_OF_TRIM_HELP
Batch script for retrieving Twitter messages from foreign service.

-i --id Identity (default 'generic')
-d --debug Debug (lots of log output)

END_OF_TRIM_HELP;
|
2009-06-21 06:58:47 +09:00
|
|
|
|
2009-08-26 09:59:06 +09:00
|
|
|
require_once INSTALLDIR . '/scripts/commandline.inc';
|
2009-10-14 13:50:16 +09:00
|
|
|
require_once INSTALLDIR . '/lib/common.php';
|
2009-06-18 04:31:35 +09:00
|
|
|
require_once INSTALLDIR . '/lib/daemon.php';
|
2009-08-26 09:59:06 +09:00
|
|
|
require_once INSTALLDIR . '/plugins/TwitterBridge/twitter.php';
|
2009-06-18 04:31:35 +09:00
|
|
|
|
|
|
|
/**
 * Fetch statuses from Twitter
 *
 * For every Twitter foreign link that has notice receiving enabled, polls
 * the 'home_timeline' and 'mentions_timeline' and puts each retrieved status
 * on the 'tweetin' queue so it can be turned into a notice.
 *
 * NOTE: an Avatar path MUST be set in config.php for this
 * script to work, e.g.:
 *     $config['avatar']['path'] = $config['site']['path'] . '/avatar/';
 *
 * @todo @fixme @gar Fix the above. For some reason $_path is always empty when
 * this script is run, so the default avatar path is always set wrong in
 * default.php. Therefore it must be set explicitly in config.php. --Z
 *
 * @category Twitter
 * @package  StatusNet
 * @author   Zach Copley <zach@status.net>
 * @author   Evan Prodromou <evan@status.net>
 * @license  http://www.fsf.org/licensing/licenses/agpl-3.0.html GNU Affero General Public License version 3.0
 * @link     http://status.net/
 */
class TwitterStatusFetcher extends ParallelizingDaemon
{
    /**
     * Constructor
     *
     * All arguments are handed to the parent constructor unchanged.
     *
     * @param string  $id           the name/id of this daemon
     * @param int     $interval     sleep this long before doing everything again
     * @param int     $max_children maximum number of child processes at a time
     * @param boolean $debug        debug output flag
     *
     * @return void
     */
    function __construct($id = null, $interval = 60,
                         $max_children = 2, $debug = null)
    {
        parent::__construct($id, $interval, $max_children, $debug);
    }

    /**
     * Name of this daemon
     *
     * @return string Name of the daemon ('twitterstatusfetcher.' plus its id).
     */
    function name()
    {
        return ('twitterstatusfetcher.'.$this->_id);
    }

    /**
     * Find all the Twitter foreign links for users who have requested
     * importing of their friends' timelines
     *
     * Links are read ordered by last_noticesync; only those with the
     * FOREIGN_NOTICE_RECV bit set in noticesync are returned. The database
     * connection used for the query is closed and the cached DB_DataObject
     * connections are dropped before returning (presumably so that child
     * processes do not share this connection -- see childTask()).
     *
     * @return array flinks an array of Foreign_link objects
     */
    function getObjects()
    {
        global $_DB_DATAOBJECT;

        $flink = new Foreign_link();
        $conn = &$flink->getDatabaseConnection();

        $flink->service = TWITTER_SERVICE;
        $flink->orderBy('last_noticesync');
        $flink->find();

        $flinks = array();

        while ($flink->fetch()) {
            if (($flink->noticesync & FOREIGN_NOTICE_RECV) ==
                FOREIGN_NOTICE_RECV) {
                // fetch() reuses the same object for every row, so keep a copy
                $flinks[] = clone($flink);
                common_log(LOG_INFO, "sync: foreign id $flink->foreign_id");
            } else {
                common_log(LOG_INFO, "nothing to sync");
            }
        }

        $flink->free();
        unset($flink);

        $conn->disconnect();
        unset($_DB_DATAOBJECT['CONNECTIONS']);

        return $flinks;
    }

    /**
     * Work done for a single foreign link
     *
     * Fetches the home and mentions timelines for the link, stamps the
     * link, then tears down the database connection used for it.
     *
     * @param Foreign_link $flink the Twitter foreign link to process
     *
     * @return void
     */
    function childTask($flink) {
        // Each child ps needs its own DB connection

        // Note: DataObject::getDatabaseConnection() creates
        // a new connection if there isn't one already
        $conn = &$flink->getDatabaseConnection();

        $this->getTimeline($flink, 'home_timeline');
        $this->getTimeline($flink, 'mentions_timeline');

        // NOTE(review): this stamps last_friendsync although this daemon
        // syncs notices (getTimeline() stamps last_noticesync). Kept as-is;
        // confirm whether it is intentional.
        $flink->last_friendsync = common_sql_now();
        $flink->update();

        $conn->disconnect();

        // XXX: Couldn't find a less brutal way to blow
        // away a cached connection
        global $_DB_DATAOBJECT;
        unset($_DB_DATAOBJECT['CONNECTIONS']);
    }

    /**
     * Fetch one timeline for a foreign link and enqueue its statuses
     *
     * Statuses newer than the stored last ID are requested, enqueued on the
     * 'tweetin' queue in reverse order of the response, and the ID of the
     * first status in the response is stored as the new last ID. Nothing is
     * enqueued or recorded when the link is empty, when its credentials are
     * not a packed OAuth token, or when the timeline comes back empty or
     * the request throws.
     *
     * @param Foreign_link $flink       the Twitter foreign link to fetch for
     * @param string       $timelineUri timeline name, e.g. 'home_timeline'
     *                                  or 'mentions_timeline'
     *
     * @return void
     */
    function getTimeline($flink, $timelineUri = 'home_timeline')
    {
        if (empty($flink)) {
            // No link means no foreign ID to report either.
            common_log(LOG_ERR, $this->name() .
                       " - Can't retrieve " . $timelineUri .
                       ' timeline: no Foreign_link given.');
            return;
        }

        common_log(LOG_DEBUG, $this->name() . ' - Trying to get ' . $timelineUri .
                   ' timeline for Twitter user ' . $flink->foreign_id);

        if (!TwitterOAuthClient::isPackedToken($flink->credentials)) {
            // Without OAuth credentials there is no client to call; bail out
            // here instead of invoking a method on null further down.
            common_log(LOG_ERR, "Skipping " . $timelineUri . " timeline for " .
                       $flink->foreign_id . " since not OAuth.");
            return;
        }

        $token  = TwitterOAuthClient::unpackToken($flink->credentials);
        $client = new TwitterOAuthClient($token->key, $token->secret);
        common_log(LOG_DEBUG, $this->name() . ' - Grabbing ' . $timelineUri . ' timeline with OAuth.');

        $lastId = Twitter_synch_status::getLastId($flink->foreign_id, $timelineUri);

        common_log(LOG_DEBUG, "Got lastId value '" . $lastId . "' for foreign id '" .
                   $flink->foreign_id . "' and timeline '" . $timelineUri. "'");

        $timeline = null;

        try {
            $timeline = $client->statusesTimeline($lastId, $timelineUri);
        } catch (Exception $e) {
            // Logged and treated like an empty timeline below.
            common_log(LOG_ERR, $this->name() .
                       ' - Unable to get ' . $timelineUri . ' timeline for user ' . $flink->user_id .
                       ' - code: ' . $e->getCode() . ' - msg: ' . $e->getMessage());
        }

        if (empty($timeline)) {
            common_log(LOG_WARNING, $this->name() . " - Empty '" . $timelineUri . "' timeline.");
            return;
        }

        common_log(LOG_INFO, $this->name() .
                   ' - Retrieved ' . count($timeline) . ' statuses from ' . $timelineUri . ' timeline' .
                   ' - for user ' . $flink->user_id);

        $qm = QueueManager::get();

        // Reverse to preserve order
        foreach (array_reverse($timeline) as $status) {
            $data = array(
                'status' => $status,
                'for_user' => $flink->foreign_id,
            );
            $qm->enqueue($data, 'tweetin');
        }

        // The first entry of the (un-reversed) response becomes the new
        // starting point for the next poll.
        $lastId = twitter_id($timeline[0]);
        Twitter_synch_status::setLastId($flink->foreign_id, $timelineUri, $lastId);
        common_debug("Set lastId value '$lastId' for foreign id '{$flink->foreign_id}' and timeline '" .
                     $timelineUri . "'");

        // Okay, record the time we synced with Twitter for posterity
        $flink->last_noticesync = common_sql_now();
        $flink->update();
    }
}
|
2009-04-25 06:27:31 +09:00
|
|
|
|
2009-08-07 07:52:58 +09:00
|
|
|
// Daemon identity: -i, then --id, then the first positional argument.
// If none is given it stays null.
// ($args is not set in this file; presumably it comes from
// scripts/commandline.inc -- confirm.)
$id = null;

if (have_option('i')) {
    $id = get_option_value('i');
} else if (have_option('--id')) {
    $id = get_option_value('--id');
} else if (count($args) > 0) {
    $id = $args[0];
}

// Debug flag. The long id option above is looked up with its leading
// dashes ('--id'), so the long debug option is accepted in that form too;
// the original 'debug' spelling is still checked for compatibility.
$debug = null;

if (have_option('d') || have_option('debug') || have_option('--debug')) {
    $debug = true;
}

$fetcher = new TwitterStatusFetcher($id, POLL_INTERVAL, MAXCHILDREN, $debug);
$fetcher->runOnce();
|