4 * StatusNet - the distributed open-source microblogging tool
5 * Copyright (C) 2008-2010, StatusNet, Inc.
7 * This program is free software: you can redistribute it and/or modify
8 * it under the terms of the GNU Affero General Public License as published by
9 * the Free Software Foundation, either version 3 of the License, or
10 * (at your option) any later version.
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU Affero General Public License for more details.
17 * You should have received a copy of the GNU Affero General Public License
18 * along with this program. If not, see <http://www.gnu.org/licenses/>.
21 define('INSTALLDIR', realpath(dirname(__FILE__) . '/../../..'));
23 // Tune number of processes and how often to poll Twitter
24 // XXX: Should these things be in config.php?
25 define('MAXCHILDREN', 2);
26 define('POLL_INTERVAL', 60); // in seconds
28 $shortoptions = 'di::';
29 $longoptions = array('id::', 'debug');
31 $helptext = <<<END_OF_TRIM_HELP
32 Batch script for retrieving Twitter messages from foreign service.
34 -i --id Identity (default 'generic')
35 -d --debug Debug (lots of log output)
39 require_once INSTALLDIR . '/scripts/commandline.inc';
40 require_once INSTALLDIR . '/lib/common.php';
41 require_once INSTALLDIR . '/lib/daemon.php';
42 require_once INSTALLDIR . '/plugins/TwitterBridge/twitter.php';
43 require_once INSTALLDIR . '/plugins/TwitterBridge/twitterbasicauthclient.php';
44 require_once INSTALLDIR . '/plugins/TwitterBridge/twitteroauthclient.php';
47 * Fetch statuses from Twitter
49 * Fetches statuses from Twitter and inserts them as notices
51 * NOTE: an Avatar path MUST be set in config.php for this
52 * script to work, e.g.:
53 * $config['avatar']['path'] = $config['site']['path'] . '/avatar/';
55 * @todo @fixme @gar Fix the above. For some reason $_path is always empty when
56 * this script is run, so the default avatar path is always set wrong in
57 * default.php. Therefore it must be set explicitly in config.php. --Z
61 * @author Zach Copley <zach@status.net>
62 * @author Evan Prodromou <evan@status.net>
63 * @license http://www.fsf.org/licensing/licenses/agpl-3.0.html GNU Affero General Public License version 3.0
64 * @link http://status.net/
67 class TwitterStatusFetcher extends ParallelizingDaemon
72 * @param string $id the name/id of this daemon
73 * @param int $interval sleep this long before doing everything again
74 * @param int $max_children maximum number of child processes at a time
75 * @param boolean $debug debug output flag
80 function __construct($id = null, $interval = 60,
81 $max_children = 2, $debug = null)
83 parent::__construct($id, $interval, $max_children, $debug);
89 * @return string Name of the daemon.
94 return ('twitterstatusfetcher.'.$this->_id);
98 * Find all the Twitter foreign links for users who have requested
99 * importing of their friends' timelines
101 * @return array flinks an array of Foreign_link objects
104 function getObjects()
106 global $_DB_DATAOBJECT;
108 $flink = new Foreign_link();
109 $conn = &$flink->getDatabaseConnection();
111 $flink->service = TWITTER_SERVICE;
112 $flink->orderBy('last_noticesync');
117 while ($flink->fetch()) {
119 if (($flink->noticesync & FOREIGN_NOTICE_RECV) ==
120 FOREIGN_NOTICE_RECV) {
121 $flinks[] = clone($flink);
122 common_log(LOG_INFO, "sync: foreign id $flink->foreign_id");
124 common_log(LOG_INFO, "nothing to sync");
132 unset($_DB_DATAOBJECT['CONNECTIONS']);
137 function childTask($flink) {
139 // Each child ps needs its own DB connection
141 // Note: DataObject::getDatabaseConnection() creates
142 // a new connection if there isn't one already
144 $conn = &$flink->getDatabaseConnection();
146 $this->getTimeline($flink);
148 $flink->last_friendsync = common_sql_now();
153 // XXX: Couldn't find a less brutal way to blow
154 // away a cached connection
156 global $_DB_DATAOBJECT;
157 unset($_DB_DATAOBJECT['CONNECTIONS']);
/**
 * Import the friends timeline of one linked Twitter account.
 *
 * Chooses an OAuth or basic-auth Twitter client depending on the format
 * of the stored credentials, fetches the friends timeline and hands each
 * status to saveStatus(), iterating in reverse of the order in which
 * Twitter returned them. Statuses whose source contains this site's
 * configured integration source are skipped so that notices posted from
 * here are not imported back.
 *
 * @param Foreign_link $flink link between a local user and a Twitter account
 *
 * @return void
 */
function getTimeline($flink)
{
    if (empty($flink)) {
        // No link object means there is no foreign ID to report either.
        common_log(LOG_WARNING, $this->name() .
                   " - Can't retrieve Foreign_link.");
        return;
    }

    common_debug($this->name() . ' - Trying to get timeline for Twitter user ' .
                 $flink->foreign_id);

    // XXX: Biggest remaining issue - How do we know at which status
    // to start importing?  How many statuses?  Right now I'm going
    // with the default last 20.

    $client = null;

    if (TwitterOAuthClient::isPackedToken($flink->credentials)) {
        $token = TwitterOAuthClient::unpackToken($flink->credentials);
        $client = new TwitterOAuthClient($token->key, $token->secret);
        common_debug($this->name() . ' - Grabbing friends timeline with OAuth.');
    } else {
        $client = new TwitterBasicAuthClient($flink);
        common_debug($this->name() . ' - Grabbing friends timeline with basic auth.');
    }

    $timeline = null;

    try {
        $timeline = $client->statusesFriendsTimeline();
    } catch (Exception $e) {
        common_log(LOG_WARNING, $this->name() .
                   ' - Twitter client unable to get friends timeline for user ' .
                   $flink->user_id . ' - code: ' .
                   $e->getCode() . ' - msg: ' . $e->getMessage());
    }

    if (empty($timeline)) {
        common_log(LOG_WARNING, $this->name() . " - Empty timeline.");
        return;
    }

    common_debug($this->name() . ' - Retrieved ' . sizeof($timeline) . ' statuses from Twitter.');

    // Hacktastic: filter out stuff coming from this StatusNet.
    // The configured source does not change per status, so read it once.

    $source = mb_strtolower(common_config('integration', 'source'));

    // Reverse to preserve order

    foreach (array_reverse($timeline) as $status) {

        // Plain substring test: an empty source must not match every
        // status, and the setting must not be interpreted as a regex.

        if ($source !== '' &&
            mb_strpos(mb_strtolower($status->source), $source) !== false) {
            common_debug($this->name() . ' - Skipping import of status ' .
                         $status->id . ' with source ' . $source);
            continue;
        }

        $this->saveStatus($status, $flink);
    }

    // Okay, record the time we synced with Twitter for posterity

    $flink->last_noticesync = common_sql_now();
    $flink->update();
}
227 function saveStatus($status, $flink)
229 $profile = $this->ensureProfile($status->user);
231 if (empty($profile)) {
232 common_log(LOG_ERR, $this->name() .
233 ' - Problem saving notice. No associated Profile.');
237 $statusUri = 'http://twitter.com/'
238 . $status->user->screen_name
242 // check to see if we've already imported the status
244 $dupe = $this->checkDupe($profile, $statusUri);
250 " - Ignoring duplicate import: $statusUri"
255 $notice = new Notice();
257 $notice->profile_id = $profile->id;
258 $notice->uri = $statusUri;
259 $notice->url = $statusUri;
260 $notice->created = strftime(
262 strtotime($status->created_at)
265 $notice->source = 'twitter';
266 $notice->reply_to = null;
267 $notice->is_local = Notice::GATEWAY;
269 $notice->content = common_shorten_links($status->text);
270 $notice->rendered = common_render_content(
275 if (Event::handle('StartNoticeSave', array(&$notice))) {
277 $id = $notice->insert();
280 common_log_db_error($notice, 'INSERT', __FILE__);
281 common_log(LOG_ERR, $this->name() .
282 ' - Problem saving notice.');
285 Event::handle('EndNoticeSave', array($notice));
288 $orig = clone($notice);
289 $conv = Conversation::create();
291 $notice->conversation = $conv->id;
293 if (!$notice->update($orig)) {
294 common_log_db_error($notice, 'UPDATE', __FILE__);
295 common_log(LOG_ERR, $this->name() .
296 ' - Problem saving notice.');
299 Inbox::insertNotice($flink->user_id, $notice->id);
300 $notice->blowOnInsert();
306 * Look up a Profile by profileurl field. Profile::staticGet() was
307 * not working consistently.
309 * @param string $nickname local nickname of the Twitter user
310 * @param string $profileurl the profile url
312 * @return mixed value the first Profile with that url, or null
315 function getProfileByUrl($nickname, $profileurl)
317 $profile = new Profile();
318 $profile->nickname = $nickname;
319 $profile->profileurl = $profileurl;
322 if ($profile->find()) {
331 * Check to see if this Twitter status has already been imported
333 * @param Profile $profile Twitter user's local profile
334 * @param string $statusUri URI of the status on Twitter
336 * @return mixed value a matching Notice or null
339 function checkDupe($profile, $statusUri)
341 $notice = new Notice();
342 $notice->uri = $statusUri;
343 $notice->profile_id = $profile->id;
346 if ($notice->find()) {
/**
 * Return the local profile for a Twitter user, creating it if needed.
 *
 * An existing profile (looked up by screen name and Twitter profile URL)
 * only gets its avatar checked. Otherwise a Profile and, unless one with
 * that URI already exists, a Remote_profile are inserted between BEGIN
 * and COMMIT, and the user's avatars are saved afterwards.
 *
 * @param object $user Twitter user record; screen_name, name, url,
 *                     description and location are read here
 *
 * @return mixed the Profile, or false when an insert failed
 *               NOTE(review): the caller only tests the result with
 *               empty(), so any falsy failure value is compatible
 */
function ensureProfile($user)
{
    // check to see if there's already a profile for this user

    $profileurl = 'http://twitter.com/' . $user->screen_name;
    $profile = $this->getProfileByUrl($user->screen_name, $profileurl);

    if (!empty($profile)) {
        common_debug($this->name() .
                     " - Profile for $profile->nickname found.");

        // Check to see if the user's Avatar has changed

        $this->checkAvatar($user, $profile);

        return $profile;
    }

    common_debug($this->name() . ' - Adding profile and remote profile ' .
                 "for Twitter user: $profileurl.");

    $profile = new Profile();
    $profile->query("BEGIN");

    $profile->nickname = $user->screen_name;
    $profile->fullname = $user->name;
    $profile->homepage = $user->url;
    $profile->bio = $user->description;
    $profile->location = $user->location;
    $profile->profileurl = $profileurl;
    $profile->created = common_sql_now();

    // Initialise so the check below is well defined if insert() throws.
    $id = null;

    try {
        $id = $profile->insert();
    } catch (Exception $e) {
        common_log(LOG_WARNING, $this->name() . ' Couldn\'t insert profile - ' . $e->getMessage());
    }

    if (empty($id)) {
        common_log_db_error($profile, 'INSERT', __FILE__);
        $profile->query("ROLLBACK");
        return false;
    }

    // check for remote profile

    $remote_pro = Remote_profile::staticGet('uri', $profileurl);

    if (empty($remote_pro)) {

        $remote_pro = new Remote_profile();

        $remote_pro->id = $id;
        $remote_pro->uri = $profileurl;
        $remote_pro->created = common_sql_now();

        $rid = null;

        try {
            $rid = $remote_pro->insert();
        } catch (Exception $e) {
            common_log(LOG_WARNING, $this->name() . ' Couldn\'t save remote profile - ' . $e->getMessage());
        }

        if (empty($rid)) {
            // Report the object whose insert actually failed.
            common_log_db_error($remote_pro, 'INSERT', __FILE__);
            $profile->query("ROLLBACK");
            return false;
        }
    }

    $profile->query("COMMIT");

    $this->saveAvatars($user, $id);

    return $profile;
}
/**
 * Refresh a profile's avatars when they are out of date or incomplete.
 *
 * The expected local filename is derived from the Twitter user ID and the
 * basename of the user's profile image URL. Avatars are updated when that
 * name differs from the stored 48px avatar's filename (or there is no
 * stored 48px avatar), and again when missingAvatarFile() reports a
 * missing local file.
 *
 * @param object  $twitter_user Twitter user record (id, profile_image_url)
 * @param Profile $profile      local profile of that user
 *
 * @return void
 */
function checkAvatar($twitter_user, $profile)
{
    $path_parts = pathinfo($twitter_user->profile_image_url);

    $newname = 'Twitter_' . $twitter_user->id . '_' .
        $path_parts['basename'];

    // A profile may have no 48px avatar yet; treat that as "changed"
    // instead of dereferencing a missing object.
    $avatar  = $profile->getAvatar(48);
    $oldname = empty($avatar) ? null : $avatar->filename;

    if ($newname != $oldname) {
        common_debug($this->name() . ' - Avatar for Twitter user ' .
                     "$profile->nickname has changed.");
        common_debug($this->name() . " - old: $oldname new: $newname");

        $this->updateAvatars($twitter_user, $profile);
    }

    if ($this->missingAvatarFile($profile)) {
        common_debug($this->name() . ' - Twitter user ' .
                     $profile->nickname .
                     ' is missing one or more local avatars.');
        common_debug($this->name() ." - old: $oldname new: $newname");

        $this->updateAvatars($twitter_user, $profile);
    }
}
/**
 * Replace all three Twitter-sized avatars (mini, normal, bigger) of a profile.
 *
 * The profile image URL is assumed to end in "_normal.<ext>", the same
 * naming saveAvatars() relies on; that suffix is stripped to obtain the
 * image root from which the per-size URLs and local filenames are built.
 *
 * @param object  $twitter_user Twitter user record (id, profile_image_url)
 * @param Profile $profile      local profile whose avatars are replaced
 *
 * @return void
 */
function updateAvatars($twitter_user, $profile) {

    $path_parts = pathinfo($twitter_user->profile_image_url);

    $ext = $path_parts['extension'];

    // Derive the suffix length from the real extension rather than
    // assuming three characters, so ".jpeg" and similar work too.
    $img_root = substr($path_parts['basename'], 0,
                       -strlen('_normal.' . $ext));
    $mediatype = $this->getMediatype($ext);

    foreach (array('mini', 'normal', 'bigger') as $size) {
        $url = $path_parts['dirname'] . '/' .
            $img_root . '_' . $size . ".$ext";
        $filename = 'Twitter_' . $twitter_user->id . '_' .
            $img_root . "_$size.$ext";

        $this->updateAvatar($profile->id, $size, $mediatype, $filename);
        $this->fetchAvatar($url, $filename);
    }
}
/**
 * Tell whether any of the profile's 24, 48 or 73 pixel avatars lacks
 * its local image file.
 *
 * A size for which the profile has no avatar at all is reported as
 * missing too, instead of dereferencing a non-existent object.
 *
 * @param Profile $profile profile to inspect
 *
 * @return boolean true if at least one avatar or avatar file is missing
 */
function missingAvatarFile($profile) {
    foreach (array(24, 48, 73) as $size) {
        $avatar = $profile->getAvatar($size);

        if (empty($avatar) || !file_exists(Avatar::path($avatar->filename))) {
            return true;
        }
    }

    return false;
}
/**
 * Map an image file extension to a media type.
 *
 * The comparison is case-insensitive. Both "jpg" and "jpeg" map to the
 * registered type image/jpeg; anything unrecognised falls back to
 * image/png.
 *
 * @param string $ext file extension without the leading dot
 *
 * @return string media type for the extension
 */
function getMediatype($ext)
{
    $mediatype = null;

    switch (strtolower($ext)) {
    case 'jpg':
    case 'jpeg':
        $mediatype = 'image/jpeg';
        break;
    case 'gif':
        $mediatype = 'image/gif';
        break;
    default:
        $mediatype = 'image/png';
    }

    return $mediatype;
}
/**
 * Download and register the three Twitter-sized avatars for a new profile.
 *
 * The "_normal.<ext>" suffix is stripped from the profile image basename
 * to obtain the image root; each size (mini, normal, bigger) is then
 * fetched and, only if the download succeeded, recorded via newAvatar().
 *
 * @param object $user Twitter user record (id, profile_image_url)
 * @param int    $id   ID of the local profile the avatars belong to
 *
 * @return void
 */
function saveAvatars($user, $id)
{
    $path_parts = pathinfo($user->profile_image_url);
    $ext = $path_parts['extension'];
    $img_root = substr($path_parts['basename'], 0,
                       -strlen('_normal.' . $ext));
    $mediatype = $this->getMediatype($ext);

    foreach (array('mini', 'normal', 'bigger') as $size) {
        $url = $path_parts['dirname'] . '/' .
            $img_root . '_' . $size . ".$ext";
        $filename = 'Twitter_' . $user->id . '_' .
            $img_root . "_$size.$ext";

        if ($this->fetchAvatar($url, $filename)) {
            $this->newAvatar($id, $size, $mediatype, $filename);
        } else {
            // $id is a profile ID, not a callable: prefix the message
            // with the daemon name like every other log line here.
            common_log(LOG_WARNING, $this->name() .
                       " - Problem fetching Avatar: $url");
        }
    }
}
535 function updateAvatar($profile_id, $size, $mediatype, $filename) {
537 common_debug($this->name() . " - Updating avatar: $size");
539 $profile = Profile::staticGet($profile_id);
541 if (empty($profile)) {
542 common_debug($this->name() . " - Couldn't get profile: $profile_id!");
546 $sizes = array('mini' => 24, 'normal' => 48, 'bigger' => 73);
547 $avatar = $profile->getAvatar($sizes[$size]);
549 // Delete the avatar, if present
555 $this->newAvatar($profile->id, $size, $mediatype, $filename);
558 function newAvatar($profile_id, $size, $mediatype, $filename)
562 $avatar = new Avatar();
563 $avatar->profile_id = $profile_id;
568 $avatar->height = 24;
572 $avatar->height = 48;
576 // Note: Twitter's big avatars are a different size than
577 // StatusNet's (StatusNet's = 96)
580 $avatar->height = 73;
583 $avatar->original = 0; // we don't have the original
584 $avatar->mediatype = $mediatype;
585 $avatar->filename = $filename;
586 $avatar->url = Avatar::url($filename);
588 $avatar->created = common_sql_now();
591 $id = $avatar->insert();
592 } catch (Exception $e) {
593 common_log(LOG_WARNING, $this->name() . ' Couldn\'t insert avatar - ' . $e->getMessage());
597 common_log_db_error($avatar, 'INSERT', __FILE__);
601 common_debug($this->name() .
602 " - Saved new $size avatar for $profile_id.");
/**
 * Download an avatar image over HTTP and store it in the avatar directory.
 *
 * @param string $url      where to download the avatar from
 * @param string $filename bare filename; the storage path is resolved
 *                         through Avatar::path()
 *
 * @return bool true when the image was written, false when the HTTP
 *              response was not OK or nothing could be written
 */
function fetchAvatar($url, $filename)
{
    common_debug($this->name() . " - Fetching Twitter avatar: $url");

    $response = HTTPClient::start()->get($url);

    if (!$response->isOk()) {
        return false;
    }

    $written = file_put_contents(Avatar::path($filename),
                                 $response->getBody());

    if ($written) {
        return true;
    }

    common_log(LOG_WARNING, $this->name() .
               " - Couldn't open file $filename");

    return false;
}
639 if (have_option('i')) {
640 $id = get_option_value('i');
641 } else if (have_option('--id')) {
642 $id = get_option_value('--id');
643 } else if (count($args) > 0) {
649 if (have_option('d') || have_option('debug')) {
653 $fetcher = new TwitterStatusFetcher($id, 60, 2, $debug);