4 * Laconica - a distributed open-source microblogging tool
5 * Copyright (C) 2008, Controlez-Vous, Inc.
7 * This program is free software: you can redistribute it and/or modify
8 * it under the terms of the GNU Affero General Public License as published by
9 * the Free Software Foundation, either version 3 of the License, or
10 * (at your option) any later version.
12 * This program is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU Affero General Public License for more details.
17 * You should have received a copy of the GNU Affero General Public License
18 * along with this program. If not, see <http://www.gnu.org/licenses/>.
// Command-line bootstrap: refuse to run under a web server, define the
// install root and tuning constants, then load the shared libraries.
21 // Abort if called from a web server
// REQUEST_METHOD being present in $_SERVER is used as the sign that a
// web request is being served.
22 if (isset($_SERVER) && array_key_exists('REQUEST_METHOD', $_SERVER)) {
23 print "This script must be run from the command line\n";
// NOTE(review): the remainder of this guard (presumably an exit) is not
// visible in this extract - confirm the script really stops here.
// INSTALLDIR is the parent directory of the directory holding this file.
27 define('INSTALLDIR', realpath(dirname(__FILE__) . '/..'));
28 define('LACONICA', true);
30 // Tune number of processes and how often to poll Twitter
31 // XXX: Should these things be in config.php?
// MAXCHILDREN is compared against the number of tracked child PIDs;
// POLL_INTERVAL is passed to sleep() between polling rounds.
32 define('MAXCHILDREN', 2);
33 define('POLL_INTERVAL', 60); // in seconds
// NOTE(review): the define below is active, so debug logging is already
// on; the code only tests defined('SCRIPT_DEBUG'), so it must be commented
// out (not set to false) to turn the logging off.
35 // Uncomment this to get useful logging
36 define('SCRIPT_DEBUG', true);
38 require_once(INSTALLDIR . '/lib/common.php');
39 require_once(INSTALLDIR . '/lib/daemon.php');
// Daemon subclass that imports Twitter timelines, using one forked child
// process per linked account.
41 class TwitterStatusFetcher extends Daemon
// PIDs of forked children that have not been reaped yet; the parent
// appends after forking and remove_ps() drops entries as children finish.
44 private $children = array();
// NOTE(review): the header of the method this return belongs to is not
// visible in this extract; the string looks like the daemon's identifier.
48 return ('twitterstatusfetcher.generic');
// Main polling cycle.
// NOTE(review): the enclosing method header, the loop construct around
// this cycle and the fork call itself are not visible in this extract;
// the comments below describe only the statements that are shown.
55 $flinks = $this->refreshFlinks();
// Each Foreign_link returned above is handled in turn; the debug message
// and die() below show that a process is forked for each one.
57 foreach ($flinks as $f){
59 // We have to disconnect from the DB before forking so
60 // each sub-process will open its own connection and
61 // avoid stomping on the others
63 $conn = &$f->getDatabaseConnection();
69 die ("Couldn't fork!");
75 if (defined('SCRIPT_DEBUG')) {
76 common_debug("Parent: forked new status fetcher process " . $pid);
// Remember the child's PID so it can be matched when it is reaped.
79 $this->children[] = $pid;
// The timeline import for this link (presumably the child-side branch).
84 $this->getTimeline($f);
88 // Remove child from ps list as it finishes
// NOTE(review): `OR` is PHP's logical operator, so the options argument
// here is boolean true rather than the two flags combined bitwise;
// `WNOHANG | WUNTRACED` was presumably intended.
89 while(($c = pcntl_wait($status, WNOHANG OR WUNTRACED)) > 0) {
91 if (defined('SCRIPT_DEBUG')) {
92 common_debug("Child $c finished.");
95 $this->remove_ps($this->children, $c);
98 // Wait! We have too many damn kids.
// NOTE(review): with `>` the list can reach MAXCHILDREN + 1 entries
// before the parent blocks; confirm whether `>=` was intended.
99 if (sizeof($this->children) > MAXCHILDREN) {
101 if (defined('SCRIPT_DEBUG')) {
102 common_debug('Too many children. Waiting...');
// Without WNOHANG this wait blocks until some child changes state.
105 if (($c = pcntl_wait($status, WUNTRACED)) > 0){
107 if (defined('SCRIPT_DEBUG')) {
108 common_debug("Finished waiting for $c");
111 $this->remove_ps($this->children, $c);
116 // Remove all children from the process list before restarting
// Blocking waits are repeated until pcntl_wait() stops returning a PID.
117 while(($c = pcntl_wait($status, WUNTRACED)) > 0) {
119 if (defined('SCRIPT_DEBUG')) {
120 common_debug("Child $c finished.");
123 $this->remove_ps($this->children, $c);
126 // Rest for a bit before we fetch more statuses
128 if (defined('SCRIPT_DEBUG')) {
129 common_debug('Waiting ' . POLL_INTERVAL .
130 ' secs before hitting Twitter again.');
// A POLL_INTERVAL of zero or less skips the pause entirely.
133 if (POLL_INTERVAL > 0) {
134 sleep(POLL_INTERVAL);
/**
 * Collect the Foreign_link rows whose notices should be imported.
 *
 * Queries Foreign_link rows with service = 1, ordered by last_noticesync,
 * and gathers a clone of every row whose noticesync field has the
 * FOREIGN_NOTICE_RECV bit set.
 *
 * NOTE(review): the initialisation and the return of $flinks are not
 * visible in this extract; the caller iterates over the return value, so
 * an array of Foreign_link objects is presumably returned - confirm.
 */
140 function refreshFlinks() {
142 $flink = new Foreign_link();
143 $flink->service = 1; // Twitter
144 $flink->orderBy('last_noticesync');
// find() runs the query; its return value is kept in $cnt.
146 $cnt = $flink->find();
148 if (defined('SCRIPT_DEBUG')) {
// NOTE(review): the message speaks of "friends subscriptions" although
// this class fetches statuses - possibly copied from another script.
// The rest of the message is not visible in this extract.
149 common_debug('Updating Twitter friends subscriptions' .
// $flink is re-used for every fetched row, so a clone is stored to give
// each collected entry its own object.
155 while ($flink->fetch()) {
// Keep the row only when the receive bit is set in noticesync.
157 if (($flink->noticesync & FOREIGN_NOTICE_RECV) ==
158 FOREIGN_NOTICE_RECV) {
159 $flinks[] = clone($flink);
/**
 * Remove a process ID from a list of child PIDs.
 *
 * The first entry equal to $ps is dropped and the list is re-indexed so
 * that it stays a packed, zero-based array. The list is left untouched
 * when $ps is not present.
 *
 * @param array &$plist list of PIDs, modified in place
 * @param int   $ps     PID to remove
 *
 * @return void
 */
function remove_ps(&$plist, $ps)
{
    // array_search() compares loosely (==) and finds the entry whatever
    // the array keys are, so a list with gaps in its keys is handled too.
    $key = array_search($ps, $plist);

    if ($key === false) {
        return;
    }

    unset($plist[$key]);

    // Close the gap left by unset() so positions stay contiguous.
    $plist = array_values($plist);
}
/**
 * Fetch the friends timeline for one linked Twitter account and hand each
 * status to saveStatus(), then stamp the link with the sync time.
 *
 * Reads $flink->foreign_id, $flink->credentials and the foreign user's
 * nickname; writes $flink->last_noticesync.
 *
 * NOTE(review): the guard conditions in front of the two warning logs,
 * and whatever persists $flink after last_noticesync is set, are not
 * visible in this extract.
 */
179 function getTimeline($flink)
// NOTE(review): $fid is not assigned anywhere in the visible code of this
// function, so this message would interpolate an undefined variable.
183 common_log(LOG_WARNING,
184 "Can't retrieve Foreign_link for foreign ID $fid");
188 $fuser = $flink->getForeignUser();
// NOTE(review): the value appended to this message is on a line that is
// not visible in this extract.
191 common_log(LOG_WARNING, "Unmatched user for ID " .
196 if (defined('SCRIPT_DEBUG')) {
197 common_debug('Trying to get timeline for Twitter user ' .
198 "$fuser->nickname ($flink->foreign_id).");
201 // XXX: Biggest remaining issue - How do we know at which status
202 // to start importing? How many statuses? Right now I'm going
203 // with the default last 20.
205 $url = 'http://twitter.com/statuses/friends_timeline.json';
207 $timeline_json = get_twitter_data($url, $fuser->nickname,
208 $flink->credentials);
// No second argument, so JSON objects decode to stdClass instances (the
// loop below reads ->source and ->id).
210 $timeline = json_decode($timeline_json);
// NOTE(review): only emptiness is checked; a non-empty decoded value that
// is not an array would still be passed to array_reverse() below.
212 if (empty($timeline)) {
213 common_log(LOG_WARNING, "Empty timeline.");
217 // Reverse to preserve order
218 foreach (array_reverse($timeline) as $status) {
220 // Hacktastic: filter out stuff coming from this Laconica
// NOTE(review): this lookup does not depend on $status and could be done
// once before the loop.
221 $source = mb_strtolower(common_config('integration', 'source'));
// NOTE(review): $source is placed in the pattern without preg_quote(), so
// a configured value containing '/' or regex metacharacters changes or
// breaks the match.
223 if (preg_match("/$source/", mb_strtolower($status->source))) {
224 if (defined('SCRIPT_DEBUG')) {
225 common_debug('Skipping import of status ' . $status->id .
226 ' with source ' . $source);
231 $this->saveStatus($status, $flink);
234 // Okay, record the time we synced with Twitter for posterity
235 $flink->last_noticesync = common_sql_now();
/**
 * Store one Twitter status as a Notice and add it to the linking user's
 * inbox.
 *
 * Reads $status->user, ->id, ->text and ->created_at, and $flink->user_id.
 *
 * NOTE(review): several guard conditions and early returns of this
 * function are not visible in this extract; the comments below describe
 * only the statements that are shown.
 */
239 function saveStatus($status, $flink)
// Make sure a Profile exists for the status author, then load it.
241 $id = $this->ensureProfile($status->user);
242 $profile = Profile::staticGet($id);
246 'Problem saving notice. No associated Profile.');
// The status permalink is used as the notice URI and is the key for the
// lookup of an existing notice below.
250 $uri = 'http://twitter.com/' . $status->user->screen_name .
251 '/status/' . $status->id;
253 $notice = Notice::staticGet('uri', $uri);
255 // check to see if we've already imported the status
258 $notice = new Notice();
259 $notice->profile_id = $id;
// The insert and the follow-up saves run between BEGIN and COMMIT.
// NOTE(review): no ROLLBACK is visible on the insert-failure path shown
// below - confirm the transaction is closed when insert() fails.
261 $notice->query('BEGIN');
263 // XXX: figure out reply_to
264 $notice->reply_to = null;
266 // XXX: Should this be common_sql_now() instead of status create date?
// created_at is parsed with strtotime() and reformatted as
// 'Y-m-d H:M:S' in the process's local timezone.
268 $notice->created = strftime('%Y-%m-%d %H:%M:%S',
269 strtotime($status->created_at));
270 $notice->content = $status->text;
271 $notice->rendered = common_render_content($status->text, $notice);
272 $notice->source = 'twitter';
273 $notice->is_local = 0;
276 $notice_id = $notice->insert();
279 common_log_db_error($notice, 'INSERT', __FILE__);
280 if (defined('SCRIPT_DEBUG')) {
281 common_debug('Could not save notice!');
285 // XXX: Figure out a better way to link Twitter replies?
286 $notice->saveReplies();
288 // XXX: Do we want to pollute our tag cloud with
289 // hashtags from Twitter?
291 $notice->saveGroups();
293 $notice->query('COMMIT');
295 if (defined('SCRIPT_DEBUG')) {
296 common_debug("Saved status $status->id" .
297 " as notice $notice->id.");
// NOTE(review): this lookup is keyed on notice_id alone, while the row
// built below is per user_id; once any user has the notice in an inbox,
// other linked users would appear to be skipped - confirm.
301 if (!Notice_inbox::staticGet('notice_id', $notice->id)) {
304 $inbox = new Notice_inbox();
305 $inbox->user_id = $flink->user_id;
306 $inbox->notice_id = $notice->id;
307 $inbox->created = common_sql_now();
/**
 * Find or create the local Profile (and Remote_profile) for a Twitter
 * user.
 *
 * Profiles are matched on the profile URL 'http://twitter.com/<screen_name>'.
 * Reads $user->screen_name, ->name, ->url, ->description and ->location.
 *
 * NOTE(review): the branch conditions and the return statements are not
 * visible in this extract; saveStatus() uses the return value as a
 * profile id.
 */
313 function ensureProfile($user)
315 // check to see if there's already a profile for this user
316 $profileurl = 'http://twitter.com/' . $user->screen_name;
317 $profile = Profile::staticGet('profileurl', $profileurl);
320 if (defined('SCRIPT_DEBUG')) {
321 common_debug("Profile for $profile->nickname found.");
324 // Check to see if the user's Avatar has changed
325 $this->checkAvatar($user, $profile);
330 if (defined('SCRIPT_DEBUG')) {
331 common_debug('Adding profile and remote profile ' .
332 "for Twitter user: $profileurl");
// Both inserts below run inside one transaction opened here.
335 $profile = new Profile();
336 $profile->query("BEGIN");
338 $profile->nickname = $user->screen_name;
339 $profile->fullname = $user->name;
340 $profile->homepage = $user->url;
341 $profile->bio = $user->description;
342 $profile->location = $user->location;
343 $profile->profileurl = $profileurl;
344 $profile->created = common_sql_now();
346 $id = $profile->insert();
349 common_log_db_error($profile, 'INSERT', __FILE__);
350 $profile->query("ROLLBACK");
354 // check for remote profile
355 $remote_pro = Remote_profile::staticGet('uri', $profileurl);
// The remote profile shares the id of the profile inserted above.
359 $remote_pro = new Remote_profile();
361 $remote_pro->id = $id;
362 $remote_pro->uri = $profileurl;
363 $remote_pro->created = common_sql_now();
365 $rid = $remote_pro->insert();
// NOTE(review): this error report follows $remote_pro->insert() but is
// given $profile; $remote_pro was presumably intended.
368 common_log_db_error($profile, 'INSERT', __FILE__);
369 $profile->query("ROLLBACK");
374 $profile->query("COMMIT");
// Avatars are fetched after the COMMIT above, outside the transaction.
376 $this->saveAvatars($user, $id);
/**
 * Refresh a profile's avatars when the Twitter user's image has changed.
 *
 * The filename of the stored 48px avatar is compared with the name that
 * the current profile_image_url would produce. When they differ, the
 * mini, normal and bigger variants are fetched and swapped in through
 * updateAvatar().
 *
 * @param object $user    Twitter user; reads ->id and ->profile_image_url
 * @param object $profile local profile; reads ->id and ->nickname and
 *                        calls ->getAvatar(48)
 *
 * @return void
 */
function checkAvatar($user, $profile)
{
    $path_parts = pathinfo($user->profile_image_url);
    $newname    = 'Twitter_' . $user->id . '_' . $path_parts['basename'];

    // A profile may not have a 48px avatar yet; that counts as "changed"
    // instead of reading a property off a missing object.
    $current = $profile->getAvatar(48);
    $oldname = empty($current) ? null : $current->filename;

    if ($newname == $oldname) {
        return;
    }

    if (defined('SCRIPT_DEBUG')) {
        common_debug('Avatar for Twitter user ' .
                     "$profile->nickname has changed.");
        common_debug("old: $oldname new: $newname");
    }

    // pathinfo() omits 'extension' when the URL has none.
    $ext    = isset($path_parts['extension']) ? $path_parts['extension'] : '';
    $dotext = ($ext === '') ? '' : ".$ext";

    // Drop the trailing "_normal" size marker by name rather than by a
    // fixed character count, so extensions of any length (e.g. "jpeg")
    // and names without the marker yield the right root.
    $img_root  = preg_replace('/_normal$/', '', $path_parts['filename']);
    $mediatype = $this->getMediatype($ext);

    foreach (array('mini', 'normal', 'bigger') as $size) {
        $url      = $path_parts['dirname'] . '/' .
                    $img_root . '_' . $size . $dotext;
        $filename = 'Twitter_' . $user->id . '_' .
                    $img_root . "_$size" . $dotext;

        // Only replace the stored avatar once the new file is on disk.
        if ($this->fetchAvatar($url, $filename)) {
            $this->updateAvatar($profile->id, $size, $mediatype, $filename);
        }
    }
}
/**
 * Map an image file extension to a MIME type.
 *
 * @param string $ext file extension without the leading dot, any case
 *
 * @return string 'image/jpeg' for jpg/jpeg, 'image/gif' for gif, and
 *                'image/png' for everything else
 */
function getMediatype($ext)
{
    switch (strtolower($ext)) {
    case 'jpg':
    case 'jpeg':
        // 'image/jpeg' is the registered media type; 'image/jpg' is not.
        return 'image/jpeg';
    case 'gif':
        return 'image/gif';
    default:
        // PNG doubles as the fallback so callers always get a usable
        // value to store.
        return 'image/png';
    }
}
/**
 * Fetch and register the three avatar sizes for a newly created profile.
 *
 * The mini, normal and bigger image URLs are derived from the user's
 * profile_image_url; each one that downloads successfully is stored via
 * newAvatar(), and a warning is logged for each one that does not.
 *
 * @param object $user Twitter user; reads ->id and ->profile_image_url
 * @param int    $id   id of the profile the avatars belong to
 *
 * @return void
 */
function saveAvatars($user, $id)
{
    $path_parts = pathinfo($user->profile_image_url);

    // pathinfo() omits 'extension' when the URL has none.
    $ext    = isset($path_parts['extension']) ? $path_parts['extension'] : '';
    $dotext = ($ext === '') ? '' : ".$ext";

    // Drop the trailing "_normal" size marker by name rather than by
    // counting characters, so a URL without the marker keeps its full
    // root instead of losing real characters.
    $img_root  = preg_replace('/_normal$/', '', $path_parts['filename']);
    $mediatype = $this->getMediatype($ext);

    foreach (array('mini', 'normal', 'bigger') as $size) {
        $url      = $path_parts['dirname'] . '/' .
                    $img_root . '_' . $size . $dotext;
        $filename = 'Twitter_' . $user->id . '_' .
                    $img_root . "_$size" . $dotext;

        if ($this->fetchAvatar($url, $filename)) {
            $this->newAvatar($id, $size, $mediatype, $filename);
        } else {
            common_log(LOG_WARNING, "Problem fetching Avatar: $url", __FILE__);
        }
    }
}
/**
 * Replace one size of a profile's avatar with a freshly fetched file.
 *
 * Looks up the profile, removes the file of the existing avatar of that
 * size from INSTALLDIR/avatar/, then registers the new file through
 * newAvatar().
 *
 * $size is one of 'mini', 'normal' or 'bigger' (the keys of $sizes).
 *
 * NOTE(review): the guard conditions, the early return and any deletion
 * of the old Avatar row are not visible in this extract.
 */
459 function updateAvatar($profile_id, $size, $mediatype, $filename) {
461 if (defined('SCRIPT_DEBUG')) {
462 common_debug("Updating avatar: $size");
465 $profile = Profile::staticGet($profile_id);
468 if (defined('SCRIPT_DEBUG')) {
469 common_debug("Couldn't get profile: $profile_id!");
// Pixel size used to look up the stored avatar for each Twitter size name.
// NOTE(review): a $size outside these three keys reads an undefined index.
474 $sizes = array('mini' => 24, 'normal' => 48, 'bigger' => 73);
475 $avatar = $profile->getAvatar($sizes[$size]);
478 if (defined('SCRIPT_DEBUG')) {
479 common_debug("Deleting $size avatar for $profile->nickname.");
// '@' silences any unlink() failure, e.g. when the old file is already gone.
481 @unlink(INSTALLDIR . '/avatar/' . $avatar->filename);
485 $this->newAvatar($profile->id, $size, $mediatype, $filename);
/**
 * Insert an Avatar row for a file that has already been downloaded.
 *
 * Sets profile_id, height, original, mediatype, filename, url and created
 * on a new Avatar and inserts it.
 *
 * NOTE(review): the branching on $size, any width assignments and the
 * return statements are not visible in this extract; only the three
 * height values (24, 48, 73) are shown.
 */
488 function newAvatar($profile_id, $size, $mediatype, $filename)
492 $avatar = new Avatar();
493 $avatar->profile_id = $profile_id;
// Heights match the sizes used in updateAvatar(): mini 24, normal 48,
// bigger 73.
498 $avatar->height = 24;
502 $avatar->height = 48;
506 // Note: Twitter's big avatars are a different size than
507 // Laconica's (Laconica's = 96)
510 $avatar->height = 73;
513 $avatar->original = 0; // we don't have the original
514 $avatar->mediatype = $mediatype;
515 $avatar->filename = $filename;
516 $avatar->url = Avatar::url($filename);
518 if (defined('SCRIPT_DEBUG')) {
519 common_debug("new filename: $avatar->url");
522 $avatar->created = common_sql_now();
524 $id = $avatar->insert();
527 common_log_db_error($avatar, 'INSERT', __FILE__);
531 if (defined('SCRIPT_DEBUG')) {
532 common_debug("Saved new $size avatar for $profile_id.");
/**
 * Download an avatar image into INSTALLDIR/avatar/<filename> with curl.
 *
 * Callers treat the return value as a success flag.
 *
 * NOTE(review): creation of the curl handle, closing of the handle and
 * the file, and the return statements are not visible in this extract.
 */
538 function fetchAvatar($url, $filename)
540 $avatar_dir = INSTALLDIR . '/avatar/';
542 $avatarfile = $avatar_dir . $filename;
// Opened for binary writing, so the target file is created or truncated
// before any data has been received.
544 $out = fopen($avatarfile, 'wb');
546 common_log(LOG_WARNING, "Couldn't open file $filename", __FILE__);
550 if (defined('SCRIPT_DEBUG')) {
551 common_debug("Fetching avatar: $url");
// The response body is written straight into $out; redirects are followed.
555 curl_setopt($ch, CURLOPT_URL, $url);
556 curl_setopt($ch, CURLOPT_FILE, $out);
557 curl_setopt($ch, CURLOPT_BINARYTRANSFER, true);
558 curl_setopt($ch, CURLOPT_FOLLOWLOCATION, true);
// NOTE(review): per the PHP manual a connect timeout of 0 means "wait
// indefinitely", and no overall CURLOPT_TIMEOUT is visible, so a stalled
// server could block this process - confirm this is intended.
559 curl_setopt($ch, CURLOPT_CONNECTTIMEOUT, 0);
560 $result = curl_exec($ch);
// Script entry point: lift PHP's time limits for this long-running
// process, use UTF-8 for the mb_* string functions, and create the fetcher.
569 ini_set("max_execution_time", "0");
570 ini_set("max_input_time", "0");
572 mb_internal_encoding('UTF-8');
// NOTE(review): the call that actually starts the daemon is not visible
// in this extract.
575 $fetcher = new TwitterStatusFetcher();