]> git.mxchange.org Git - quix0rs-gnu-social.git/commitdiff
train a whole user
authorEvan Prodromou <evan@status.net>
Fri, 9 Mar 2012 12:20:07 +0000 (06:20 -0600)
committerEvan Prodromou <evan@status.net>
Fri, 9 Mar 2012 12:20:07 +0000 (06:20 -0600)
scripts/trainuser.php [new file with mode: 0644]

diff --git a/scripts/trainuser.php b/scripts/trainuser.php
new file mode 100644 (file)
index 0000000..8ee6387
--- /dev/null
@@ -0,0 +1,81 @@
+<?php
+/*
+ * StatusNet - the distributed open-source microblogging tool
+ * Copyright (C) 2012 StatusNet, Inc.
+ *
+ * This program is free software: you can redistribute it and/or modify
+ * it under the terms of the GNU Affero General Public License as published by
+ * the Free Software Foundation, either version 3 of the License, or
+ * (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ * GNU Affero General Public License for more details.
+ *
+ * You should have received a copy of the GNU Affero General Public License
+ * along with this program.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+define('INSTALLDIR', realpath(dirname(__FILE__) . '/../../../..'));
+
+$shortoptions = 'i:n:';
+$longoptions = array('id=', 'nickname=');
+
+$helptext = <<<END_OF_TRAINUSER_HELP
+trainuser.php [options]
+Train user activities against the spam filter
+
+  -i --id       ID of user to export
+  -n --nickname nickname of the user to export
+  -t --category Category; one of "spam" or "ham"
+
+END_OF_TRAINUSER_HELP;
+
+require_once INSTALLDIR.'/scripts/commandline.inc';
+
+function trainUser($filter, $user, $category) {
+
+    printfnq("Training user %s\n", $user->nickname);
+
+    $profile = Profile::staticGet('id', $user->id);
+
+    $str = new ProfileNoticeStream($profile, $profile);
+
+    $offset = 0;
+    $limit  = 100;
+
+    do {
+        $notice = $str->getNotices($offset, $limit);
+        while ($notice->fetch()) {
+            try {
+                printfv("Training notice %d...", $notice->id);
+                $filter->trainOnError($notice, $category);
+                $result = $filter->test($notice);
+                $score = Spam_score::save($notice, $result);
+                printfv("%s\n", ($result->isSpam) ? "SPAM" : "HAM");
+            } catch (Exception $e) {
+                printfnq("ERROR training notice %d\n: %s", $notice->id, $e->getMessage());
+            }
+        }
+        $offset += $notice->N;
+    } while ($notice->N > 0);
+}
+
+try {
+    $filter = null;
+    Event::handle('GetSpamFilter', array(&$filter));
+    if (empty($filter)) {
+        throw new Exception(_("No spam filter."));
+    }
+    $user = getUser();
+    $category = get_option_value('t', 'category');
+    if ($category !== SpamFilter::HAM &&
+        $category !== SpamFilter::SPAM) {
+        throw new Exception(_("No such category."));
+    }
+    trainUser($filter, $user, $category);
+} catch (Exception $e) {
+    print $e->getMessage()."\n";
+    exit(1);
+}