forked from GNUsocial/gnu-social
		
	
		
			
	
	
		
			157 lines
		
	
	
		
			4.4 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
		
		
			
		
	
	
			157 lines
		
	
	
		
			4.4 KiB
		
	
	
	
		
			PHP
		
	
	
	
	
	
| 
								 | 
							
								<?php
							 | 
						||
| 
								 | 
							
								/**
							 | 
						||
| 
								 | 
							
								 * StatusNet - the distributed open-source microblogging tool
							 | 
						||
| 
								 | 
							
								 * Copyright (C) 2012, StatusNet, Inc.
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 * Spam filter class
							 | 
						||
| 
								 | 
							
								 * 
							 | 
						||
| 
								 | 
							
								 * PHP version 5
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 * This program is free software: you can redistribute it and/or modify
							 | 
						||
| 
								 | 
							
								 * it under the terms of the GNU Affero General Public License as published by
							 | 
						||
| 
								 | 
							
								 * the Free Software Foundation, either version 3 of the License, or
							 | 
						||
| 
								 | 
							
								 * (at your option) any later version.
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 * This program is distributed in the hope that it will be useful,
							 | 
						||
| 
								 | 
							
								 * but WITHOUT ANY WARRANTY; without even the implied warranty of
							 | 
						||
| 
								 | 
							
								 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
							 | 
						||
| 
								 | 
							
								 * GNU Affero General Public License for more details.
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 * You should have received a copy of the GNU Affero General Public License
							 | 
						||
| 
								 | 
							
								 * along with this program.  If not, see <http://www.gnu.org/licenses/>.
							 | 
						||
| 
								 | 
							
								 *
							 | 
						||
| 
								 | 
							
								 * @category  Spam
							 | 
						||
| 
								 | 
							
								 * @package   StatusNet
							 | 
						||
| 
								 | 
							
								 * @author    Evan Prodromou <evan@status.net>
							 | 
						||
| 
								 | 
							
								 * @copyright 2012 StatusNet, Inc.
							 | 
						||
| 
								 | 
							
								 * @license   http://www.fsf.org/licensing/licenses/agpl-3.0.html AGPL 3.0
							 | 
						||
| 
								 | 
							
								 * @link      http://status.net/
							 | 
						||
| 
								 | 
							
								 */
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								// Direct-access guard: stop immediately when the STATUSNET constant
								// has not been defined, so this file can't be executed directly
								// from the web.
								if (defined('STATUSNET') === false) {
								    exit(1);
								}
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								/**
								 * Spam filter class
								 *
								 * Local proxy for remote filter. Notices are converted to activities,
								 * serialised as JSON and POSTed to endpoints below the configured server
								 * URL, authenticating with the configured username and password.
								 *
								 * @category  Spam
								 * @package   StatusNet
								 * @author    Evan Prodromou <evan@status.net>
								 * @copyright 2012 StatusNet, Inc.
								 * @license   http://www.fsf.org/licensing/licenses/agpl-3.0.html AGPL 3.0
								 * @link      http://status.net/
								 */

								class SpamFilter {

								    /** Training category for content that is not spam. */
								    const HAM  = 'ham';

								    /** Training category for content that is spam. */
								    const SPAM = 'spam';

								    /** @var string Base URL of the remote filter; endpoint paths are appended to it. */
								    public $server;

								    /** @var string User name passed to the HTTP client's setAuth(). */
								    public $username;

								    /** @var string Password passed to the HTTP client's setAuth(). */
								    public $password;

								    /**
								     * Store the connection settings for the remote filter.
								     *
								     * @param string $server   Base URL of the remote filter
								     * @param string $username User name used for authentication
								     * @param string $password Password used for authentication
								     */
								    function __construct($server, $username, $password) {

								        $this->server   = $server;
								        $this->username = $username;
								        $this->password = $password;
								    }

								    /**
								     * Convert a notice into an activity.
								     *
								     * @param object $notice Object exposing asActivity()
								     *
								     * @return object Whatever $notice->asActivity(null) returns
								     */
								    protected function toActivity($notice) {
								        // FIXME: need this to autoload ActivityStreamsMediaLink
								        // The instance is otherwise unused; do not remove it while the
								        // FIXME above still applies.
								        $doc = new ActivityStreamJSONDocument();

								        return $notice->asActivity(null);
								    }

								    /**
								     * Ask the remote filter whether a notice is spam.
								     *
								     * @param object $notice Notice to check
								     *
								     * @return object Decoded JSON response (see testActivity())
								     *
								     * @throws Exception on an HTTP error or an undecodable response
								     */
								    public function test($notice) {

								        return $this->testActivity($this->toActivity($notice));
								    }

								    /**
								     * Ask the remote filter whether an activity is spam.
								     *
								     * @param object $activity Activity exposing asArray()
								     *
								     * @return object Decoded JSON response body; trainActivityOnError()
								     *                reads its isSpam property
								     *
								     * @throws Exception on an HTTP error, or when the response body does
								     *                   not decode to a JSON object
								     */
								    public function testActivity($activity) {

								        $response = $this->postActivity('/is-this-spam', $activity, 'checking spam score');

								        $result = json_decode($response->getBody());

								        // json_decode() yields null for unparsable input; fail here with a
								        // clear message instead of letting callers dereference a non-object.
								        if (!is_object($result)) {
								            throw new Exception("Invalid response checking spam score: " . $response->getBody());
								        }

								        return $result;
								    }

								    /**
								     * Train the remote filter with a notice of known category.
								     *
								     * @param object $notice   Notice to train with
								     * @param string $category self::HAM or self::SPAM
								     *
								     * @return boolean true on success
								     *
								     * @throws Exception on an unknown category or an HTTP error
								     */
								    public function train($notice, $category) {

								        return $this->trainActivity($this->toActivity($notice), $category);
								    }

								    /**
								     * Train the remote filter with an activity of known category.
								     *
								     * The category is validated before any request is made.
								     *
								     * @param object $activity Activity exposing asArray()
								     * @param string $category self::HAM or self::SPAM
								     *
								     * @return boolean true on success
								     *
								     * @throws Exception on an unknown category or an HTTP error
								     */
								    public function trainActivity($activity, $category) {

								        switch ($category) {
								        case self::HAM:
								            $endpoint = '/this-is-ham';
								            break;
								        case self::SPAM:
								            $endpoint = '/this-is-spam';
								            break;
								        default:
								            // String concatenation is '.', not '+': '+' is arithmetic and
								            // never produced the intended message.
								            throw new Exception("Unknown category: " . $category);
								        }

								        $this->postActivity($endpoint, $activity, 'training spam filter');

								        // We don't do much with the results
								        return true;
								    }

								    /**
								     * Train the remote filter with a notice only if it currently
								     * misclassifies that notice.
								     *
								     * @param object $notice   Notice to check and possibly train with
								     * @param string $category self::HAM or self::SPAM (the correct category)
								     *
								     * @return boolean true
								     *
								     * @throws Exception on an unknown category, an HTTP error or an
								     *                   undecodable response
								     */
								    public function trainOnError($notice, $category) {

								        return $this->trainActivityOnError($this->toActivity($notice), $category);
								    }

								    /**
								     * Train the remote filter with an activity only if it currently
								     * misclassifies that activity.
								     *
								     * The activity is first tested; when the reported isSpam flag already
								     * agrees with $category no training request is sent.
								     *
								     * @param object $activity Activity exposing asArray()
								     * @param string $category self::HAM or self::SPAM (the correct category)
								     *
								     * @return boolean true
								     *
								     * @throws Exception on an unknown category, an HTTP error or an
								     *                   undecodable response
								     */
								    public function trainActivityOnError($activity, $category) {

								        $result = $this->testActivity($activity);

								        if (($category === self::SPAM && $result->isSpam) ||
								            ($category === self::HAM && !$result->isSpam)) {
								            // The filter already classifies this correctly.
								            return true;
								        }

								        return $this->trainActivity($activity, $category);
								    }

								    /**
								     * POST an activity as JSON to one endpoint of the remote filter.
								     *
								     * @param string $endpoint Path appended to $this->server
								     * @param object $activity Activity exposing asArray()
								     * @param string $action   Short description used in the error message
								     *
								     * @return object Response returned by the HTTP client's send()
								     *
								     * @throws Exception when the response is not OK
								     */
								    private function postActivity($endpoint, $activity, $action) {

								        $client = new HTTPClient($this->server . $endpoint);

								        $client->setMethod('POST');
								        $client->setAuth($this->username, $this->password);
								        $client->setHeader('Content-Type', 'application/json');
								        $client->setBody(json_encode($activity->asArray()));

								        $response = $client->send();

								        if (!$response->isOK()) {
								            throw new Exception("Error " . $response->getStatus() . " " . $action . ": " . $response->getBody());
								        }

								        return $response;
								    }
								}
							 |