<?php
/**
 * StatusNet, the distributed open-source microblogging tool
 *
 * Plugin to check submitted notices with blogspam.net
 *
 * PHP version 5
 *
 * LICENCE: This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 *
 * @category  Plugin
 * @package   StatusNet
 * @author    Evan Prodromou <evan@status.net>
 * @author    Brion Vibber <brion@status.net>
 * @copyright 2009 StatusNet, Inc.
 * @license   http://www.fsf.org/licensing/licenses/agpl-3.0.html GNU Affero General Public License version 3.0
 * @link      http://status.net/
 */
// Refuse to run when the STATUSNET constant has not been defined by the
// including code (i.e. the file was requested directly).
if (!defined('STATUSNET')) {
    exit(1);
}

// PLUGIN_VERSION is a very generic global name. Re-defining an existing
// constant raises a notice (a warning on PHP 8), so only define it when no
// other code has claimed the name already.
if (!defined('PLUGIN_VERSION')) {
    define('PLUGIN_VERSION', '0.1.0');
}
/**
 * Plugin to check submitted notices with blogspam.net
 *
 * When new notices are saved, we check their text with blogspam.net (or
 * a compatible service).
 *
 * Blogspam.net is supposed to catch blog comment spam, and I found that
 * some of its tests (min/max size, bayesian match) gave a lot of false positives.
 * So, I've turned those tests off by default. This may not get as many
 * hits, but it's better than nothing.
 *
 * @category Plugin
 * @package  StatusNet
 * @author   Evan Prodromou <evan@status.net>
 * @license  http://www.fsf.org/licensing/licenses/agpl-3.0.html GNU Affero General Public License version 3.0
 * @link     http://status.net/
 *
 * @see Event
 */
class BlogspamNetPlugin extends Plugin
{
    /**
     * Version string reported by version() and onPluginVersion().
     */
    const PLUGIN_VERSION = '0.1.0';

    /**
     * @var string URL of the XML-RPC endpoint the notices are submitted to
     */
    public $baseUrl = 'http://test.blogspam.net:8888/';

    /**
     * Set up the plugin, optionally pointing it at a different endpoint.
     *
     * @param string|null $url endpoint URL; a falsy value keeps the default
     */
    public function __construct($url = null)
    {
        parent::__construct();

        if ($url) {
            $this->baseUrl = $url;
        }
    }

    /**
     * Submit a notice to the spam-checking service before it is saved.
     *
     * Sends an XML-RPC `testComment` request built from testArgs() and
     * interprets the status string that comes back.
     *
     * @param object $notice notice being saved (needs `content` and getProfile())
     *
     * @return bool always true when the service answers "OK"
     *              (presumably lets the event chain continue - confirm
     *              against the event dispatcher)
     *
     * @throws ServerException on an XML-RPC fault, an "ERROR" status or an
     *                         unrecognised response (code 500)
     * @throws ClientException when the service reports "SPAM" (code 400)
     */
    public function onStartNoticeSave($notice)
    {
        $args = $this->testArgs($notice);
        common_debug("Blogspamnet args = " . print_r($args, true));

        $requestBody = xmlrpc_encode_request('testComment', [$args]);

        $request = new HTTPClient($this->baseUrl, HTTPClient::METHOD_POST);
        $request->setHeader('Content-Type', 'text/xml');
        $request->setBody($requestBody);
        $httpResponse = $request->send();

        $response = xmlrpc_decode($httpResponse->getBody());

        // xmlrpc_is_fault() only accepts arrays, whereas a regular answer
        // decodes to a plain status string; check the type first.
        if (is_array($response) && xmlrpc_is_fault($response)) {
            throw new ServerException("$response[faultString] ($response[faultCode])", 500);
        }

        // Anything that is not a string (undecodable body, unexpected
        // structure) is rendered as text so it can be logged and reported
        // through the "unexpected response" branch below.
        $status = is_string($response) ? $response : print_r($response, true);
        common_debug("Blogspamnet results = " . $status);

        if (preg_match('/^ERROR(:(.*))?$/', $status, $match)) {
            // The ":detail" suffix is optional, so group 2 may be absent.
            // TRANS: Server exception thrown when blogspam.net returns error status.
            // TRANS: %1$s is the base URL, %2$s is the error (unknown contents; no period).
            throw new ServerException(sprintf(_m('Error from %1$s: %2$s'), $this->baseUrl, $match[2] ?? ''), 500);
        } elseif (preg_match('/^SPAM(:(.*))?$/', $status, $match)) {
            // TRANS: Server exception thrown when blogspam.net returns spam status.
            // TRANS: Does not end with period because of unknown contents for %s (spam match).
            throw new ClientException(sprintf(_m('Spam checker results: %s'), $match[2] ?? ''), 400);
        } elseif (!preg_match('/^OK$/', $status)) {
            // TRANS: Server exception thrown when blogspam.net returns an unexpected status.
            // TRANS: %1$s is the base URL, %2$s is the response (unknown contents; no period).
            throw new ServerException(sprintf(_m('Unexpected response from %1$s: %2$s'), $this->baseUrl, $status), 500);
        }

        // "OK": nothing to do.
        return true;
    }

    /**
     * Build the argument structure for the `testComment` call.
     *
     * @param object $notice notice being checked
     *
     * @return array map with the keys comment, ip, site, version, options and,
     *               when available, agent, link and name
     */
    public function testArgs($notice)
    {
        $args = [];

        $args['comment'] = $notice->content;
        $args['ip'] = $this->getClientIP();

        if (isset($_SERVER['HTTP_USER_AGENT'])) {
            $args['agent'] = $_SERVER['HTTP_USER_AGENT'];
        }

        $profile = $notice->getProfile();

        // Only read profile fields when a profile was actually returned;
        // the nickname is the fallback for an empty full name.
        if ($profile) {
            if ($profile->homepage) {
                $args['link'] = $profile->homepage;
            }
            $args['name'] = $profile->fullname ? $profile->fullname : $profile->nickname;
        }

        $args['site'] = common_root_url();
        $args['version'] = $this->userAgent();

        // NOTE(review): "bayasian" is sent verbatim as a runtime option; the
        // spelling is kept as-is - confirm against the service's test names
        // before "correcting" it.
        $args['options'] = "max-size=" . common_config('site', 'textlimit') . ",min-size=0,min-words=0,exclude=bayasian";

        return $args;
    }

    /**
     * Determine the IP address to report for the current request.
     *
     * @return string first non-empty address found in the inspected $_SERVER
     *                keys, or '127.0.0.1' outside of a web request
     */
    public function getClientIP()
    {
        if (isset($_SERVER) && array_key_exists('REQUEST_METHOD', $_SERVER)) {
            // Note: order matters here; use proxy-forwarded stuff first
            foreach (['HTTP_X_FORWARDED_FOR', 'CLIENT-IP', 'REMOTE_ADDR'] as $k) {
                if (!isset($_SERVER[$k])) {
                    continue;
                }

                // A forwarded-for header can carry a comma-separated chain
                // of addresses; only the first entry is a single usable IP.
                $candidate = trim(explode(',', (string) $_SERVER[$k])[0]);
                if ($candidate !== '') {
                    return $candidate;
                }
            }
        }

        return '127.0.0.1';
    }

    /**
     * Report the plugin version.
     *
     * @return string value of self::PLUGIN_VERSION
     */
    public function version()
    {
        return self::PLUGIN_VERSION;
    }

    /**
     * Append this plugin's metadata to the list of plugin versions.
     *
     * @param array $versions list to append to (modified in place)
     *
     * @return bool always true
     */
    public function onPluginVersion(array &$versions): bool
    {
        $versions[] = [
            'name' => 'BlogspamNet',
            'version' => self::PLUGIN_VERSION,
            'author' => 'Evan Prodromou, Brion Vibber',
            'homepage' => GNUSOCIAL_ENGINE_REPO_URL . 'tree/master/plugins/BlogspamNet',
            'rawdescription' =>
                // TRANS: Plugin description.
                _m('Plugin to check submitted notices with blogspam.net.'),
        ];

        return true;
    }
}