2010-03-22 04:25:49 +00:00
|
|
|
<?php
|
|
|
|
/**
 * StatusNet - the distributed open-source microblogging tool
 * Copyright (C) 2010, StatusNet, Inc.
 *
 * Creates a dynamic sitemap for a StatusNet site
 *
 * PHP version 5
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU Affero General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU Affero General Public License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 *
 * @category  Sample
 * @package   StatusNet
 * @author    Evan Prodromou <evan@status.net>
 * @copyright 2010 StatusNet, Inc.
 * @license   http://www.fsf.org/licensing/licenses/agpl-3.0.html AGPL 3.0
 * @link      http://status.net/
 */
|
|
|
|
|
|
|
|
if (defined('STATUSNET') === false) {
    // Security guard: when the STATUSNET constant has not been defined,
    // stop immediately so this file cannot be executed by requesting it
    // directly from the web.
    exit(1);
}
|
|
|
|
|
|
|
|
/**
 * Sitemap plugin
 *
 * Event handlers that wire dynamic sitemaps into a StatusNet site: the
 * plugin's classes are loaded on demand, the sitemap index is announced in
 * robots.txt, the sitemap URLs are routed to their actions, site
 * verification meta tags are written on the top page, and the tables that
 * cache per-date user and notice counts are kept in the schema.
 *
 * @category  Sample
 * @package   StatusNet
 * @author    Evan Prodromou <evan@status.net>
 * @copyright 2010 StatusNet, Inc.
 * @license   http://www.fsf.org/licensing/licenses/agpl-3.0.html AGPL 3.0
 * @link      http://status.net/
 */
class SitemapPlugin extends Plugin
{
    // NOTE(review): not referenced inside this class; presumably the cap on
    // entries per generated sitemap file -- confirm against the actions.
    const USERS_PER_MAP   = 50000;
    const NOTICES_PER_MAP = 50000;

    /**
     * Autoload hook: pull in this plugin's class files on demand
     *
     * Only the class names listed below are handled; the file is looked up
     * in the directory that contains this plugin file.
     *
     * @param string $cls Name of the class to be loaded
     *
     * @return boolean hook value; false when the class file was loaded here,
     *                 true to let processing continue for any other class.
     */
    public function onAutoload($cls)
    {
        $pluginDir = dirname(__FILE__);

        // Data classes: the file carries exactly the class name.
        $dataClasses = array('Sitemap_user_count',
                             'Sitemap_notice_count');

        // Action classes: the file is the lower-cased class name with the
        // trailing six characters ("Action") removed.
        $suffixedActions = array('SitemapindexAction',
                                 'NoticesitemapAction',
                                 'UsersitemapAction');

        if (in_array($cls, $dataClasses)) {
            require_once $pluginDir . '/' . $cls . '.php';
            return false;
        }

        if (in_array($cls, $suffixedActions)) {
            require_once $pluginDir . '/' . strtolower(mb_substr($cls, 0, -6)) . '.php';
            return false;
        }

        // The base action keeps its full (lower-cased) name as file name.
        if ($cls == 'SitemapAction') {
            require_once $pluginDir . '/' . strtolower($cls) . '.php';
            return false;
        }

        return true;
    }

    /**
     * Print a "Sitemap:" line for the sitemap index at the end of robots.txt
     *
     * @param Action $action Action being run
     *
     * @return boolean hook value; always true.
     */
    public function onEndRobotsTxt($action)
    {
        $indexUrl = common_local_url('sitemapindex');

        print "\nSitemap: " . $indexUrl . "\n";

        return true;
    }

    /**
     * Register the sitemap URLs with the router
     *
     * Connects the sitemap index plus the notice and user sitemap paths,
     * the latter two parameterised by year, month, day and index.
     *
     * @param Net_URL_Mapper $m path-to-action mapper
     *
     * @return boolean hook value; always true, so processing continues.
     */
    public function onRouterInitialized($m)
    {
        $m->connect('sitemapindex.xml',
                    array('action' => 'sitemapindex'));

        // Both per-date sitemap routes use identical parameter patterns.
        $datePatterns = array('year' => '[0-9]{4}',
                              'month' => '[01][0-9]',
                              'day' => '[0123][0-9]',
                              'index' => '[1-9][0-9]*');

        $m->connect('/notice-sitemap-:year-:month-:day-:index.xml',
                    array('action' => 'noticesitemap'),
                    $datePatterns);

        $m->connect('/user-sitemap-:year-:month-:day-:index.xml',
                    array('action' => 'usersitemap'),
                    $datePatterns);

        return true;
    }

    /**
     * Meta tags for "claiming" a site
     *
     * Search engines like Yahoo!, Google, and Bing require extra meta tags
     * to let you claim your site. They are written only on the "top" page,
     * and only for keys that have a non-empty value in the 'sitemap'
     * configuration section.
     *
     * @param Action $action Action being executed
     *
     * @return boolean hook value; always true.
     */
    public function onStartShowHeadElements($action)
    {
        $actionName = $action->trimmed('action');
        $singleUser = common_config('singleuser', 'enabled');

        // The "top" page differs between single-user and multi-user sites.
        $topAction = $singleUser ? 'showstream' : 'public';

        if ($actionName != $topAction) {
            return true;
        }

        // Configuration key => name attribute of the meta element.
        // XXX: is this the same for all sites?
        $metaNames = array('googlekey' => 'google-site-verification',
                           'yahookey' => 'y_key',
                           'bingkey' => 'msvalidate.01');

        foreach ($metaNames as $configKey => $metaName) {
            $value = common_config('sitemap', $configKey);

            if (empty($value)) {
                continue;
            }

            $action->element('meta', array('name' => $metaName,
                                           'content' => $value));
        }

        return true;
    }

    /**
     * Database schema setup
     *
     * Ensures the two count tables exist. Some data is cached persistently
     * in them to avoid overlong queries.
     *
     * @see Sitemap_user_count
     * @see Sitemap_notice_count
     *
     * @return boolean hook value; always true, so processing continues.
     */
    public function onCheckSchema()
    {
        $schema = Schema::get();

        // One row per registration date, keyed on that date.
        $userCountColumns = array(
            new ColumnDef('registration_date', 'date', null, true, 'PRI'),
            new ColumnDef('user_count', 'integer'),
            new ColumnDef('created', 'datetime', null, false),
            new ColumnDef('modified', 'timestamp')
        );

        $schema->ensureTable('sitemap_user_count', $userCountColumns);

        // One row per notice date, keyed on that date.
        $noticeCountColumns = array(
            new ColumnDef('notice_date', 'date', null, true, 'PRI'),
            new ColumnDef('notice_count', 'integer'),
            new ColumnDef('created', 'datetime', null, false),
            new ColumnDef('modified', 'timestamp')
        );

        $schema->ensureTable('sitemap_notice_count', $noticeCountColumns);

        return true;
    }
}
|