Code standards for deliciousbackupimporter.php

This commit is contained in:
Evan Prodromou 2010-12-21 09:42:44 -05:00
parent 17515aacac
commit 331639d6e4

View File

@ -1,123 +1,216 @@
<?php <?php
/**
* StatusNet - the distributed open-source microblogging tool
* Copyright (C) 2010, StatusNet, Inc.
*
* Importer class for Delicious.com backups
*
* PHP version 5
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Affero General Public License for more details.
*
* You should have received a copy of the GNU Affero General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*
* @category Bookmark
* @package StatusNet
* @author Evan Prodromou <evan@status.net>
* @copyright 2010 StatusNet, Inc.
* @license http://www.fsf.org/licensing/licenses/agpl-3.0.html AGPL 3.0
* @link http://status.net/
*/
if (!defined('STATUSNET')) {
// This check helps protect against security problems;
// your code file can't be executed directly from the web.
exit(1);
}
require_once INSTALLDIR . '/lib/apiauth.php';
/**
* Importer class for Delicious bookmarks
*
* @category Bookmark
* @package StatusNet
* @author Evan Prodromou <evan@status.net>
* @copyright 2010 StatusNet, Inc.
* @license http://www.fsf.org/licensing/licenses/agpl-3.0.html AGPL 3.0
* @link http://status.net/
*/
class DeliciousBackupImporter class DeliciousBackupImporter
{ {
function importBookmarks($user, $body) /**
{ * Import an in-memory bookmark list to a user's account
$doc = $this->importHTML($body); *
* Take a delicious.com backup file (same as Netscape bookmarks.html)
* and import to StatusNet as Bookmark activities.
*
* The document format is terrible. It consists of a <dl> with
* a bunch of <dt>'s, occasionally with <dd>'s.
* There are sometimes <p>'s lost inside.
*
* @param User $user User whose feed we're going to fill
* @param string $body Body of the file
*
* @return void
*/
$dls = $doc->getElementsByTagName('dl'); function importBookmarks($user, $body)
{
$doc = $this->importHTML($body);
if ($dls->length != 1) { $dls = $doc->getElementsByTagName('dl');
throw new ClientException(_("Bad import file."));
}
$dl = $dls->item(0); if ($dls->length != 1) {
throw new ClientException(_("Bad import file."));
}
$children = $dl->childNodes; $dl = $dls->item(0);
$dt = null; $children = $dl->childNodes;
for ($i = 0; $i < $children->length; $i++) { $dt = null;
try {
$child = $children->item($i);
if ($child->nodeType != XML_ELEMENT_NODE) {
continue;
}
common_log(LOG_INFO, $child->tagName);
switch (strtolower($child->tagName)) {
case 'dt':
if (!empty($dt)) {
// No DD provided
$this->importBookmark($user, $dt);
$dt = null;
}
$dt = $child;
break;
case 'dd':
$dd = $child;
$saved = $this->importBookmark($user, $dt, $dd);
$dt = null;
$dd = null;
case 'p':
common_log(LOG_INFO, 'Skipping the <p> in the <dl>.');
break;
default:
common_log(LOG_WARNING, "Unexpected element $child->tagName found in import.");
}
} catch (Exception $e) {
common_log(LOG_ERR, $e->getMessage());
$dt = $dd = null;
}
}
}
function importBookmark($user, $dt, $dd = null) for ($i = 0; $i < $children->length; $i++) {
{ try {
// We have to go squirrelling around in the child nodes $child = $children->item($i);
// on the off chance that we've received another <dt> if ($child->nodeType != XML_ELEMENT_NODE) {
// as a child. continue;
}
common_log(LOG_INFO, $child->tagName);
switch (strtolower($child->tagName)) {
case 'dt':
if (!empty($dt)) {
// No DD provided
$this->importBookmark($user, $dt);
$dt = null;
}
$dt = $child;
break;
case 'dd':
$dd = $child;
for ($i = 0; $i < $dt->childNodes->length; $i++) { $saved = $this->importBookmark($user, $dt, $dd);
$child = $dt->childNodes->item($i);
if ($child->nodeType == XML_ELEMENT_NODE) {
if ($child->tagName == 'dt' && !is_null($dd)) {
$this->importBookmark($user, $dt);
$this->importBookmark($user, $child, $dd);
return;
}
}
}
$as = $dt->getElementsByTagName('a'); $dt = null;
$dd = null;
case 'p':
common_log(LOG_INFO, 'Skipping the <p> in the <dl>.');
break;
default:
common_log(LOG_WARNING,
"Unexpected element $child->tagName ".
" found in import.");
}
} catch (Exception $e) {
common_log(LOG_ERR, $e->getMessage());
$dt = $dd = null;
}
}
}
if ($as->length == 0) { /**
throw new ClientException(_("No <A> tag in a <DT>.")); * Import a single bookmark
} *
* Takes a <dt>/<dd> pair. The <dt> has a single
* <a> in it with some non-standard attributes.
*
* A <dt><dt><dd> sequence will appear as a <dt> with
* anothe <dt> as a child. We handle this case recursively.
*
* @param User $user User to import data as
* @param DOMElement $dt <dt> element
* @param DOMElement $dd <dd> element
*
* @return Notice imported notice
*/
$a = $as->item(0); function importBookmark($user, $dt, $dd = null)
{
$private = $a->getAttribute('private'); // We have to go squirrelling around in the child nodes
// on the off chance that we've received another <dt>
// as a child.
if ($private != 0) { for ($i = 0; $i < $dt->childNodes->length; $i++) {
throw new ClientException(_('Skipping private bookmark.')); $child = $dt->childNodes->item($i);
} if ($child->nodeType == XML_ELEMENT_NODE) {
if ($child->tagName == 'dt' && !is_null($dd)) {
$this->importBookmark($user, $dt);
$this->importBookmark($user, $child, $dd);
return;
}
}
}
if (!empty($dd)) { $as = $dt->getElementsByTagName('a');
$description = $dd->nodeValue;
} else {
$description = null;
}
$title = $a->nodeValue; if ($as->length == 0) {
$url = $a->getAttribute('href'); throw new ClientException(_("No <A> tag in a <DT>."));
$tags = $a->getAttribute('tags'); }
$addDate = $a->getAttribute('add_date');
$created = common_sql_date(intval($addDate));
$saved = Notice_bookmark::saveNew($user, $a = $as->item(0);
$title,
$url, $private = $a->getAttribute('private');
$tags,
$description,
array('created' => $created));
return $saved; if ($private != 0) {
} throw new ClientException(_('Skipping private bookmark.'));
}
function importHTML($body) if (!empty($dd)) {
{ $description = $dd->nodeValue;
} else {
$description = null;
}
$title = $a->nodeValue;
$url = $a->getAttribute('href');
$tags = $a->getAttribute('tags');
$addDate = $a->getAttribute('add_date');
$created = common_sql_date(intval($addDate));
$saved = Notice_bookmark::saveNew($user,
$title,
$url,
$tags,
$description,
array('created' => $created));
return $saved;
}
/**
* Parse some HTML
*
* Hides the errors that the dom parser returns
*
* @param string $body Data to import
*
* @return DOMDocument parsed document
*/
function importHTML($body)
{
// DOMDocument::loadHTML may throw warnings on unrecognized elements, // DOMDocument::loadHTML may throw warnings on unrecognized elements,
// and notices on unrecognized namespaces. // and notices on unrecognized namespaces.
$old = error_reporting(error_reporting() & ~(E_WARNING | E_NOTICE)); $old = error_reporting(error_reporting() & ~(E_WARNING | E_NOTICE));
$dom = new DOMDocument(); $dom = new DOMDocument();
$ok = $dom->loadHTML($body); $ok = $dom->loadHTML($body);
error_reporting($old); error_reporting($old);
if ($ok) { if ($ok) {
return $dom; return $dom;
} else { } else {
return null; return null;
} }
} }
} }