1
0
mirror of https://git.tt-rss.org/git/tt-rss.git synced 2026-02-10 16:01:33 +00:00

add basic tinyparser/atom

This commit is contained in:
Andrew Dolgov
2013-05-01 17:04:57 +04:00
parent 7fc041c6ef
commit cd07592c29
5 changed files with 255 additions and 13 deletions

View File

@@ -0,0 +1,7 @@
<?php
/**
 * Plain value holder describing one enclosure (attached media) of a feed item.
 *
 * The class has no behaviour of its own; whoever creates an instance is
 * expected to assign the public fields directly.
 */
class FeedEnclosure {
    /** Location of the enclosed resource; null until assigned. */
    public $link = null;

    /** Media type reported for the resource; null until assigned. */
    public $type = null;

    /** Size reported for the resource; null until assigned. */
    public $length = null;
}
?>

15
classes/feeditem.php Normal file
View File

@@ -0,0 +1,15 @@
<?php
/**
 * Contract for a single entry of a parsed feed.
 *
 * The class only declares accessors; concrete, format-specific item classes
 * are expected to extend it and implement every method. It has to be declared
 * abstract itself: PHP refuses to compile a non-abstract class that contains
 * abstract methods.
 */
abstract class FeedItem {
    /** Identifier of the entry. */
    abstract public function get_id();

    /** Date associated with the entry. */
    abstract public function get_date();

    /** Link to the entry. */
    abstract public function get_link();

    /** Title of the entry. */
    abstract public function get_title();

    /** Description (summary) of the entry. */
    abstract public function get_description();

    /** Content of the entry. */
    abstract public function get_content();

    /** URL of the comments belonging to the entry. */
    abstract public function get_comments_url();

    /** Number of comments belonging to the entry. */
    abstract public function get_comments_count();

    /** Categories assigned to the entry. */
    abstract public function get_categories();

    /** Enclosures attached to the entry. */
    abstract public function get_enclosures();

    /** Author of the entry. */
    abstract public function get_author();
}
?>

118
classes/feeditem/atom.php Normal file
View File

@@ -0,0 +1,118 @@
<?php
/**
 * Accessors over a single Atom <entry> element.
 *
 * The wrapped element is queried lazily with getElementsByTagName(), which
 * matches descendants at any depth. Accessors return null when the requested
 * information is absent, except get_categories() and get_enclosures(), which
 * always return an array (possibly empty).
 *
 * get_comments_url() and get_comments_count() are not implemented yet and
 * always return null.
 */
class FeedItem_Atom {
    /** DOM element of the entry being wrapped. */
    private $elem;

    /**
     * @param DOMElement $elem the <entry> element to read from
     */
    function __construct($elem) {
        $this->elem = $elem;
    }

    /**
     * Text of the first descendant element with the given tag name.
     *
     * @param string $tag element name to look up
     * @return string|null node value, or null when no such element exists
     */
    private function first_node_value($tag) {
        $node = $this->elem->getElementsByTagName($tag)->item(0);

        return $node ? $node->nodeValue : null;
    }

    /**
     * @return string|null value of <id>, falling back to get_link() when the
     *                     entry has no <id> element
     */
    function get_id() {
        $id = $this->elem->getElementsByTagName("id")->item(0);

        if ($id) {
            return $id->nodeValue;
        }

        return $this->get_link();
    }

    /**
     * Date of the entry taken from <updated>, falling back to <published>.
     *
     * @return int|null Unix timestamp as produced by strtotime(), or null when
     *                  neither element is present or parseable
     */
    function get_date() {
        foreach (array("updated", "published") as $tag) {
            $node = $this->elem->getElementsByTagName($tag)->item(0);

            if ($node) {
                $timestamp = strtotime(trim($node->nodeValue));

                if ($timestamp !== false) {
                    return $timestamp;
                }
            }
        }

        return null;
    }

    /**
     * URL of the entry itself.
     *
     * A link without a rel attribute has to be treated as rel="alternate"
     * (RFC 4287, section 4.2.7.2), so both spellings are accepted here.
     *
     * @return string|null href of the first matching <link>, or null
     */
    function get_link() {
        foreach ($this->elem->getElementsByTagName("link") as $link) {
            if (!$link->hasAttribute("href")) {
                continue;
            }

            if (!$link->hasAttribute("rel") || $link->getAttribute("rel") === "alternate") {
                return $link->getAttribute("href");
            }
        }

        return null;
    }

    /** @return string|null value of the first <title> element */
    function get_title() {
        return $this->first_node_value("title");
    }

    /** @return string|null value of the first <content> element */
    function get_content() {
        return $this->first_node_value("content");
    }

    /** @return string|null value of the first <summary> element */
    function get_description() {
        return $this->first_node_value("summary");
    }

    // todo
    function get_comments_url() {
    }

    // todo
    function get_comments_count() {
    }

    /**
     * @return array list of the "term" attribute values of all <category>
     *               elements that carry one
     */
    function get_categories() {
        $cats = array();

        foreach ($this->elem->getElementsByTagName("category") as $cat) {
            if ($cat->hasAttribute("term")) {
                $cats[] = $cat->getAttribute("term");
            }
        }

        return $cats;
    }

    /**
     * Collects every <link rel="enclosure"> that has an href.
     *
     * @return array list of FeedEnclosure objects; type, link and length are
     *               copied from the type, href and length attributes
     *               (getAttribute() yields "" for a missing attribute)
     */
    function get_enclosures() {
        $encs = array();

        foreach ($this->elem->getElementsByTagName("link") as $link) {
            if (!$link->hasAttribute("href") || $link->getAttribute("rel") !== "enclosure") {
                continue;
            }

            $enc = new FeedEnclosure();
            $enc->type = $link->getAttribute("type");
            $enc->link = $link->getAttribute("href");
            $enc->length = $link->getAttribute("length");

            $encs[] = $enc;
        }

        return $encs;
    }

    /**
     * @return string|null the <name> of the first <author>, else its <email>,
     *                     else null
     */
    function get_author() {
        $author = $this->elem->getElementsByTagName("author")->item(0);

        if ($author) {
            foreach (array("name", "email") as $tag) {
                $node = $author->getElementsByTagName($tag)->item(0);

                if ($node) {
                    return $node->nodeValue;
                }
            }
        }

        return null;
    }
}
?>

101
classes/feedparser.php Normal file
View File

@@ -0,0 +1,101 @@
<?php
/**
 * Small DOM-based feed parser.
 *
 * Usage: construct with the raw XML, call init(), then read error(),
 * get_title(), get_link() and get_items(). Only Atom feeds are actually
 * parsed at the moment; an <rss> root is recognised but yields no data, and
 * any other root element is reported through error().
 */
class FeedParser {
    /** DOMDocument holding the parsed feed. */
    private $doc;
    /** Human-readable description of the last problem, "" when there is none. */
    private $error;
    /** List of item objects collected by init(). */
    private $items;
    /** Feed-level link, null until init() finds one. */
    private $link;
    /** Feed-level title, null until init() finds one. */
    private $title;
    /** One of the FEED_* constants, null until init() detects the type. */
    private $type;

    const FEED_RDF = 0;
    const FEED_RSS = 1;
    const FEED_ATOM = 2;

    /**
     * Parses the XML and records the last libxml error, if any.
     *
     * Note: switches libxml to internal error handling for the process and
     * clears the libxml error buffer.
     *
     * @param string $data raw feed XML
     */
    function __construct($data) {
        libxml_use_internal_errors(true);
        libxml_clear_errors();

        $this->doc = new DOMDocument();
        $this->items = array();

        // loadXML() rejects empty input with a warning/ValueError instead of
        // a libxml error, so report that case ourselves.
        if ($data === null || $data === false || $data === "") {
            $this->error = "Empty feed data";
            return;
        }

        $this->doc->loadXML($data);
        $this->error = $this->format_error(libxml_get_last_error());
        libxml_clear_errors();
    }

    /**
     * Detects the feed type from the root element and, for Atom feeds,
     * extracts title, link and items. Does nothing when the document has no
     * root element (e.g. parsing failed).
     */
    function init() {
        // documentElement rather than firstChild: the first child of the
        // document may be a comment or a processing instruction.
        $root = $this->doc->documentElement;

        if (!$root) {
            return;
        }

        switch ($root->tagName) {
            case "rss":
                $this->type = self::FEED_RSS;
                break;
            case "feed":
                $this->type = self::FEED_ATOM;
                break;
            default:
                $this->error = "Unknown/unsupported feed type";
                return;
        }

        $xpath = new DOMXPath($this->doc);

        switch ($this->type) {
            case self::FEED_ATOM:
                $xpath->registerNamespace('atom', 'http://www.w3.org/2005/Atom');

                $title = $xpath->query("//atom:feed/atom:title")->item(0);

                if ($title) {
                    $this->title = $title->nodeValue;
                }

                // A missing rel means rel="alternate" (RFC 4287, 4.2.7.2).
                $link = $xpath->query(
                    "//atom:feed/atom:link[@href and (not(@rel) or @rel='alternate')]")->item(0);

                if ($link) {
                    $this->link = $link->getAttribute("href");
                }

                foreach ($xpath->query("//atom:entry") as $article) {
                    $this->items[] = new FeedItem_Atom($article);
                }

                break;
            case self::FEED_RDF:
                // not implemented yet
                break;
            case self::FEED_RSS:
                // not implemented yet
                break;
        }
    }

    /**
     * Renders a libxml error object as a single line of text.
     *
     * @param object|false $error value returned by libxml_get_last_error()
     * @return string formatted message, or "" when there is no error
     */
    function format_error($error) {
        if (!$error) {
            return "";
        }

        return sprintf("LibXML error %s at line %d (column %d): %s",
            $error->code, $error->line, $error->column,
            $error->message);
    }

    /** @return string last recorded error, "" when there is none */
    function error() {
        return $this->error;
    }

    /** @return string|null feed-level link found by init() */
    function get_link() {
        return $this->link;
    }

    /** @return string|null feed-level title found by init() */
    function get_title() {
        return $this->title;
    }

    /** @return array items collected by init() */
    function get_items() {
        return $this->items;
    }
}