summaryrefslogtreecommitdiffstats
path: root/3rdparty/ZendFeed/Reader/Feed/Rss.php
diff options
context:
space:
mode:
Diffstat (limited to '3rdparty/ZendFeed/Reader/Feed/Rss.php')
-rw-r--r--3rdparty/ZendFeed/Reader/Feed/Rss.php707
1 files changed, 707 insertions, 0 deletions
diff --git a/3rdparty/ZendFeed/Reader/Feed/Rss.php b/3rdparty/ZendFeed/Reader/Feed/Rss.php
new file mode 100644
index 000000000..fc7baa131
--- /dev/null
+++ b/3rdparty/ZendFeed/Reader/Feed/Rss.php
@@ -0,0 +1,707 @@
+<?php
+/**
+ * Zend Framework (http://framework.zend.com/)
+ *
+ * @link http://github.com/zendframework/zf2 for the canonical source repository
+ * @copyright Copyright (c) 2005-2014 Zend Technologies USA Inc. (http://www.zend.com)
+ * @license http://framework.zend.com/license/new-bsd New BSD License
+ */
+
+namespace Zend\Feed\Reader\Feed;
+
+use DateTime;
+use DOMDocument;
+use Zend\Feed\Reader;
+use Zend\Feed\Reader\Collection;
+use Zend\Feed\Reader\Exception;
+
+/**
+*/
+class Rss extends AbstractFeed
+{
+
+ /**
+ * Constructor
+ *
+ * @param DOMDocument $dom
+ * @param string $type
+ */
+ public function __construct(DOMDocument $dom, $type = null)
+ {
+ parent::__construct($dom, $type);
+
+ $manager = Reader\Reader::getExtensionManager();
+
+ $feed = $manager->get('DublinCore\Feed');
+ $feed->setDomDocument($dom);
+ $feed->setType($this->data['type']);
+ $feed->setXpath($this->xpath);
+ $this->extensions['DublinCore\Feed'] = $feed;
+
+ $feed = $manager->get('Atom\Feed');
+ $feed->setDomDocument($dom);
+ $feed->setType($this->data['type']);
+ $feed->setXpath($this->xpath);
+ $this->extensions['Atom\Feed'] = $feed;
+
+ if ($this->getType() !== Reader\Reader::TYPE_RSS_10
+ && $this->getType() !== Reader\Reader::TYPE_RSS_090
+ ) {
+ $xpathPrefix = '/rss/channel';
+ } else {
+ $xpathPrefix = '/rdf:RDF/rss:channel';
+ }
+ foreach ($this->extensions as $extension) {
+ $extension->setXpathPrefix($xpathPrefix);
+ }
+ }
+
+ /**
+ * Get a single author
+ *
+ * @param int $index
+ * @return string|null
+ */
+ public function getAuthor($index = 0)
+ {
+ $authors = $this->getAuthors();
+
+ if (isset($authors[$index])) {
+ return $authors[$index];
+ }
+
+ return null;
+ }
+
+ /**
+ * Get an array with feed authors
+ *
+ * @return array
+ */
+ public function getAuthors()
+ {
+ if (array_key_exists('authors', $this->data)) {
+ return $this->data['authors'];
+ }
+
+ $authors = array();
+ $authorsDc = $this->getExtension('DublinCore')->getAuthors();
+ if (!empty($authorsDc)) {
+ foreach ($authorsDc as $author) {
+ $authors[] = array(
+ 'name' => $author['name']
+ );
+ }
+ }
+
+ /**
+ * Technically RSS doesn't specific author element use at the feed level
+ * but it's supported on a "just in case" basis.
+ */
+ if ($this->getType() !== Reader\Reader::TYPE_RSS_10
+ && $this->getType() !== Reader\Reader::TYPE_RSS_090) {
+ $list = $this->xpath->query('//author');
+ } else {
+ $list = $this->xpath->query('//rss:author');
+ }
+ if ($list->length) {
+ foreach ($list as $author) {
+ $string = trim($author->nodeValue);
+ $email = null;
+ $name = null;
+ $data = array();
+ // Pretty rough parsing - but it's a catchall
+ if (preg_match("/^.*@[^ ]*/", $string, $matches)) {
+ $data['email'] = trim($matches[0]);
+ if (preg_match("/\((.*)\)$/", $string, $matches)) {
+ $data['name'] = $matches[1];
+ }
+ $authors[] = $data;
+ }
+ }
+ }
+
+ if (count($authors) == 0) {
+ $authors = $this->getExtension('Atom')->getAuthors();
+ } else {
+ $authors = new Reader\Collection\Author(
+ Reader\Reader::arrayUnique($authors)
+ );
+ }
+
+ if (count($authors) == 0) {
+ $authors = null;
+ }
+
+ $this->data['authors'] = $authors;
+
+ return $this->data['authors'];
+ }
+
+ /**
+ * Get the copyright entry
+ *
+ * @return string|null
+ */
+ public function getCopyright()
+ {
+ if (array_key_exists('copyright', $this->data)) {
+ return $this->data['copyright'];
+ }
+
+ $copyright = null;
+
+ if ($this->getType() !== Reader\Reader::TYPE_RSS_10 &&
+ $this->getType() !== Reader\Reader::TYPE_RSS_090) {
+ $copyright = $this->xpath->evaluate('string(/rss/channel/copyright)');
+ }
+
+ if (!$copyright && $this->getExtension('DublinCore') !== null) {
+ $copyright = $this->getExtension('DublinCore')->getCopyright();
+ }
+
+ if (empty($copyright)) {
+ $copyright = $this->getExtension('Atom')->getCopyright();
+ }
+
+ if (!$copyright) {
+ $copyright = null;
+ }
+
+ $this->data['copyright'] = $copyright;
+
+ return $this->data['copyright'];
+ }
+
+ /**
+ * Get the feed creation date
+ *
+ * @return string|null
+ */
+ public function getDateCreated()
+ {
+ return $this->getDateModified();
+ }
+
+ /**
+ * Get the feed modification date
+ *
+ * @return DateTime
+ * @throws Exception\RuntimeException
+ */
+ public function getDateModified()
+ {
+ if (array_key_exists('datemodified', $this->data)) {
+ return $this->data['datemodified'];
+ }
+
+ $dateModified = null;
+ $date = null;
+
+ if ($this->getType() !== Reader\Reader::TYPE_RSS_10 &&
+ $this->getType() !== Reader\Reader::TYPE_RSS_090) {
+ $dateModified = $this->xpath->evaluate('string(/rss/channel/pubDate)');
+ if (!$dateModified) {
+ $dateModified = $this->xpath->evaluate('string(/rss/channel/lastBuildDate)');
+ }
+ if ($dateModified) {
+ $dateModifiedParsed = strtotime($dateModified);
+ if ($dateModifiedParsed) {
+ $date = new DateTime('@' . $dateModifiedParsed);
+ } else {
+ $dateStandards = array(DateTime::RSS, DateTime::RFC822,
+ DateTime::RFC2822, null);
+ foreach ($dateStandards as $standard) {
+ try {
+ $date = DateTime::createFromFormat($standard, $dateModified);
+ break;
+ } catch (\Exception $e) {
+ if ($standard == null) {
+ throw new Exception\RuntimeException(
+ 'Could not load date due to unrecognised'
+ .' format (should follow RFC 822 or 2822):'
+ . $e->getMessage(),
+ 0, $e
+ );
+ }
+ }
+ }
+ }
+ }
+ }
+
+ if (!$date) {
+ $date = $this->getExtension('DublinCore')->getDate();
+ }
+
+ if (!$date) {
+ $date = $this->getExtension('Atom')->getDateModified();
+ }
+
+ if (!$date) {
+ $date = null;
+ }
+
+ $this->data['datemodified'] = $date;
+
+ return $this->data['datemodified'];
+ }
+
+ /**
+ * Get the feed lastBuild date
+ *
+ * @throws Exception\RuntimeException
+ * @return DateTime
+ */
+ public function getLastBuildDate()
+ {
+ if (array_key_exists('lastBuildDate', $this->data)) {
+ return $this->data['lastBuildDate'];
+ }
+
+ $lastBuildDate = null;
+ $date = null;
+
+ if ($this->getType() !== Reader\Reader::TYPE_RSS_10 &&
+ $this->getType() !== Reader\Reader::TYPE_RSS_090) {
+ $lastBuildDate = $this->xpath->evaluate('string(/rss/channel/lastBuildDate)');
+ if ($lastBuildDate) {
+ $lastBuildDateParsed = strtotime($lastBuildDate);
+ if ($lastBuildDateParsed) {
+ $date = new DateTime('@' . $lastBuildDateParsed);
+ } else {
+ $dateStandards = array(DateTime::RSS, DateTime::RFC822,
+ DateTime::RFC2822, null);
+ foreach ($dateStandards as $standard) {
+ try {
+ $date = DateTime::createFromFormat($standard, $lastBuildDateParsed);
+ break;
+ } catch (\Exception $e) {
+ if ($standard == null) {
+ throw new Exception\RuntimeException(
+ 'Could not load date due to unrecognised'
+ .' format (should follow RFC 822 or 2822):'
+ . $e->getMessage(),
+ 0, $e
+ );
+ }
+ }
+ }
+ }
+ }
+ }
+
+ if (!$date) {
+ $date = null;
+ }
+
+ $this->data['lastBuildDate'] = $date;
+
+ return $this->data['lastBuildDate'];
+ }
+
+ /**
+ * Get the feed description
+ *
+ * @return string|null
+ */
+ public function getDescription()
+ {
+ if (array_key_exists('description', $this->data)) {
+ return $this->data['description'];
+ }
+
+ $description = null;
+
+ if ($this->getType() !== Reader\Reader::TYPE_RSS_10 &&
+ $this->getType() !== Reader\Reader::TYPE_RSS_090) {
+ $description = $this->xpath->evaluate('string(/rss/channel/description)');
+ } else {
+ $description = $this->xpath->evaluate('string(/rdf:RDF/rss:channel/rss:description)');
+ }
+
+ if (!$description && $this->getExtension('DublinCore') !== null) {
+ $description = $this->getExtension('DublinCore')->getDescription();
+ }
+
+ if (empty($description)) {
+ $description = $this->getExtension('Atom')->getDescription();
+ }
+
+ if (!$description) {
+ $description = null;
+ }
+
+ $this->data['description'] = $description;
+
+ return $this->data['description'];
+ }
+
+ /**
+ * Get the feed ID
+ *
+ * @return string|null
+ */
+ public function getId()
+ {
+ if (array_key_exists('id', $this->data)) {
+ return $this->data['id'];
+ }
+
+ $id = null;
+
+ if ($this->getType() !== Reader\Reader::TYPE_RSS_10 &&
+ $this->getType() !== Reader\Reader::TYPE_RSS_090) {
+ $id = $this->xpath->evaluate('string(/rss/channel/guid)');
+ }
+
+ if (!$id && $this->getExtension('DublinCore') !== null) {
+ $id = $this->getExtension('DublinCore')->getId();
+ }
+
+ if (empty($id)) {
+ $id = $this->getExtension('Atom')->getId();
+ }
+
+ if (!$id) {
+ if ($this->getLink()) {
+ $id = $this->getLink();
+ } elseif ($this->getTitle()) {
+ $id = $this->getTitle();
+ } else {
+ $id = null;
+ }
+ }
+
+ $this->data['id'] = $id;
+
+ return $this->data['id'];
+ }
+
+ /**
+ * Get the feed image data
+ *
+ * @return array|null
+ */
+ public function getImage()
+ {
+ if (array_key_exists('image', $this->data)) {
+ return $this->data['image'];
+ }
+
+ if ($this->getType() !== Reader\Reader::TYPE_RSS_10 &&
+ $this->getType() !== Reader\Reader::TYPE_RSS_090) {
+ $list = $this->xpath->query('/rss/channel/image');
+ $prefix = '/rss/channel/image[1]';
+ } else {
+ $list = $this->xpath->query('/rdf:RDF/rss:channel/rss:image');
+ $prefix = '/rdf:RDF/rss:channel/rss:image[1]';
+ }
+ if ($list->length > 0) {
+ $image = array();
+ $value = $this->xpath->evaluate('string(' . $prefix . '/url)');
+ if ($value) {
+ $image['uri'] = $value;
+ }
+ $value = $this->xpath->evaluate('string(' . $prefix . '/link)');
+ if ($value) {
+ $image['link'] = $value;
+ }
+ $value = $this->xpath->evaluate('string(' . $prefix . '/title)');
+ if ($value) {
+ $image['title'] = $value;
+ }
+ $value = $this->xpath->evaluate('string(' . $prefix . '/height)');
+ if ($value) {
+ $image['height'] = $value;
+ }
+ $value = $this->xpath->evaluate('string(' . $prefix . '/width)');
+ if ($value) {
+ $image['width'] = $value;
+ }
+ $value = $this->xpath->evaluate('string(' . $prefix . '/description)');
+ if ($value) {
+ $image['description'] = $value;
+ }
+ } else {
+ $image = null;
+ }
+
+ $this->data['image'] = $image;
+
+ return $this->data['image'];
+ }
+
+ /**
+ * Get the feed language
+ *
+ * @return string|null
+ */
+ public function getLanguage()
+ {
+ if (array_key_exists('language', $this->data)) {
+ return $this->data['language'];
+ }
+
+ $language = null;
+
+ if ($this->getType() !== Reader\Reader::TYPE_RSS_10 &&
+ $this->getType() !== Reader\Reader::TYPE_RSS_090) {
+ $language = $this->xpath->evaluate('string(/rss/channel/language)');
+ }
+
+ if (!$language && $this->getExtension('DublinCore') !== null) {
+ $language = $this->getExtension('DublinCore')->getLanguage();
+ }
+
+ if (empty($language)) {
+ $language = $this->getExtension('Atom')->getLanguage();
+ }
+
+ if (!$language) {
+ $language = $this->xpath->evaluate('string(//@xml:lang[1])');
+ }
+
+ if (!$language) {
+ $language = null;
+ }
+
+ $this->data['language'] = $language;
+
+ return $this->data['language'];
+ }
+
+ /**
+ * Get a link to the feed
+ *
+ * @return string|null
+ */
+ public function getLink()
+ {
+ if (array_key_exists('link', $this->data)) {
+ return $this->data['link'];
+ }
+
+ $link = null;
+
+ if ($this->getType() !== Reader\Reader::TYPE_RSS_10 &&
+ $this->getType() !== Reader\Reader::TYPE_RSS_090) {
+ $link = $this->xpath->evaluate('string(/rss/channel/link)');
+ } else {
+ $link = $this->xpath->evaluate('string(/rdf:RDF/rss:channel/rss:link)');
+ }
+
+ if (empty($link)) {
+ $link = $this->getExtension('Atom')->getLink();
+ }
+
+ if (!$link) {
+ $link = null;
+ }
+
+ $this->data['link'] = $link;
+
+ return $this->data['link'];
+ }
+
+ /**
+ * Get a link to the feed XML
+ *
+ * @return string|null
+ */
+ public function getFeedLink()
+ {
+ if (array_key_exists('feedlink', $this->data)) {
+ return $this->data['feedlink'];
+ }
+
+ $link = null;
+
+ $link = $this->getExtension('Atom')->getFeedLink();
+
+ if ($link === null || empty($link)) {
+ $link = $this->getOriginalSourceUri();
+ }
+
+ $this->data['feedlink'] = $link;
+
+ return $this->data['feedlink'];
+ }
+
+ /**
+ * Get the feed generator entry
+ *
+ * @return string|null
+ */
+ public function getGenerator()
+ {
+ if (array_key_exists('generator', $this->data)) {
+ return $this->data['generator'];
+ }
+
+ $generator = null;
+
+ if ($this->getType() !== Reader\Reader::TYPE_RSS_10 &&
+ $this->getType() !== Reader\Reader::TYPE_RSS_090) {
+ $generator = $this->xpath->evaluate('string(/rss/channel/generator)');
+ }
+
+ if (!$generator) {
+ if ($this->getType() !== Reader\Reader::TYPE_RSS_10 &&
+ $this->getType() !== Reader\Reader::TYPE_RSS_090) {
+ $generator = $this->xpath->evaluate('string(/rss/channel/atom:generator)');
+ } else {
+ $generator = $this->xpath->evaluate('string(/rdf:RDF/rss:channel/atom:generator)');
+ }
+ }
+
+ if (empty($generator)) {
+ $generator = $this->getExtension('Atom')->getGenerator();
+ }
+
+ if (!$generator) {
+ $generator = null;
+ }
+
+ $this->data['generator'] = $generator;
+
+ return $this->data['generator'];
+ }
+
+ /**
+ * Get the feed title
+ *
+ * @return string|null
+ */
+ public function getTitle()
+ {
+ if (array_key_exists('title', $this->data)) {
+ return $this->data['title'];
+ }
+
+ $title = null;
+
+ if ($this->getType() !== Reader\Reader::TYPE_RSS_10 &&
+ $this->getType() !== Reader\Reader::TYPE_RSS_090) {
+ $title = $this->xpath->evaluate('string(/rss/channel/title)');
+ } else {
+ $title = $this->xpath->evaluate('string(/rdf:RDF/rss:channel/rss:title)');
+ }
+
+ if (!$title && $this->getExtension('DublinCore') !== null) {
+ $title = $this->getExtension('DublinCore')->getTitle();
+ }
+
+ if (!$title) {
+ $title = $this->getExtension('Atom')->getTitle();
+ }
+
+ if (!$title) {
+ $title = null;
+ }
+
+ $this->data['title'] = $title;
+
+ return $this->data['title'];
+ }
+
+ /**
+ * Get an array of any supported Pusubhubbub endpoints
+ *
+ * @return array|null
+ */
+ public function getHubs()
+ {
+ if (array_key_exists('hubs', $this->data)) {
+ return $this->data['hubs'];
+ }
+
+ $hubs = $this->getExtension('Atom')->getHubs();
+
+ if (empty($hubs)) {
+ $hubs = null;
+ } else {
+ $hubs = array_unique($hubs);
+ }
+
+ $this->data['hubs'] = $hubs;
+
+ return $this->data['hubs'];
+ }
+
+ /**
+ * Get all categories
+ *
+ * @return Reader\Collection\Category
+ */
+ public function getCategories()
+ {
+ if (array_key_exists('categories', $this->data)) {
+ return $this->data['categories'];
+ }
+
+ if ($this->getType() !== Reader\Reader::TYPE_RSS_10 &&
+ $this->getType() !== Reader\Reader::TYPE_RSS_090) {
+ $list = $this->xpath->query('/rss/channel//category');
+ } else {
+ $list = $this->xpath->query('/rdf:RDF/rss:channel//rss:category');
+ }
+
+ if ($list->length) {
+ $categoryCollection = new Collection\Category;
+ foreach ($list as $category) {
+ $categoryCollection[] = array(
+ 'term' => $category->nodeValue,
+ 'scheme' => $category->getAttribute('domain'),
+ 'label' => $category->nodeValue,
+ );
+ }
+ } else {
+ $categoryCollection = $this->getExtension('DublinCore')->getCategories();
+ }
+
+ if (count($categoryCollection) == 0) {
+ $categoryCollection = $this->getExtension('Atom')->getCategories();
+ }
+
+ $this->data['categories'] = $categoryCollection;
+
+ return $this->data['categories'];
+ }
+
+ /**
+ * Read all entries to the internal entries array
+ *
+ */
+ protected function indexEntries()
+ {
+ if ($this->getType() !== Reader\Reader::TYPE_RSS_10 && $this->getType() !== Reader\Reader::TYPE_RSS_090) {
+ $entries = $this->xpath->evaluate('//item');
+ } else {
+ $entries = $this->xpath->evaluate('//rss:item');
+ }
+
+ foreach ($entries as $index => $entry) {
+ $this->entries[$index] = $entry;
+ }
+ }
+
+ /**
+ * Register the default namespaces for the current feed format
+ *
+ */
+ protected function registerNamespaces()
+ {
+ switch ($this->data['type']) {
+ case Reader\Reader::TYPE_RSS_10:
+ $this->xpath->registerNamespace('rdf', Reader\Reader::NAMESPACE_RDF);
+ $this->xpath->registerNamespace('rss', Reader\Reader::NAMESPACE_RSS_10);
+ break;
+
+ case Reader\Reader::TYPE_RSS_090:
+ $this->xpath->registerNamespace('rdf', Reader\Reader::NAMESPACE_RDF);
+ $this->xpath->registerNamespace('rss', Reader\Reader::NAMESPACE_RSS_090);
+ break;
+ }
+ }
+}