<?php
namespace Zend\Feed\Reader\Extension\Atom;
use DateTime;
use DOMDocument;
use DOMElement;
use stdClass;
use Zend\Feed\Reader;
use Zend\Feed\Reader\Collection;
use Zend\Feed\Reader\Extension;
use Zend\Feed\Uri;
class Entry extends Extension\AbstractEntry {
/**
 * Get a single author of this entry by position.
 *
 * @param  int $index Zero-based position within the collection returned by getAuthors()
 * @return mixed|null The author stored at that position, or null when there is none
 */
public function getAuthor($index = 0)
{
    $allAuthors = $this->getAuthors();

    return isset($allAuthors[$index]) ? $allAuthors[$index] : null;
}
/**
 * Get all authors of this entry as a collection.
 *
 * atom:author elements below the entry are looked up first; when none are
 * found, every atom:author element in the document is used instead. Authors
 * for which no email, name or uri could be extracted are skipped. The
 * result is cached.
 *
 * @return Collection\Author
 */
public function getAuthors()
{
    if (array_key_exists('authors', $this->data)) {
        return $this->data['authors'];
    }

    $xpath = $this->getXpath();
    $nodes = $xpath->query($this->getXpathPrefix() . '//atom:author');
    if (!$nodes->length) {
        // Nothing on the entry itself: fall back to a document-wide search.
        $nodes = $xpath->query('//atom:author');
    }

    $found = [];
    foreach ($nodes as $node) {
        $parsed = $this->getAuthorFromElement($node);
        if (empty($parsed)) {
            continue;
        }
        $found[] = $parsed;
    }

    $this->data['authors'] = $found
        ? new Collection\Author(Reader\Reader::arrayUnique($found))
        : new Collection\Author();

    return $this->data['authors'];
}
/**
 * Get the content of this entry.
 *
 * Reads the first atom:content child of the entry. For the text and HTML
 * type values the node value is used as-is; for type "xhtml" the wrapping
 * xhtml:div is serialised and its wrapper and namespace prefix are removed
 * via collectXhtml(). When no usable content is found the entry description
 * is used instead. The result is trimmed and cached.
 *
 * @return string
 */
public function getContent()
{
    if (array_key_exists('content', $this->data)) {
        return $this->data['content'];
    }

    $content = null;

    $el = $this->getXpath()->query($this->getXpathPrefix() . '/atom:content');
    if ($el->length > 0) {
        $el = $el->item(0);
        $type = $el->getAttribute('type');
        switch ($type) {
            case '':
            case 'text':
            case 'text/plain':
            case 'html':
            case 'text/html':
                $content = $el->nodeValue;
                break;
            case 'xhtml':
                $this->getXpath()->registerNamespace('xhtml', 'http://www.w3.org/1999/xhtml');
                $xhtml = $this->getXpath()->query(
                    $this->getXpathPrefix() . '/atom:content/xhtml:div'
                )->item(0);
                if ($xhtml === null) {
                    // type="xhtml" without the wrapping div: importNode()
                    // cannot take null, so leave $content empty and let the
                    // description fallback below apply.
                    break;
                }
                $d = new DOMDocument('1.0', $this->getEncoding());
                // The "deep" flag is passed as an integer on PHP 7+ and as a
                // boolean on older versions; kept exactly as it was.
                $deep = version_compare(PHP_VERSION, '7', 'ge') ? 1 : true;
                $xhtmls = $d->importNode($xhtml, $deep);
                $d->appendChild($xhtmls);
                $content = $this->collectXhtml(
                    $d->saveXML(),
                    $d->lookupPrefix('http://www.w3.org/1999/xhtml')
                );
                break;
        }
    }

    if (!$content) {
        $content = $this->getDescription();
    }

    // Cast first so that a missing description (null) still yields '' without
    // handing null to trim().
    $this->data['content'] = trim((string) $content);

    return $this->data['content'];
}
/**
 * Strip the XML declaration, the wrapping div and the namespace prefix from
 * a serialised XHTML fragment.
 *
 * @param  string      $xhtml  Serialised document whose root element is the wrapping div
 * @param  string|null $prefix Namespace prefix used by the elements, without the colon; empty for none
 * @return string The markup that was inside the wrapping div, with element prefixes removed
 */
protected function collectXhtml($xhtml, $prefix)
{
    // Literal "prefix:" as it appears in the markup ('' when there is no prefix).
    $qualifier = empty($prefix) ? '' : $prefix . ':';
    // The prefix comes from the document, so it must not be read as regex syntax.
    $quoted = preg_quote($qualifier, '/');

    $wrapper = [
        // XML declaration plus the opening div tag. The match stops at the
        // tag's closing '>' so that text directly following it is preserved.
        '/<\?xml[^<]*>[^<]*<' . $quoted . 'div[^<>]*>/',
        // Closing div tag at the very end of the document.
        '/<\/' . $quoted . 'div>\s*$/',
    ];
    $xhtml = preg_replace($wrapper, '', $xhtml);

    if ($qualifier !== '') {
        // Drop the prefix from every remaining opening and closing tag.
        $xhtml = preg_replace('/(<[\/]?)' . $quoted . '([a-zA-Z]+)/', '$1$2', $xhtml);
    }

    return $xhtml;
}
/**
 * Get the creation date of this entry.
 *
 * Reads atom:created for Atom 0.3 documents and atom:published otherwise.
 * The result is cached.
 *
 * @return DateTime|null Null when the element is missing or empty
 * @throws \Exception When DateTime cannot parse the element's text
 */
public function getDateCreated()
{
    if (array_key_exists('datecreated', $this->data)) {
        return $this->data['datecreated'];
    }

    $isAtom03 = $this->getAtomType() === Reader\Reader::TYPE_ATOM_03;
    $suffix   = $isAtom03 ? '/atom:created)' : '/atom:published)';

    $raw = $this->getXpath()->evaluate('string(' . $this->getXpathPrefix() . $suffix);

    $this->data['datecreated'] = $raw ? new DateTime($raw) : null;

    return $this->data['datecreated'];
}
/**
 * Get the last modification date of this entry.
 *
 * Reads atom:modified for Atom 0.3 documents and atom:updated otherwise.
 * The result is cached.
 *
 * @return DateTime|null Null when the element is missing or empty
 * @throws \Exception When DateTime cannot parse the element's text
 */
public function getDateModified()
{
    if (array_key_exists('datemodified', $this->data)) {
        return $this->data['datemodified'];
    }

    $isAtom03 = $this->getAtomType() === Reader\Reader::TYPE_ATOM_03;
    $suffix   = $isAtom03 ? '/atom:modified)' : '/atom:updated)';

    $raw = $this->getXpath()->evaluate('string(' . $this->getXpathPrefix() . $suffix);

    $this->data['datemodified'] = $raw ? new DateTime($raw) : null;

    return $this->data['datemodified'];
}
/**
 * Get the description of this entry, taken from its atom:summary element.
 *
 * The result is cached.
 *
 * @return string|null Null when the summary is missing or evaluates to an empty value
 */
public function getDescription()
{
    if (!array_key_exists('description', $this->data)) {
        $summary = $this->getXpath()->evaluate(
            'string(' . $this->getXpathPrefix() . '/atom:summary)'
        );
        $this->data['description'] = $summary ?: null;
    }

    return $this->data['description'];
}
/**
 * Get the enclosure of this entry.
 *
 * Uses the first atom:link child with rel="enclosure". The result is cached.
 *
 * @return stdClass|null Object with the properties url, length and type
 *                       (copied from the href, length and type attributes),
 *                       or null when the entry has no enclosure link
 */
public function getEnclosure()
{
    if (array_key_exists('enclosure', $this->data)) {
        return $this->data['enclosure'];
    }

    $candidates = $this->getXpath()->query(
        $this->getXpathPrefix() . '/atom:link[@rel="enclosure"]'
    );

    $result = null;
    if ($candidates->length > 0) {
        $first = $candidates->item(0);

        $result         = new stdClass();
        $result->url    = $first->getAttribute('href');
        $result->length = $first->getAttribute('length');
        $result->type   = $first->getAttribute('type');
    }

    $this->data['enclosure'] = $result;

    return $this->data['enclosure'];
}
/**
 * Get an identifier for this entry.
 *
 * Uses the atom:id element; when that is empty the permalink is used, then
 * the title, and finally null. The result is cached.
 *
 * @return string|null
 */
public function getId()
{
    if (array_key_exists('id', $this->data)) {
        return $this->data['id'];
    }

    $identifier = $this->getXpath()->evaluate(
        'string(' . $this->getXpathPrefix() . '/atom:id)'
    );

    if (!$identifier) {
        // Fallback chain: permalink first, then title, otherwise nothing.
        $identifier = $this->getPermalink() ?: ($this->getTitle() ?: null);
    }

    $this->data['id'] = $identifier;

    return $this->data['id'];
}
/**
 * Get the base URL declared through xml:base.
 *
 * The xml:base attribute at the entry's XPath prefix is tried first, then
 * the first xml:base attribute found anywhere in the document. The result
 * is cached.
 *
 * @return string|null Null when no xml:base value is found
 */
public function getBaseUrl()
{
    if (array_key_exists('baseUrl', $this->data)) {
        return $this->data['baseUrl'];
    }

    $base = $this->getXpath()->evaluate(
        'string(' . $this->getXpathPrefix() . '/@xml:base[1]' . ')'
    );
    if (!$base) {
        $base = $this->getXpath()->evaluate('string(//@xml:base[1])');
    }

    $this->data['baseUrl'] = $base ?: null;

    return $this->data['baseUrl'];
}
/**
 * Get a single link of this entry by position.
 *
 * @param  int $index Zero-based position within the list returned by getLinks()
 * @return string|null The link at that position, or null when it is not set
 */
public function getLink($index = 0)
{
    // getLinks() fills and returns the cached list.
    $allLinks = $this->getLinks();

    return isset($allLinks[$index]) ? $allLinks[$index] : null;
}
/**
 * Get all links of this entry.
 *
 * Collects the href attribute of every atom:link below the entry that has
 * rel="alternate" or no rel attribute at all, passing each value through
 * absolutiseUri(). The result is cached.
 *
 * @return array List of link values as returned by absolutiseUri()
 */
public function getLinks()
{
    if (array_key_exists('links', $this->data)) {
        return $this->data['links'];
    }

    $hrefAttributes = $this->getXpath()->query(
        $this->getXpathPrefix() . '//atom:link[@rel="alternate"]/@href' . '|'
        . $this->getXpathPrefix() . '//atom:link[not(@rel)]/@href'
    );

    $resolved = [];
    foreach ($hrefAttributes as $href) {
        $resolved[] = $this->absolutiseUri($href->value);
    }

    $this->data['links'] = $resolved;

    return $this->data['links'];
}
/**
 * Get the permalink of this entry, which is its first link.
 *
 * @return string|null Null when the entry has no link at position 0
 */
public function getPermalink()
{
    $firstLink = $this->getLink(0);

    return $firstLink;
}
/**
 * Get the title of this entry, taken from its atom:title element.
 *
 * The result is cached.
 *
 * @return string|null Null when the title is missing or evaluates to an empty value
 */
public function getTitle()
{
    if (!array_key_exists('title', $this->data)) {
        $text = $this->getXpath()->evaluate(
            'string(' . $this->getXpathPrefix() . '/atom:title)'
        );
        $this->data['title'] = $text ?: null;
    }

    return $this->data['title'];
}
/**
 * Get the number of comments announced for this entry.
 *
 * Registers the "thread10" namespace prefix on the XPath object and reads
 * the thread10:count attribute of the first atom:link with rel="replies"
 * that carries one. The result is cached.
 *
 * @return string|null The attribute value, or null when no such attribute exists
 */
public function getCommentCount()
{
    if (array_key_exists('commentcount', $this->data)) {
        return $this->data['commentcount'];
    }

    $this->getXpath()->registerNamespace('thread10', 'http://purl.org/syndication/thread/1.0');

    $countAttributes = $this->getXpath()->query(
        $this->getXpathPrefix() . '//atom:link[@rel="replies"]/@thread10:count'
    );

    $this->data['commentcount'] = $countAttributes->length
        ? $countAttributes->item(0)->value
        : null;

    return $this->data['commentcount'];
}
/**
 * Get the link to the HTML page holding this entry's comments.
 *
 * Uses the href of the first atom:link with rel="replies" and
 * type="text/html", passed through absolutiseUri(). The result is cached.
 *
 * @return string|null Null when no such link exists
 */
public function getCommentLink()
{
    if (array_key_exists('commentlink', $this->data)) {
        return $this->data['commentlink'];
    }

    $hrefs = $this->getXpath()->query(
        $this->getXpathPrefix() . '//atom:link[@rel="replies" and @type="text/html"]/@href'
    );

    $resolved = null;
    if ($hrefs->length) {
        $resolved = $this->absolutiseUri($hrefs->item(0)->value);
    }

    $this->data['commentlink'] = $resolved;

    return $this->data['commentlink'];
}
/**
 * Get the link to a feed of this entry's comments.
 *
 * Uses the href of the first atom:link with rel="replies" and
 * type="application/{$type}+xml", passed through absolutiseUri().
 *
 * The result is cached separately for each $type, so asking for one feed
 * type never returns the link that was cached for another.
 *
 * @param  string $type Feed flavour inserted into the media type, e.g. "atom" or "rss".
 *                      It is concatenated into the XPath expression unescaped,
 *                      so it must not contain quote characters.
 * @return string|null Null when no such link exists
 */
public function getCommentFeedLink($type = 'atom')
{
    $cacheKey = 'commentfeedlink_' . $type;
    if (array_key_exists($cacheKey, $this->data)) {
        return $this->data[$cacheKey];
    }

    $link = null;

    $list = $this->getXpath()->query(
        $this->getXpathPrefix() . '//atom:link[@rel="replies" and @type="application/' . $type . '+xml"]/@href'
    );

    if ($list->length) {
        $link = $list->item(0)->value;
        $link = $this->absolutiseUri($link);
    }

    $this->data[$cacheKey] = $link;

    return $this->data[$cacheKey];
}
/**
 * Get all categories of this entry.
 *
 * For Atom 1.0 documents the atom:category elements below the entry are
 * used. Otherwise the Atom 1.0 namespace is registered under the "atom10"
 * prefix and atom10:category elements are used. Each category is stored as
 * an array with the keys term, scheme and label, copied from the attributes
 * of the same name.
 *
 * The result is cached, including the empty collection, so the XPath query
 * runs at most once per entry.
 *
 * @return Collection\Category
 */
public function getCategories()
{
    if (array_key_exists('categories', $this->data)) {
        return $this->data['categories'];
    }

    if ($this->getAtomType() == Reader\Reader::TYPE_ATOM_10) {
        $list = $this->getXpath()->query($this->getXpathPrefix() . '//atom:category');
    } else {
        $this->getXpath()->registerNamespace('atom10', Reader\Reader::NAMESPACE_ATOM_10);
        $list = $this->getXpath()->query($this->getXpathPrefix() . '//atom10:category');
    }

    $categoryCollection = new Collection\Category();
    foreach ($list as $category) {
        $categoryCollection[] = [
            'term'   => $category->getAttribute('term'),
            'scheme' => $category->getAttribute('scheme'),
            'label'  => $category->getAttribute('label'),
        ];
    }

    $this->data['categories'] = $categoryCollection;

    return $this->data['categories'];
}
/**
 * Get the source feed metadata of this entry.
 *
 * Only looked up when getType() reports Atom 1.0; the first atom:source
 * child of the entry is then wrapped in a Source object. The result is
 * cached.
 *
 * @return Reader\Feed\Atom\Source|null Null when the type is not Atom 1.0
 *                                      or the entry has no atom:source element
 */
public function getSource()
{
    if (array_key_exists('source', $this->data)) {
        return $this->data['source'];
    }

    if ($this->getType() != Reader\Reader::TYPE_ATOM_10) {
        $this->data['source'] = null;

        return $this->data['source'];
    }

    $sourceNodes = $this->getXpath()->query($this->getXpathPrefix() . '/atom:source[1]');

    $this->data['source'] = $sourceNodes->length
        ? new Reader\Feed\Atom\Source($sourceNodes->item(0), $this->getXpathPrefix())
        : null;

    return $this->data['source'];
}
/**
 * Turn a relative link into an absolute one using the base URL.
 *
 * Absolute links are returned unchanged, and so are relative links when no
 * base URL is known. Otherwise the base URL is prepended to the link by
 * plain string concatenation, and null is returned if the combined value
 * is not a valid URI.
 *
 * @param  string $link
 * @return string|null
 */
protected function absolutiseUri($link)
{
    if (Uri::factory($link)->isAbsolute()) {
        return $link;
    }

    $base = $this->getBaseUrl();
    if ($base === null) {
        return $link;
    }

    $combined = $base . $link;

    return Uri::factory($combined)->isValid() ? $combined : null;
}
/**
 * Extract author details from an author element.
 *
 * For each of email, name and uri, the first descendant element with that
 * tag name is read; its value is kept only when it is a non-empty string.
 *
 * @param  DOMElement $element
 * @return array|null Array with any of the keys email, name and uri, or
 *                    null when none of them yielded a value
 */
protected function getAuthorFromElement(DOMElement $element)
{
    $details = [];

    foreach (['email', 'name', 'uri'] as $field) {
        $matches = $element->getElementsByTagName($field);
        if ($matches->length && strlen($matches->item(0)->nodeValue) > 0) {
            $details[$field] = $matches->item(0)->nodeValue;
        }
    }

    return empty($details) ? null : $details;
}
/**
 * Register the "atom" namespace prefix on the XPath object.
 *
 * The Atom 0.3 namespace is used when getAtomType() reports Atom 0.3; in
 * every other case the Atom 1.0 namespace is used.
 *
 * @return void
 */
protected function registerNamespaces()
{
    $namespace = ($this->getAtomType() == Reader\Reader::TYPE_ATOM_03)
        ? Reader\Reader::NAMESPACE_ATOM_03
        : Reader\Reader::NAMESPACE_ATOM_10;

    $this->getXpath()->registerNamespace('atom', $namespace);
}
/**
 * Detect which Atom version the underlying document uses.
 *
 * A version matches when its namespace is the document's default namespace
 * or has a prefix bound to it. Atom 0.3 is checked before Atom 1.0.
 *
 * @return string|null One of the Reader TYPE_ATOM_* constants, or null when
 *                     neither namespace is present
 */
protected function getAtomType()
{
    $document = $this->getDomDocument();

    $knownVersions = [
        [Reader\Reader::NAMESPACE_ATOM_03, Reader\Reader::TYPE_ATOM_03],
        [Reader\Reader::NAMESPACE_ATOM_10, Reader\Reader::TYPE_ATOM_10],
    ];

    foreach ($knownVersions as $version) {
        list($namespace, $type) = $version;

        $boundPrefix = $document->lookupPrefix($namespace);
        if ($document->isDefaultNamespace($namespace) || !empty($boundPrefix)) {
            return $type;
        }
    }

    return null;
}
}