Current oav website

This commit is contained in:
Charlie Root
2023-03-20 12:18:38 +01:00
commit a096ce07cf
3270 changed files with 261778 additions and 0 deletions

View File

@ -0,0 +1,270 @@
<?php
/**
* @class feedParser
* @brief Feed parser
*
* This class can read RSS 1.0, RSS 2.0, Atom 0.3 and Atom 1.0 feeds. Works with
* {@link feedReader}
*
* @package Clearbricks
* @subpackage Feeds
*
* @copyright Olivier Meunier & Association Dotclear
* @copyright GPL-2.0-only
*/
class feedParser
{
public $feed_type; ///< string Feed type
public $title; ///< string Feed title
public $link; ///< string Feed link
public $description; ///< string Feed description
public $pubdate; ///< string Feed publication date
public $generator; ///< string Feed generator
public $items = []; ///< array Feed items
protected $xml; ///< SimpleXMLElement Feed XML content
/**
* Constructor.
*
* Takes some <var>$data</var> as input. Returns false if data is
* not a valid XML stream. If everything's fine, feed is parsed and items
* are in {@link $items} property.
*
* @param string $data XML stream
*/
public function __construct($data)
{
$this->xml = @simplexml_load_string($data);
if (!$this->xml) {
return false;
}
if (preg_match('/<rdf:RDF/', $data)) {
$this->parseRSSRDF();
} elseif (preg_match('/<rss/', $data)) {
$this->parseRSS();
} elseif (preg_match('!www.w3.org/2005/Atom!', $data)) {
$this->parseAtom10();
} else {
$this->parseAtom03();
}
unset($data);
unset($this->xml);
}
/**
* RSS 1.0 parser.
*/
protected function parseRSSRDF()
{
$this->feed_type = 'rss 1.0 (rdf)';
$this->title = (string) $this->xml->channel->title;
$this->link = (string) $this->xml->channel->link;
$this->description = (string) $this->xml->channel->description;
$this->pubdate = (string) $this->xml->channel->children('http://purl.org/dc/elements/1.1/')->date;
# Feed generator agent
$g = $this->xml->channel->children('http://webns.net/mvcb/')->generatorAgent;
if ($g) {
$g = $g->attributes('http://www.w3.org/1999/02/22-rdf-syntax-ns#');
$this->generator = (string) $g['resource'];
}
if (empty($this->xml->item)) {
return;
}
foreach ($this->xml->item as $i) {
$item = new stdClass();
$item->title = (string) $i->title;
$item->link = (string) $i->link;
$item->creator = (string) $i->children('http://purl.org/dc/elements/1.1/')->creator;
$item->description = (string) $i->description;
$item->content = (string) $i->children('http://purl.org/rss/1.0/modules/content/')->encoded;
$item->subject = $this->nodes2array($i->children('http://purl.org/dc/elements/1.1/')->subject);
$item->pubdate = (string) $i->children('http://purl.org/dc/elements/1.1/')->date;
$item->TS = strtotime($item->pubdate);
$item->guid = (string) $item->link;
if (!empty($i->attributes('http://www.w3.org/1999/02/22-rdf-syntax-ns#')->about)) {
$item->guid = (string) $i->attributes('http://www.w3.org/1999/02/22-rdf-syntax-ns#')->about;
}
$this->items[] = $item;
}
}
/**
* RSS 2.0 parser
*/
protected function parseRSS()
{
$this->feed_type = 'rss ' . $this->xml['version'];
$this->title = (string) $this->xml->channel->title;
$this->link = (string) $this->xml->channel->link;
$this->description = (string) $this->xml->channel->description;
$this->pubdate = (string) $this->xml->channel->pubDate;
$this->generator = (string) $this->xml->channel->generator;
if (empty($this->xml->channel->item)) {
return;
}
foreach ($this->xml->channel->item as $i) {
$item = new stdClass();
$item->title = (string) $i->title;
$item->link = (string) $i->link;
$item->creator = (string) $i->children('http://purl.org/dc/elements/1.1/')->creator;
$item->description = (string) $i->description;
$item->content = (string) $i->children('http://purl.org/rss/1.0/modules/content/')->encoded;
$item->subject = array_merge(
$this->nodes2array($i->children('http://purl.org/dc/elements/1.1/')->subject),
$this->nodes2array($i->category)
);
$item->pubdate = (string) $i->pubDate;
if (!$item->pubdate && !empty($i->children('http://purl.org/dc/elements/1.1/')->date)) {
$item->pubdate = (string) $i->children('http://purl.org/dc/elements/1.1/')->date;
}
$item->TS = strtotime($item->pubdate);
$item->guid = (string) $item->link;
if (!empty($i->guid)) {
$item->guid = (string) $i->guid;
}
$this->items[] = $item;
}
}
/**
* Atom 0.3 parser
*/
protected function parseAtom03()
{
$this->feed_type = 'atom 0.3';
$this->title = (string) $this->xml->title;
$this->description = (string) $this->xml->subtitle;
$this->pubdate = (string) $this->xml->modified;
$this->generator = (string) $this->xml->generator;
foreach ($this->xml->link as $link) {
if ($link['rel'] == 'alternate' &&
($link['type'] == 'text/html' || $link['type'] == 'application/xhtml+xml')) {
$this->link = (string) $link['href'];
break;
}
}
if (empty($this->xml->entry)) {
return;
}
foreach ($this->xml->entry as $i) {
$item = new stdClass();
foreach ($i->link as $link) {
if ($link['rel'] == 'alternate' &&
($link['type'] == 'text/html' || $link['type'] == 'application/xhtml+xml')) {
$item->link = (string) $link['href'];
break;
}
$item->link = (string) $link['href'];
}
$item->title = (string) $i->title;
$item->creator = (string) $i->author->name;
$item->description = (string) $i->summary;
$item->content = (string) $i->content;
$item->subject = $this->nodes2array($i->children('http://purl.org/dc/elements/1.1/')->subject);
$item->pubdate = (string) $i->modified;
$item->TS = strtotime($item->pubdate);
$this->items[] = $item;
}
}
/**
* Atom 1.0 parser
*/
protected function parseAtom10()
{
$this->feed_type = 'atom 1.0';
$this->title = (string) $this->xml->title;
$this->description = (string) $this->xml->subtitle;
$this->pubdate = (string) $this->xml->updated;
$this->generator = (string) $this->xml->generator;
foreach ($this->xml->link as $link) {
if ($link['rel'] == 'alternate' &&
($link['type'] == 'text/html' || $link['type'] == 'application/xhtml+xml')) {
$this->link = (string) $link['href'];
break;
}
}
if (empty($this->xml->entry)) {
return;
}
foreach ($this->xml->entry as $i) {
$item = new stdClass();
foreach ($i->link as $link) {
if ($link['rel'] == 'alternate' &&
($link['type'] == 'text/html' || $link['type'] == 'application/xhtml+xml')) {
$item->link = (string) $link['href'];
break;
}
$item->link = (string) $link['href'];
}
$item->title = (string) $i->title;
$item->creator = (string) $i->author->name;
$item->description = (string) $i->summary;
$item->content = (string) $i->content;
$item->subject = $this->nodes2array($i->children('http://purl.org/dc/elements/1.1/')->subject);
$item->pubdate = !empty($i->published) ? (string) $i->published : (string) $i->updated;
$item->TS = strtotime($item->pubdate);
$this->items[] = $item;
}
}
/**
* SimpleXML to array
*
* Converts a SimpleXMLElement to an array.
*
* @param SimpleXMLElement $node SimpleXML Node
* @return array
*/
protected function nodes2array(&$node)
{
if (empty($node)) {
return [];
}
$res = [];
foreach ($node as $v) {
$res[] = (string) $v;
}
return $res;
}
}

View File

@ -0,0 +1,257 @@
<?php
/**
* @class feedReader
* @brief Feed Reader
*
* Features:
*
* - Reads RSS 1.0 (rdf), RSS 2.0 and Atom feeds.
* - HTTP cache negociation support
* - Cache TTL.
*
* @package Clearbricks
* @subpackage Feeds
*
* @copyright Olivier Meunier & Association Dotclear
* @copyright GPL-2.0-only
*/
/** @cond ONCE */
if (class_exists('netHttp')) {
/** @endcond */
class feedReader extends netHttp
{
protected $user_agent = 'Clearbricks Feed Reader/0.2';
protected $timeout = 5;
protected $validators = null; ///< array HTTP Cache validators
protected $cache_dir = null; ///< string Cache directory path
protected $cache_file_prefix = 'cbfeed'; ///< string Cache file prefix
protected $cache_ttl = '-30 minutes'; ///< string Cache TTL
/**
* Constructor.
*
* Does nothing. See {@link parse()} method for URL handling.
*/
public function __construct()
{
parent::__construct('');
}
/**
* Parse Feed
*
* Returns a new feedParser instance for given URL or false if source URL is
* not a valid feed.
*
* @uses feedParser
*
* @param string $url Feed URL
* @return feedParser|false
*/
public function parse($url)
{
$this->validators = [];
if ($this->cache_dir) {
return $this->withCache($url);
} else {
if (!$this->getFeed($url)) {
return false;
}
if ($this->getStatus() != '200') {
return false;
}
return new feedParser($this->getContent());
}
}
/**
* Quick Parse
*
* This static method returns a new {@link feedParser} instance for given URL. If a
* <var>$cache_dir</var> is specified, cache will be activated.
*
* @param string $url Feed URL
* @param string $cache_dir Cache directory
* @return feedParser|false
*/
public static function quickParse($url, $cache_dir = null)
{
$parser = new self();
if ($cache_dir) {
$parser->setCacheDir($cache_dir);
}
return $parser->parse($url);
}
/**
* Set Cache Directory
*
* Returns true and sets {@link $cache_dir} property if <var>$dir</var> is
* a writable directory. Otherwise, returns false.
*
* @param string $dir Cache directory
* @return boolean
*/
public function setCacheDir($dir)
{
$this->cache_dir = null;
if (!empty($dir) && is_dir($dir) && is_writeable($dir)) {
$this->cache_dir = $dir;
return true;
}
return false;
}
/**
* Set Cache TTL
*
* Sets cache TTL. <var>$str</var> is a interval readable by strtotime
* (-3 minutes, -2 hours, etc.)
*
* @param string $str TTL
*/
public function setCacheTTL($str)
{
$str = trim($str);
if (!empty($str)) {
if (substr($str, 0, 1) != '-') {
$str = '-' . $str;
}
$this->cache_ttl = $str;
}
}
/**
* Feed Content
*
* Returns feed content for given URL.
*
* @param string $url Feed URL
* @return string
*/
protected function getFeed($url)
{
if (!self::readURL($url, $ssl, $host, $port, $path, $user, $pass)) {
return false;
}
$this->setHost($host, $port);
$this->useSSL($ssl);
$this->setAuthorization($user, $pass);
return $this->get($path);
}
/**
* Cache content
*
* Returns feedParser object from cache if present or write it to cache and
* returns result.
*
* @param string $url Feed URL
* @return feedParser
*/
protected function withCache($url)
{
$url_md5 = md5($url);
$cached_file = sprintf('%s/%s/%s/%s/%s.php',
$this->cache_dir,
$this->cache_file_prefix,
substr($url_md5, 0, 2),
substr($url_md5, 2, 2),
$url_md5
);
$may_use_cached = false;
if (@file_exists($cached_file)) {
$may_use_cached = true;
$ts = @filemtime($cached_file);
if ($ts > strtotime($this->cache_ttl)) {
# Direct cache
return unserialize(file_get_contents($cached_file));
}
$this->setValidator('IfModifiedSince', $ts);
}
if (!$this->getFeed($url)) {
if ($may_use_cached) {
# connection failed - fetched from cache
return unserialize(file_get_contents($cached_file));
}
return false;
}
switch ($this->getStatus()) {
case '304':
@files::touch($cached_file);
return unserialize(file_get_contents($cached_file));
case '200':
if ($feed = new feedParser($this->getContent())) {
try {
files::makeDir(dirname($cached_file), true);
} catch (Exception $e) {
return $feed;
}
if (($fp = @fopen($cached_file, 'wb'))) {
fwrite($fp, serialize($feed));
fclose($fp);
files::inheritChmod($cached_file);
}
return $feed;
}
}
return false;
}
/**
* Build request
*
* Adds HTTP cache headers to common headers.
*
* {@inheritdoc}
*/
protected function buildRequest()
{
$headers = parent::buildRequest();
# Cache validators
if (!empty($this->validators)) {
if (isset($this->validators['IfModifiedSince'])) {
$headers[] = 'If-Modified-Since: ' . $this->validators['IfModifiedSince'];
}
if (isset($this->validators['IfNoneMatch'])) {
if (is_array($this->validators['IfNoneMatch'])) {
$etags = implode(',', $this->validators['IfNoneMatch']);
} else {
$etags = $this->validators['IfNoneMatch'];
}
$headers[] = '';
}
}
return $headers;
}
private function setValidator($key, $value)
{
if ($key == 'IfModifiedSince') {
$value = gmdate('D, d M Y H:i:s', $value) . ' GMT';
}
$this->validators[$key] = $value;
}
}
/** @cond ONCE */
}
/** @endcond */