Sunday, April 19, 2009

rss_fetch 2.0

<?php

class rss_parser {
var $update_interval = 60;
var $data_directory = "/home/vol8/000space.com/space_3287474/vn4000php.co.cc/htdocs";
var $rss_url;
var $num_to_show;
var $offset;
var $do_update;
var $tags = array();
var $content;
var $rss = array();

var $feed_title;
var $feed_link;
var $feed_description;
var $feed_url;

var $my_html;

function rss_parser($url, $numtoshow = 10, $html = "", $update = FALSE, $offset = 1)
{
$this->rss_url = $url;
$this->num_to_show = $numtoshow;
$this->do_update = $update;
$this->my_html = preg_replace("/(#{.*?):(.*?})/", "\\1__\\2", $html);
$this->offset = --$offset;

$this->content = $this->fetch_feed();
$this->parse_feed();
$this->show();
}


/* string */
function fetch_feed()
{
$url_parts = parse_url($this->rss_url);

$filename = $url_parts['host'] . str_replace("/", ",", $url_parts['path']) . "_" . @$url_parts['query'];
if(file_exists($this->data_directory . "/$filename")) {
$last = filemtime($this->data_directory . "/$filename");
$create = 0;
if(time() - $last > $this->update_interval * 60 || $this->update_interval == 0) {
$update = 1;
} else {
$update = 0;
}
} else {
$create = 1;
$update = 1;
}

if($create == 1 || ($this->do_update == TRUE && $update == 1)) {
$fp = @fsockopen($url_parts['host'], 80, $errno, $errstr, 5);
if (!$fp) {
echo "Couldn't open rss feed {$this->feed_url} in {$_SERVER['PHP_SELF']}<br />\n";
return;
}

fputs($fp, "GET {$this->rss_url} HTTP/1.0\r\n"
."Host: " . $url_parts['host'] . "\r\n"
."User-Agent: vn4000's RSS Reader 0.1\r\n"
."Connection: Close\r\n\r\n");

while(!feof($fp)) {
$rss_data .= @fread($fp, 1024);
}

list(, $rss_data) = explode("\r\n\r\n", $rss_data, 2);

$output = @fopen($this->data_directory . "/$filename", "w+b");
if(!$output) {
return $rss_data;
} else {
flock($output, LOCK_EX);
fputs($output, $rss_data);
flock($output, LOCK_UN);
fclose($output);
}
} //update

return file_get_contents($this->data_directory . "/$filename");
}

/* void */
function parse_feed()
{
preg_match("/<title>(.*?)<\/title>/", $this->content, $title);
$this->feed_title = @$title[1];

preg_match("/<link>(.*?)<\/link>/", $this->content, $link);
$this->feed_link = @$link[1];

preg_match("/<description>(.*?)<\/description>/", $this->content, $description);
$this->feed_description = @$description[1];

preg_match("/<url>(.*?)<\/url>/", $this->content, $enclosure);
$this->feed_url = @$url[1];

preg_match_all("/<item[^>]*>(.*?)<\/item>/s", $this->content, $items);
if (sizeof($items[0]) == 0) {
echo "No item elements found in rss feed.<br />\n";
}

for($i = 0; $i < sizeof($items[0]); ++$i) {
preg_match_all("/(?:<([\w:]*)[^>]*>\s*(?:<!\[CDATA\[)?(.*?)(?:]]>)?\s*<\/\\1>)+?/si", preg_replace("/<item[^>]*>/", "", $items[0][$i]), $elements);
for($j = 0; $j < sizeof($elements[0]); ++$j) {
$elements[1][$j] = str_replace(":", "__", $elements[1][$j]);
$this->rss[$i][$elements[1][$j]] = trim($this->unhtmlentities($elements[2][$j]));
}
}
}


/* void */
function show()
{
if($this->my_html == "") {
$this->show_html();
} else {
$this->show_user_html();
}
}

function show_html()
{
$show = (sizeof($this->rss) > $this->num_to_show ? $this->num_to_show : sizeof($this->rss));
for($i = $this->offset; $i < $this->offset + $show; ++$i) {
echo "- <a href=\"{$this->rss[$i]['link']}\" target=\"_new\">{$this->rss[$i]['title']}</a><br />\n";
}
}

function show_user_html()
{
$show = (sizeof($this->rss) > $this->num_to_show + $this->offset ? $this->num_to_show : sizeof($this->rss));
$show = ($this->offset + $this->num_to_show > sizeof($this->rss) ? sizeof($this->rss) - $this->offset : $this->num_to_show);
for($i = $this->offset; $i < $this->offset + $show; ++$i) {
extract($this->rss[$i]);
$item = preg_replace("/#\{([^}]+)}/e", "$\\1", $this->my_html);
echo $item;
}
}

function unhtmlentities($string)
{
$trans_tbl = get_html_translation_table(HTML_ENTITIES);
$trans_tbl = array_flip($trans_tbl);
return strtr($string, $trans_tbl);
}

} // end class


?>