[bus.git] / busui / owa / owa_news.php
--- a/busui/owa/owa_news.php
+++ b/busui/owa/owa_news.php
@@ -1,1 +1,162 @@
-
+<?php

+

+//

+// Open Web Analytics - An Open Source Web Analytics Framework

+//

+// Copyright 2006 Peter Adams. All rights reserved.

+//

+// Licensed under GPL v2.0 http://www.gnu.org/copyleft/gpl.html

+//

+// Unless required by applicable law or agreed to in writing, software

+// distributed under the License is distributed on an "AS IS" BASIS,

+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

+// See the License for the specific language governing permissions and

+// limitations under the License.

+//

+// $Id$

+//

+

+require_once(OWA_BASE_DIR.'/owa_env.php');

+require_once(OWA_INCLUDE_DIR.'/lastRSS.php');

+require_once(OWA_BASE_DIR.'/owa_httpRequest.php');

+

+/**

+ * Grabs the OWA News Feed from the OWA Blog.

+ * 

+ * @author      Peter Adams <peter@openwebanalytics.com>

+ * @copyright   Copyright &copy; 2006 Peter Adams <peter@openwebanalytics.com>

+ * @license     http://www.gnu.org/copyleft/gpl.html GPL v2.0

+ * @category    owa

+ * @package     owa

+ * @version		$Revision$	      

+ * @since		owa 1.0.0

+ */

+

+class owa_news extends lastRSS {

+	

+	/**

+	 * Configuration

+	 *

+	 * @var array

+	 */

+	var $config;

+	

+	/**

+	 * Error handler

+	 *

+	 * @var object

+	 */

+	var $e;

+	

+	var $crawler;

+	

+	function owa_news() {

+	

+		$c = &owa_coreAPI::configSingleton();

+		$this->config = $c->fetch('base');

+		$this->e = &owa_coreAPI::errorSingleton();

+		$this->crawler = new owa_http;

+		$this->crawler->read_timeout = 20;

+		$this->cache_dir = '';

+		$this->date_format = "F j, Y";

+		$this->CDATA = 'content';

+		$this->items_limit = 3;

+		return;	

+	}

+	

+	/**

+	 * This is a redefined Parse function that uses Snoopy to fetch

+	 * the file instead of fopen.

+	 *

+	 * @param unknown_type $rss_url

+	 * @return unknown

+	 */

+	function Parse ($rss_url) {

+		// Open and load RSS file

+		

+		$this->crawler->getRequest($rss_url);

+		$rss_content = $this->crawler->response;

+		

+		if (!empty($rss_content)) {

+			

+			// Parse document encoding

+			$result['encoding'] = $this->my_preg_match("'encoding=[\'\"](.*?)[\'\"]'si", $rss_content);

+			// if document codepage is specified, use it

+			if ($result['encoding'] != '')

+				{ $this->rsscp = $result['encoding']; } // This is used in my_preg_match()

+			// otherwise use the default codepage

+			else

+				{ $this->rsscp = $this->default_cp; } // This is used in my_preg_match()

+

+			// Parse CHANNEL info

+			preg_match("'<channel.*?>(.*?)</channel>'si", $rss_content, $out_channel);

+			foreach($this->channeltags as $channeltag)

+			{

+				$temp = $this->my_preg_match("'<$channeltag.*?>(.*?)</$channeltag>'si", $out_channel[1]);

+				if ($temp != '') $result[$channeltag] = $temp; // Set only if not empty

+			}

+			// If date_format is specified and lastBuildDate is valid

+			if ($this->date_format != '' && ($timestamp = strtotime($result['lastBuildDate'])) !==-1) {

+						// convert lastBuildDate to specified date format

+						$result['lastBuildDate'] = date($this->date_format, $timestamp);

+			}

+

+			// Parse TEXTINPUT info

+			preg_match("'<textinput(|[^>]*[^/])>(.*?)</textinput>'si", $rss_content, $out_textinfo);

+				// This a little strange regexp means:

+				// Look for tag <textinput> with or without any attributes, but skip truncated version <textinput /> (it's not beggining tag)

+			if (isset($out_textinfo[2])) {

+				foreach($this->textinputtags as $textinputtag) {

+					$temp = $this->my_preg_match("'<$textinputtag.*?>(.*?)</$textinputtag>'si", $out_textinfo[2]);

+					if ($temp != '') $result['textinput_'.$textinputtag] = $temp; // Set only if not empty

+				}

+			}

+			// Parse IMAGE info

+			preg_match("'<image.*?>(.*?)</image>'si", $rss_content, $out_imageinfo);

+			if (isset($out_imageinfo[1])) {

+				foreach($this->imagetags as $imagetag) {

+					$temp = $this->my_preg_match("'<$imagetag.*?>(.*?)</$imagetag>'si", $out_imageinfo[1]);

+					if ($temp != '') $result['image_'.$imagetag] = $temp; // Set only if not empty

+				}

+			}

+			// Parse ITEMS

+			preg_match_all("'<item(| .*?)>(.*?)</item>'si", $rss_content, $items);

+			$rss_items = $items[2];

+			$i = 0;

+			$result['items'] = array(); // create array even if there are no items

+			foreach($rss_items as $rss_item) {

+				// If number of items is lower then limit: Parse one item

+				if ($i < $this->items_limit || $this->items_limit == 0) {

+					foreach($this->itemtags as $itemtag) {

+						$temp = $this->my_preg_match("'<$itemtag.*?>(.*?)</$itemtag>'si", $rss_item);

+						if ($temp != '') $result['items'][$i][$itemtag] = $temp; // Set only if not empty

+					}

+					// Strip HTML tags and other bullshit from DESCRIPTION

+					if ($this->stripHTML && $result['items'][$i]['description'])

+						$result['items'][$i]['description'] = strip_tags($this->unhtmlentities(strip_tags($result['items'][$i]['description'])));

+					// Strip HTML tags and other bullshit from TITLE

+					if ($this->stripHTML && $result['items'][$i]['title'])

+						$result['items'][$i]['title'] = strip_tags($this->unhtmlentities(strip_tags($result['items'][$i]['title'])));

+					// If date_format is specified and pubDate is valid

+					if ($this->date_format != '' && ($timestamp = strtotime($result['items'][$i]['pubDate'])) !==-1) {

+						// convert pubDate to specified date format

+						$result['items'][$i]['pubDate'] = date($this->date_format, $timestamp);

+					}

+					// Item counter

+					$i++;

+				}

+			}

+

+			$result['items_count'] = $i;

+			return $result;

+		}

+		else // Error in opening return False

+		{

+			$this->e->notice('no rss content found at: '.$rss_url);

+			return False;

+		}

+	}

+	

+}

+

+?>