summaryrefslogtreecommitdiffstats
path: root/sca-cpp/tags/native-sca-1.0.incubating-M3/samples/AlertAggregator/sample.alerter/RSSCheckerImpl.py
diff options
context:
space:
mode:
Diffstat (limited to 'sca-cpp/tags/native-sca-1.0.incubating-M3/samples/AlertAggregator/sample.alerter/RSSCheckerImpl.py')
-rw-r--r--sca-cpp/tags/native-sca-1.0.incubating-M3/samples/AlertAggregator/sample.alerter/RSSCheckerImpl.py76
1 files changed, 76 insertions, 0 deletions
diff --git a/sca-cpp/tags/native-sca-1.0.incubating-M3/samples/AlertAggregator/sample.alerter/RSSCheckerImpl.py b/sca-cpp/tags/native-sca-1.0.incubating-M3/samples/AlertAggregator/sample.alerter/RSSCheckerImpl.py
new file mode 100644
index 0000000000..2e320c0b22
--- /dev/null
+++ b/sca-cpp/tags/native-sca-1.0.incubating-M3/samples/AlertAggregator/sample.alerter/RSSCheckerImpl.py
@@ -0,0 +1,76 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+#
+
+import feedparser, datetime, xml.etree.ElementTree, re
+
+def getNewAlerts(rssaddress, lastchecktimestamp):
+
+ print "RSSCheckerImpl.getNewAlerts() called", rssaddress, lastchecktimestamp
+
+ #Get and parse the RSS/Atom data
+ d = feedparser.parse(rssaddress)
+
+ newalertsxml = "<alerts xmlns=\"http://tuscany.apache.org/samples/alerter\">\n"
+
+ lastcheckdate = datetime.datetime.min
+ if lastchecktimestamp:
+ lastcheckdate = datetime.datetime.strptime(lastchecktimestamp, "%Y-%m-%dT%H:%M:%S")
+
+ defaultTitle = d.feed.get('title', 'RSS feed article')
+ defaultLink = d.feed.get('link', 'http://incubator.apache.org/tuscany')
+ defaultSummary = 'No information provided'
+
+ for entry in d.entries:
+
+ if entry.has_key('date'):
+ (year, month, day, hour, minute, second, millisecond, microsecond, tzinfo) = entry.date_parsed
+ entrydate = datetime.datetime(year, month, day, hour, minute, second)
+ else:
+ entrydate = datetime.datetime.now()
+
+
+ if (entrydate > lastcheckdate) :
+
+ newalertsxml += "<alert><title>" + stripXML(entry.get('title', defaultTitle)) + "</title>\n"
+ newalertsxml += "<address>" + entry.get('link', defaultLink) + "</address>\n"
+ newalertsxml += "<date>" + entrydate.isoformat() + "</date>\n"
+ newalertsxml += "<summary>" + stripXML(entry.get('description', defaultSummary)) + "</summary></alert>\n"
+ newalertsxml += "</alerts>"
+
+ return xml.etree.ElementTree.XML(newalertsxml)
+
+def stripXML(data):
+ elementsRemoved = re.sub("<.*?>","", data)
+ entitiesRemoved = re.sub("&.*?;", " ", elementsRemoved)
+ asciiEncoded = entitiesRemoved.encode('ASCII', 'replace')
+ returnData = asciiEncoded.replace('&', 'and')
+ return returnData
+
+
+# Testing
+# print xml.etree.ElementTree.tostring(getNewAlerts("http://www.engadget.com/rss.xml", "2007-02-07T17:11:14"))
+#
+#
+# today = datetime.datetime.now().replace(hour=0, minute=0, second=0, microsecond=0)
+# data2 = getNewAlerts("http://newsrss.bbc.co.uk/rss/newsonline_uk_edition/front_page/rss.xml", today.isoformat())
+# print xml.etree.ElementTree.tostring(data2)
+#
+# print "1st call returned", len(data.findall("./{http://tuscany.apache.org/samples/alerter}alert")), "elements"
+# print "2nd call returned", len(data2.findall("./{http://tuscany.apache.org/samples/alerter}alert")), "elements"
+
+