# Description : Simple RSS Reader
# ============================================================================
-from os.path import isfile
-from os.path import isdir
+from os.path import isfile, isdir
from shutil import rmtree
from os import mkdir, remove
import pickle
import time
import urllib2
from BeautifulSoup import BeautifulSoup
-from urlparse import urlparse
+from urlparse import urljoin
#CONFIGDIR="/home/user/.feedingit/"
def getId(string):
return md5.new(string).hexdigest()
-def getProxy():
- import gconf
- if gconf.client_get_default().get_bool('/system/http_proxy/use_http_proxy'):
- port = gconf.client_get_default().get_int('/system/http_proxy/port')
- http = gconf.client_get_default().get_string('/system/http_proxy/host')
- proxy = proxy = urllib2.ProxyHandler( {"http":"http://%s:%s/"% (http,port)} )
- return (True, proxy)
- return (False, None)
+#def getProxy():
+# import gconf
+# if gconf.client_get_default().get_bool('/system/http_proxy/use_http_proxy'):
+# port = gconf.client_get_default().get_int('/system/http_proxy/port')
+# http = gconf.client_get_default().get_string('/system/http_proxy/host')
+# proxy = proxy = urllib2.ProxyHandler( {"http":"http://%s:%s/"% (http,port)} )
+# return (True, proxy)
+# return (False, None)
# Enable proxy support for images and ArchivedArticles
-(proxy_support, proxy) = getProxy()
-if proxy_support:
- opener = urllib2.build_opener(proxy)
- urllib2.install_opener(opener)
+#(proxy_support, proxy) = getProxy()
+#if proxy_support:
+# opener = urllib2.build_opener(proxy)
+# urllib2.install_opener(opener)
# Entry = {"title":XXX, "content":XXX, "date":XXX, "link":XXX, images = [] }
filename = self.configdir+key+".d/"+getId(url)
if not isfile(filename):
try:
- if url.startswith("http"):
- f = urllib2.urlopen(url)
- else:
- f = urllib2.urlopen(baseurl+"/"+url)
+ #if url.startswith("http"):
+ # f = urllib2.urlopen(url)
+ #else:
+ f = urllib2.urlopen(urljoin(baseurl,url))
outf = open(filename, "w")
outf.write(f.read())
f.close()
outf.close()
except:
- print "Could not download" + url
+ print "Could not download " + url
+ else:
+ open(filename,"a").close() # "Touch" the file
if filename in self.images:
self.images[filename] += 1
else:
tmpIds = []
for entry in tmp["entries"]:
(dateTuple, date) = self.extractDate(entry)
+ try:
+ entry["title"]
+ except:
+ entry["title"] = "No Title"
+ try:
+ entry["link"]
+ except:
+ entry["link"] = ""
tmpEntry = {"title":entry["title"], "content":self.extractContent(entry),
"date":date, "dateTuple":dateTuple, "link":entry["link"], "images":[] }
id = self.generateUniqueId(tmpEntry)
if not id in self.ids:
soup = BeautifulSoup(self.getArticle(tmpEntry)) #tmpEntry["content"])
images = soup('img')
- baseurl = ''.join(urlparse(tmpEntry["link"])[:-1])
+ baseurl = tmpEntry["link"]
if imageCache:
for img in images:
try:
img['src']=filename
tmpEntry["images"].append(filename)
except:
- print "Error downloading image %s" %img
+ print "Error downloading image %s" % img
tmpEntry["contentLink"] = configdir+self.uniqueId+".d/"+id+".html"
file = open(tmpEntry["contentLink"], "w")
file.write(soup.prettify())
self.readItems[id] = False
if self.readItems[id]==False:
tmpUnread = tmpUnread + 1
+ keys = self.readItems.keys()
+ for id in keys:
+ if not id in self.ids:
+ del self.readItems[id]
del tmp
self.countUnread = tmpUnread
self.updateTime = time.asctime()
f.close()
soup = BeautifulSoup(html)
images = soup('img')
- baseurl = ''.join(urlparse(entry["link"])[:-1])
+ baseurl = entry["link"]
for img in images:
filename = self.imageHandler.addImage(self.uniqueId, baseurl, img['src'])
- #filename = configdir+self.uniqueId+".d/"+getId(img['src'])
- #if not isfile(filename):
- # try:
- # if img['src'].startswith("http"):
- # f = urllib2.urlopen(img['src'])
- # else:
- # f = urllib2.urlopen(baseurl+"/"+img['src'])
- # #print baseurl+"/"+img['src']
- # print filename
- # outf = open(filename, "w")
- # outf.write(f.read())
- # f.close()
- # outf.close()
- # except:
- # print "Could not download" + img['src']
img['src']=filename
entry["images"].append(filename)
entry["contentLink"] = configdir+self.uniqueId+".d/"+id+".html"
self.setEntryUnread(id)
#except:
# pass
- currentTime = time.time()
- expiry = float(expiryTime) * 3600
- if currentTime - entry["time"] > expiry:
- if self.isEntryRead(id):
- self.removeEntry(id)
- else:
- if currentTime - entry["time"] > 2*expiry:
- self.removeEntry(id)
+ #currentTime = time.time()
+ #expiry = float(expiryTime) * 3600
+ #if currentTime - entry["time"] > expiry:
+ # if self.isEntryRead(id):
+ # self.removeEntry(id)
+ # else:
+ # if currentTime - entry["time"] > 2*expiry:
+ # self.removeEntry(id)
self.updateTime = time.asctime()
self.saveFeed(configdir)
+
+ def purgeReadArticles(self):
+ ids = self.getIds()
+ for id in ids:
+ entry = self.entries[id]
+ if self.isEntryRead(id):
+ self.removeEntry(id)
+
+ def removeArticle(self, id):
+ """Remove the article with the given id by delegating to removeEntry()."""
+ self.removeEntry(id)
def getArticle(self, index):
self.setEntryRead(index)
file.close()
else:
self.listOfFeeds = {getId("Slashdot"):{"title":"Slashdot", "url":"http://rss.slashdot.org/Slashdot/slashdot", "unread":0, "updateTime":"Never"}, }
- if isfile(self.configdir+"images.pickle"):
+ try:
file = open(self.configdir+"images.pickle")
self.imageHandler = pickle.load(file)
file.close()
- else:
+ except:
self.imageHandler = ImageHandler(self.configdir)
if self.listOfFeeds.has_key("font"):
del self.listOfFeeds["font"]
self.sortedKeys.remove("font")
self.sortedKeys.sort(key=lambda obj: self.getFeedTitle(obj))
list = self.sortedKeys[:]
- self.closeCurrentlyDisplayedFeed()
+ #self.closeCurrentlyDisplayedFeed()
def addArchivedArticle(self, key, index):
feed = self.getFeed(key)
feed.editFeed(url)
def getFeed(self, key):
- feed = self.loadFeed(key)
- feed.reloadUnread(self.configdir)
+ try:
+ feed = self.loadFeed(key)
+ feed.reloadUnread(self.configdir)
+ except:
+ # If the feed file gets corrupted, we need to reset the feed.
+ import dbus
+ bus = dbus.SessionBus()
+ remote_object = bus.get_object("org.freedesktop.Notifications", # Connection name
+ "/org/freedesktop/Notifications" # Object's path
+ )
+ iface = dbus.Interface(remote_object, 'org.freedesktop.Notifications')
+ iface.SystemNoteInfoprint("Error opening feed %s, it has been reset." % self.getFeedTitle(key))
+ if isdir(self.configdir+key+".d/"):
+ rmtree(self.configdir+key+".d/")
+ feed = self.loadFeed(key)
return feed
def getFeedUpdateTime(self, key):
index2 = (index+1)%len(self.sortedKeys)
self.sortedKeys[index] = self.sortedKeys[index2]
self.sortedKeys[index2] = key
-
- def setCurrentlyDisplayedFeed(self, key):
- self.currentlyDisplayedFeed = key
- def closeCurrentlyDisplayedFeed(self):
- self.currentlyDisplayedFeed = False
- def getCurrentlyDisplayedFeed(self):
- return self.currentlyDisplayedFeed
if __name__ == "__main__":
listing = Listing('/home/user/.feedingit/')
#list.reverse()
for key in list:
if key.startswith('d8'):
- print listing.getFeedUpdateTime(key)
\ No newline at end of file
+ print listing.getFeedUpdateTime(key)