newsbeuter - scrape mangahere latest to rss
This commit is contained in:
parent
6b12568ea2
commit
e9dbaad0d7
44
local/bin/mangahere_rss.py
Executable file
44
local/bin/mangahere_rss.py
Executable file
@ -0,0 +1,44 @@
|
||||
#!/usr/bin/python
|
||||
|
||||
from pyquery import PyQuery as pq
|
||||
from pprint import pprint
|
||||
import sys
|
||||
|
||||
ITEM = """
|
||||
<item>
|
||||
<title>{title}</title>
|
||||
<description>{description}</description>
|
||||
<link>{link}</link>
|
||||
</item>"""
|
||||
|
||||
class Release(object):
|
||||
|
||||
def __init__(self, title, link):
|
||||
self.title = title
|
||||
self.link = link
|
||||
|
||||
def __str__(self):
|
||||
return ITEM.format(
|
||||
title=self.title,
|
||||
description="New release: {}".format(self.title),
|
||||
link=self.link)
|
||||
|
||||
def __contains__(self, string):
|
||||
return string in self.title or string in self.link
|
||||
|
||||
latest = pq(url="http://www.mangahere.co/latest/")
|
||||
|
||||
print("""\
|
||||
<?xml version="1.0" encoding="UTF-8" ?>
|
||||
<rss version="2.0">
|
||||
<channel>""")
|
||||
|
||||
for item in map(pq, latest("dd > a")):
|
||||
release = Release(item.attr("title"), item.attr("href"))
|
||||
if any(word in release for word in sys.argv):
|
||||
print(str(release))
|
||||
|
||||
print("""
|
||||
</channel>
|
||||
</rss>
|
||||
""")
|
Loading…
Reference in New Issue
Block a user