-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathfeed.py
executable file
·78 lines (65 loc) · 1.97 KB
/
feed.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
#!/usr/bin/env python3
import argparse
import feedparser
import PyRSS2Gen
import toml
from datetime import datetime
from db import feeds_db
from time import mktime
parser = argparse.ArgumentParser(description='Make a feed from other feeds')
parser.add_argument(
'-c',
'--config-file',
help='Config file. default: feeds.toml',
default='feeds.toml'
)
args = parser.parse_args()
conf = toml.load(args.config_file)
fdb = feeds_db(conf['db_file'])
for name, url in conf['feeds'].items():
previous = fdb.get_previous(name)
print(f"fetching {name} ({url})...")
feedparser.USER_AGENT = conf['user_agent']
if previous:
feed = feedparser.parse(url, etag=previous["etag"], modified=previous["modified"])
else:
feed = feedparser.parse(url)
etag = feed.etag if hasattr(feed, 'etag') else None
modified = feed.modified if hasattr(feed, 'modified') else None
print(f"\t{feed.status} {etag} {modified}")
if feed.status == 304:
continue
if feed.status == 429:
continue
for entry in feed['entries']:
if "published_parsed" in entry:
entry_date = datetime.fromtimestamp(mktime(entry["published_parsed"]))
else:
entry_date = datetime.fromtimestamp(mktime(entry["updated_parsed"]))
fdb.insert_entry(
name,
entry['title'],
entry['description'],
entry['link'],
entry['guid'],
entry_date,
modified,
etag
)
items = []
for entry in fdb.get_entries():
items.append(PyRSS2Gen.RSSItem(
title=f"{entry['service']} :: {entry['title']}",
description=entry['description'],
link=entry['link'],
guid=entry['guid'],
pubDate=entry['pub_date']
))
rss = PyRSS2Gen.RSS2(
title=conf['title'],
link=conf['link'],
description=conf['description'],
lastBuildDate=datetime.now(),
items=items
)
rss.write_xml(open(conf['out_file'], 'w'))