forked from iambus/youku-lixian
-
Notifications
You must be signed in to change notification settings - Fork 0
/
bilibili.py
74 lines (58 loc) · 1.64 KB
/
bilibili.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
import re
from common import *
from iask import iask_download_by_id
from youku import youku_download_by_id
from tudou import tudou_download_by_id
def get_srt_xml(id):
    """Download the comment XML for *id* and return it as decoded text.

    The document is requested from ``http://comment.bilibili.tv/dm,<id>``
    through ``get_html`` and the response is decoded as UTF-8.
    """
    comment_url = 'http://comment.bilibili.tv/dm,%s' % id
    raw_body = get_html(comment_url)
    return raw_body.decode('utf-8')
def parse_srt_p(p):
    """Parse the comma-separated ``p`` attribute of a single comment.

    The attribute must contain exactly eight fields, in this order:
    time, mode, font size, font color, publication time, pool, user id
    and history.

    Returns a ``(pool, mode, font_size, font_color)`` tuple.  ``pool``,
    ``mode`` and ``font_size`` are ints; ``font_color`` is ``'#'`` followed
    by the color as lowercase hex, zero-padded to at least six digits.

    Raises ``AssertionError`` if the field count, the mode or the pool is
    outside the accepted range, and ``ValueError`` if a numeric field
    cannot be converted.
    """
    parts = p.split(',')
    assert len(parts) == 8, parts
    raw_time, raw_mode, raw_size, raw_color = parts[:4]
    raw_pool = parts[5]

    # The timestamp is not part of the result, but it still has to be a
    # valid number, so convert it purely for validation.
    float(raw_time)

    # Known modes:
    #   1~3: scrolling
    #   4:   bottom
    #   5:   top
    #   6:   reverse?
    #   7:   position
    #   8:   advanced
    mode = int(raw_mode)
    assert mode >= 1 and mode <= 8

    # Known pools:
    #   0: normal
    #   1: srt
    #   2: special?
    pool = int(raw_pool)
    assert pool >= 0 and pool <= 2

    font_size = int(raw_size)
    font_color = '#%06x' % int(raw_color)
    return (pool, mode, font_size, font_color)
def parse_srt_xml(xml):
    """Check every ``<d p="...">`` comment in *xml*; conversion is unfinished.

    The ``p`` attribute of each matched element is passed to
    ``parse_srt_p``, which raises on malformed data.  The parsed values are
    not used yet: the function never returns and always finishes by raising
    ``NotImplementedError``.
    """
    for element in re.finditer(r'<d p="([^"]+)">(.*)</d>', xml):
        parse_srt_p(element.group(1))
    raise NotImplementedError()
def bilibili_download(url):
    """Download the video embedded in a bilibili.tv page plus its comment XML.

    The page at *url* is fetched with ``get_html``.  Its title is extracted,
    decoded as UTF-8 and passed through ``unescape_html`` and
    ``escape_file_path``.  The page's ``flashvars`` attribute
    (``<key>=<id>``) selects the downloader:

    * ``vid``  -> ``iask_download_by_id``
    * ``ykid`` -> ``youku_download_by_id``
    * ``uid``  -> ``tudou_download_by_id``

    After the download, the comment XML for the same id is written to
    ``<title>.xml`` as UTF-8.

    Raises ``AssertionError`` if *url* does not look like a bilibili video
    URL or the page has no ``flashvars``, and ``NotImplementedError`` (with
    the raw ``flashvars`` value) for an unrecognized key.
    """
    assert re.match(r'http://www.bilibili.tv/video/av(\d+)', url)
    html = get_html(url)

    title = r1(r'<h2 id="titles">([^<>]+)<a name="titles">', html).decode('utf-8')
    title = unescape_html(title)
    title = escape_file_path(title)

    flashvars = r1(r'flashvars="([^"]+)"', html)
    assert flashvars
    # Split only on the first '=' so the id part may itself contain '='.
    source, video_id = flashvars.split('=', 1)
    if source == 'vid':
        iask_download_by_id(video_id, title)
    elif source == 'ykid':
        youku_download_by_id(video_id, title)
    elif source == 'uid':
        tudou_download_by_id(video_id, title)
    else:
        raise NotImplementedError(flashvars)

    xml = get_srt_xml(video_id)
    # The payload written below is already-encoded UTF-8 bytes, so the file
    # must be opened in binary mode: text mode would translate newlines on
    # Windows and refuses bytes altogether on Python 3.
    with open(title + '.xml', 'wb') as x:
        x.write(xml.encode('utf-8'))
def main():
    """Command-line entry point: hand the bilibili downloader to ``script_main``."""
    site_name = 'bilibili'
    script_main(site_name, bilibili_download)
# Start the downloader only when this file is executed as a script, not
# when it is imported as a module.
if __name__ == '__main__':
    main()