-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathgen.py
executable file
·88 lines (73 loc) · 3.54 KB
/
gen.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
#!/usr/bin/env python
import os, re, sys, shutil
domain = "https://example.com/"
if sys.platform != 'win32':
if shutil.which('hoedown') is None:
print("Please, install 'hoedown'. https://github.com/hoedown/hoedown")
sys.exit()
else:
if shutil.which('pandoc') is None:
print("Please, install 'pandoc'. https://pandoc.org/installing.html")
sys.exit()
if os.path.exists('html'):
shutil.rmtree('html')
os.mkdir('html')
os.mkdir('html/tmp')
shutil.copytree('md/img', 'html/img')
shutil.copytree('theme/css', 'html/css')
shutil.copyfile('theme/_htaccess', 'html/.htaccess')
shutil.copyfile('theme/robots.txt', 'html/robots.txt')
# shutil.copyfile('theme/favicon.ico', 'html/favicon.ico')
if sys.platform != 'win32':
os.system('cd md && find . -iname "*.md" -type f -exec sh -c \'hoedown --tables "${0}" > "../html/tmp/${0%.md}.html"\' {} \;')
# os.system('cd md && find . -iname "*.md" -type f -exec sh -c \'pandoc "${0}" -o "../html/tmp/${0%.md}.html"\' {} \;')
else:
os.system('cd md && for %i in (*.md) do pandoc "%i" -o "../html/tmp/%~ni.html"')
ext = lambda s: re.sub('<[^<>]+>', '', s)
ul = "<ul>"
for f in sorted(os.listdir('html/tmp'), reverse=True):
if f not in ['index.html', '_header.html', '_aside.html', '_footer.html']:
if re.match("^\d{6}-.+?\.html$", f):
h1 = open('html/tmp/'+f, 'r').readline().strip()
ul += "<li><a href='%s'>%s</a></li>" % (f, ext(h1))
ul += "</ul>"
base = open('theme/base.html', 'r').read()
header = open('html/tmp/_header.html', 'r').read()
aside = open('html/tmp/_aside.html', 'r').read()
footer = open('html/tmp/_footer.html', 'r').read()
subtitle = re.search('<title>(.*)</title>', base).group(1)
base = base.replace('<nav></nav>', "<nav>%s</nav>" % ul)
base = base.replace('<header></header>', "<header>%s</header>" % header)
base = base.replace('<aside></aside>', "<aside>%s</aside>" % aside)
base = base.replace('<footer></footer>', "<footer>%s</footer>" % footer)
for f in os.listdir('html/tmp'):
if f not in ['_header.html', '_aside.html', '_footer.html']:
frag = open('html/tmp/'+f, 'r').read()
h1 = frag.split('\n', 1)[0]
desc, DESC_NUM = '', 350
for s in ext(frag).split('\n')[1:]:
s = s.strip()
if len(desc+s) > DESC_NUM:
break
desc += s
date = ''
if re.match("^\d{6}-.+?\.html$", f):
y, m, d = '20'+f[0:2], f[2:4], f[4:6]
date = '<time datetime="%s">%s</time>' % ('-'.join([y,m,d]), '.'.join([y,str(int(m)),str(int(d))]))
post = base.replace('<title>%s</title>' % subtitle, "<title>%s | %s</title>" % (ext(h1), subtitle))
post = post.replace('<meta name="description" content="">', '<meta name="description" content="%s">' % desc)
post = post.replace('<article></article>', "<article>%s%s</article>" % (frag, date))
open('html/'+f, 'w').write(post)
sitemapxml = '<?xml version="1.0" encoding="UTF-8"?>\n<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">'
for f in sorted(os.listdir('html'), reverse=True):
if f.endswith('.html'):
sitemapxml += '\n <url>\n <loc>' + domain
if re.match("^\d{6}-.+?\.html$", f):
lastmod = '-'.join(['20'+f[0:2], f[2:4], f[4:6]])
sitemapxml += f + '</loc>\n <lastmod>' + lastmod + '</lastmod>'
else:
sitemapxml += ('' if f == 'index.html' else f) + '</loc>'
sitemapxml += '\n </url>'
sitemapxml += '\n</urlset>'
open('html/sitemap.xml', 'w').write(sitemapxml)
shutil.rmtree('html/tmp')