My static website generator using poole https://www.xythobuz.de

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596
  1. # -*- coding: utf-8 -*-
  2. import re
  3. import itertools
  4. import email.utils
  5. import os.path
  6. import time
  7. import codecs
  8. from datetime import datetime
# Language assigned to page text that precedes any "lang:" marker; pages in
# this language get the "EN" suffix in the compatibility redirect tables.
DEFAULT_LANG = "en"
# Absolute site root that is prefixed to page URLs in the sitemap and RSS feed.
BASE_URL = "https://www.xythobuz.de"
  11. # -----------------------------------------------------------------------------
  12. # sub page helper macro
  13. # -----------------------------------------------------------------------------
  14. def backToParent():
  15. url = page.get("parent", "") + ".html"
  16. posts = [p for p in pages if p.url == url]
  17. if len(posts) > 0:
  18. p = posts[0]
  19. print '<span class="listdesc">[...back to ' + p.title + ' overview](' + p.url + ')</span>'
  20. # -----------------------------------------------------------------------------
  21. # table helper macro
  22. # -----------------------------------------------------------------------------
  23. def tableHelper(style, header, content):
  24. print "<table>"
  25. if (header != None) and (len(header) == len(style)):
  26. print "<tr>"
  27. for h in header:
  28. print "<th>" + h + "</th>"
  29. print "</tr>"
  30. for ci in range(0, len(content)):
  31. if len(content[ci]) != len(style):
  32. # invalid call of table helper!
  33. continue
  34. print "<tr>"
  35. for i in range(0, len(style)):
  36. s = style[i]
  37. td_style = ""
  38. if "monospaced" in s:
  39. td_style += " font-family: monospace;"
  40. if "align-last-right" in s:
  41. if ci == (len(content) - 1):
  42. td_style += " text-align: right;"
  43. else:
  44. if "align-center" in s:
  45. td_style += " text-align: center;"
  46. elif "align-right" in s:
  47. td_style += " text-align: right;"
  48. elif "align-center" in s:
  49. td_style += " text-align: center;"
  50. td_args = ""
  51. if td_style != "":
  52. td_args = " style=\"" + td_style + "\""
  53. print "<td" + td_args + ">"
  54. if isinstance(content[ci][i], tuple):
  55. text, link = content[ci][i]
  56. print "<a href=\"" + link + "\">" + text + "</a>"
  57. else:
  58. text = content[ci][i]
  59. print text
  60. print "</td>"
  61. print "</tr>"
  62. print "</table>"
  63. # -----------------------------------------------------------------------------
  64. # menu helper macro
  65. # -----------------------------------------------------------------------------
  66. def githubCommitBadge(p, showInline = False):
  67. ret = ""
  68. if p.get("github", "") != "":
  69. link = p.get("git", p.github)
  70. linkParts = p.github.split("/")
  71. if len(linkParts) >= 5:
  72. ret += "<a href=\"" + link + "\"><img "
  73. if showInline:
  74. ret += "style =\"vertical-align: top;\" "
  75. ret += "src=\"https://img.shields.io/github/last-commit/"
  76. ret += linkParts[3] + "/" + linkParts[4]
  77. ret += ".svg?logo=git&style=flat\" /></a>"
  78. return ret
  79. def printMenuItem(p, yearsAsHeading = False, showDateSpan = False, showOnlyStartDate = False, nicelyFormatFullDate = False, lastyear = "0", lang = "", showLastCommit = True):
  80. title = p.title
  81. if lang != "":
  82. if p.get("title_" + lang, "") != "":
  83. title = p.get("title_" + lang, "")
  84. if p.title == "Blog":
  85. title = p.post
  86. year = p.get("date", "")[0:4]
  87. if year != lastyear:
  88. lastyear = year
  89. if yearsAsHeading:
  90. print "\n\n#### %s\n" % (year)
  91. dateto = ""
  92. if p.get("date", "" != ""):
  93. year = p.get("date", "")[0:4]
  94. if showOnlyStartDate:
  95. dateto = " (%s)" % (year)
  96. if p.get("update", "") != "" and p.get("update", "")[0:4] != year:
  97. if showDateSpan:
  98. dateto = " (%s - %s)" % (year, p.get("update", "")[0:4])
  99. if nicelyFormatFullDate:
  100. dateto = " - " + datetime.strptime(p.get("update", p.date), "%Y-%m-%d").strftime("%B %d, %Y")
  101. print " * **[%s](%s)**%s" % (title, p.url, dateto)
  102. if p.get("description", "") != "":
  103. description = p.get("description", "")
  104. if lang != "":
  105. if p.get("description_" + lang, "") != "":
  106. description = p.get("description_" + lang, "")
  107. print "<br><span class=\"listdesc\">" + description + "</span>"
  108. if showLastCommit:
  109. link = githubCommitBadge(p)
  110. if len(link) > 0:
  111. print "<br>" + link
  112. return lastyear
  113. def printRecentMenu(count = 5):
  114. posts = [p for p in pages if "date" in p]
  115. posts.sort(key=lambda p: p.get("update", p.get("date")), reverse=True)
  116. for p in posts[0:count]:
  117. printMenuItem(p, False, False, False, True, "0", "", False)
  118. def printBlogMenu():
  119. posts = [p for p in pages if "post" in p]
  120. posts.sort(key=lambda p: p.get("date", "9999-01-01"), reverse=True)
  121. lastyear = "0"
  122. for p in posts:
  123. lastyear = printMenuItem(p, True, False, False, True, lastyear)
  124. def printProjectsMenu():
  125. # prints all pages with parent 'projects' or 'stuff'.
  126. # first the ones without date, sorted by position.
  127. # then afterwards those with date, split by year.
  128. # also supports blog posts with parent.
  129. enpages = [p for p in pages if p.lang == "en"]
  130. dpages = [p for p in enpages if p.get("date", "") == ""]
  131. mpages = [p for p in dpages if any(x in p.get("parent", "") for x in [ 'projects', 'stuff' ])]
  132. mpages.sort(key=lambda p: [int(p.get("position", "999"))])
  133. for p in mpages:
  134. printMenuItem(p)
  135. dpages = [p for p in enpages if p.get("date", "") != ""]
  136. mpages = [p for p in dpages if any(x in p.get("parent", "") for x in [ 'projects', 'stuff' ])]
  137. mpages.sort(key=lambda p: [p.get("date", "9999-01-01")], reverse = True)
  138. lastyear = "0"
  139. for p in mpages:
  140. lastyear = printMenuItem(p, True, True, False, False, lastyear)
  141. def print3DPrintingMenu():
  142. mpages = [p for p in pages if p.get("parent", "") == "3d-printing" and p.lang == "en"]
  143. mpages.sort(key=lambda p: int(p["position"]))
  144. for p in mpages:
  145. printMenuItem(p, False, True, True)
  146. def printSmarthomeMenu():
  147. mpages = [p for p in pages if p.get("parent", "") == "smarthome" and p.lang == "en"]
  148. mpages.sort(key=lambda p: int(p["position"]))
  149. for p in mpages:
  150. printMenuItem(p, False, True, True)
  151. def printQuadcopterMenu():
  152. mpages = [p for p in pages if p.get("parent", "") == "quadcopters" and p.lang == "en"]
  153. mpages.sort(key=lambda p: int(p["position"]))
  154. for p in mpages:
  155. printMenuItem(p, False, True, True)
  156. def printQuadcopterRelatedMenu():
  157. mpages = [p for p in pages if p.get("show_in_quadcopters", "false") == "true"]
  158. mpages.sort(key=lambda p: [p.get("date", "9999-01-01")], reverse = True)
  159. for p in mpages:
  160. printMenuItem(p, False, True, True)
  161. def printRobotMenuEnglish():
  162. mpages = [p for p in pages if p.get("parent", "") == "xyrobot" and p.lang == "en"]
  163. mpages.sort(key=lambda p: int(p["position"]))
  164. for p in mpages:
  165. printMenuItem(p)
  166. def printRobotMenuDeutsch():
  167. mpages = [p for p in pages if p.get("parent", "") == "xyrobot" and p.lang == "de"]
  168. mpages.sort(key=lambda p: int(p["position"]))
  169. for p in mpages:
  170. printMenuItem(p, False, False, False, False, "0", "de")
  171. # -----------------------------------------------------------------------------
  172. # lightgallery helper macro
  173. # -----------------------------------------------------------------------------
  174. # call this macro like this
  175. # lightgallery([
  176. # [ "image-link", "description" ],
  177. # [ "image-link", "thumbnail-link", "description" ],
  178. # [ "youtube-link", "thumbnail-link", "description" ],
  179. # [ "video-link", "mime", "thumbnail-link", "image-link", "description" ]
  180. # ])
  181. def lightgallery(links):
  182. videos = [l for l in links if len(l) == 5]
  183. v_i = -1
  184. for v in videos:
  185. link, mime, thumb, poster, alt = v
  186. v_i += 1
  187. print '<div style="display:none;" id="video' + str(v_i) + '">'
  188. print '<video class="lg-video-object lg-html5" controls preload="none">'
  189. print '<source src="' + link + '" type="' + mime + '">'
  190. print 'Your browser does not support HTML5 video.'
  191. print '</video>'
  192. print '</div>'
  193. print '<div class="lightgallery">'
  194. v_i = -1
  195. for l in links:
  196. if (len(l) == 3) or (len(l) == 2):
  197. link = img = alt = ""
  198. if len(l) == 3:
  199. link, img, alt = l
  200. else:
  201. link, alt = l
  202. x = link.rfind('.')
  203. img = link[:x] + '_small' + link[x:]
  204. print '<div class="border" data-src="' + link + '"><a href="' + link + '"><img class="pic" src="' + img + '" alt="' + alt + '"></a></div>'
  205. elif len(l) == 5:
  206. v_i += 1
  207. link, mime, thumb, poster, alt = videos[v_i]
  208. print '<div class="border" data-poster="' + poster + '" data-sub-html="' + alt + '" data-html="#video' + str(v_i) + '"><a href="' + link + '"><img class="pic" src="' + thumb + '"></a></div>'
  209. else:
  210. raise NameError('Invalid number of arguments for lightgallery')
  211. print '</div>'
  212. # -----------------------------------------------------------------------------
  213. # github helper macros
  214. # -----------------------------------------------------------------------------
  215. import urllib, json
  216. def restRequest(url):
  217. response = urllib.urlopen(url)
  218. data = json.loads(response.read())
  219. return data
  220. def restReleases(user, repo):
  221. s = "https://api.github.com/repos/"
  222. s += user
  223. s += "/"
  224. s += repo
  225. s += "/releases"
  226. return restRequest(s)
  227. def printLatestRelease(user, repo):
  228. repo_url = "https://github.com/" + user + "/" + repo
  229. print("<div class=\"releasecard\">")
  230. print("Release builds for " + repo + " are <a href=\"" + repo_url + "/releases\">available on GitHub</a>.<br>\n")
  231. releases = restReleases(user, repo)
  232. if len(releases) <= 0:
  233. print("No release has been published on GitHub yet.")
  234. print("</div>")
  235. return
  236. releases.sort(key=lambda x: x["published_at"], reverse=True)
  237. r = releases[0]
  238. release_url = r["html_url"]
  239. print("Latest release of <a href=\"" + repo_url + "\">" + repo + "</a>, at the time of this writing: <a href=\"" + release_url + "\">" + r["name"] + "</a> (" + datetime.strptime(r["published_at"], "%Y-%m-%dT%H:%M:%SZ").strftime("%Y-%m-%d %H:%M:%S") + ")\n")
  240. if len(r["assets"]) <= 0:
  241. print("<br>No release assets have been published on GitHub for that.")
  242. print("</div>")
  243. return
  244. print("<ul>")
  245. print("Release Assets:")
  246. for a in r["assets"]:
  247. size = int(a["size"])
  248. ss = " "
  249. if size >= (1024 * 1024):
  250. ss += "(%.1f MiB)" % (size / (1024.0 * 1024.0))
  251. elif size >= 1024:
  252. ss += "(%d KiB)" % (size // 1024)
  253. else:
  254. ss += "(%d Byte)" % (size)
  255. print("<li><a href=\"" + a["browser_download_url"] + "\">" + a["name"] + "</a>" + ss)
  256. print("</ul></div>")
  257. # -----------------------------------------------------------------------------
  258. # preconvert hooks
  259. # -----------------------------------------------------------------------------
  260. # -----------------------------------------------------------------------------
  261. # multi language support
  262. # -----------------------------------------------------------------------------
  263. def hook_preconvert_anotherlang():
  264. MKD_PATT = r'\.(?:md|mkd|mdown|markdown)$'
  265. _re_lang = re.compile(r'^[\s+]?lang[\s+]?[:=]((?:.|\n )*)', re.MULTILINE)
  266. vpages = [] # Set of all virtual pages
  267. for p in pages:
  268. current_lang = DEFAULT_LANG # Default language
  269. langs = [] # List of languages for the current page
  270. page_vpages = {} # Set of virtual pages for the current page
  271. text_lang = re.split(_re_lang, p.source)
  272. text_grouped = dict(zip([current_lang,] + \
  273. [lang.strip() for lang in text_lang[1::2]], \
  274. text_lang[::2]))
  275. for lang, text in text_grouped.iteritems():
  276. spath = p.fname.split(os.path.sep)
  277. langs.append(lang)
  278. if lang == "en":
  279. filename = re.sub(MKD_PATT, "%s\g<0>" % "", p.fname).split(os.path.sep)[-1]
  280. else:
  281. filename = re.sub(MKD_PATT, ".%s\g<0>" % lang, p.fname).split(os.path.sep)[-1]
  282. vp = Page(filename, virtual=text)
  283. # Copy real page attributes to the virtual page
  284. for attr in p:
  285. if not vp.has_key(attr):
  286. vp[attr] = p[attr]
  287. # Define a title in the proper language
  288. vp["title"] = p["title_%s" % lang] \
  289. if p.has_key("title_%s" % lang) \
  290. else p["title"]
  291. # Keep track of the current lang of the virtual page
  292. vp["lang"] = lang
  293. # Fix post name if exists
  294. if vp.has_key("post"):
  295. if lang == "en":
  296. vp["post"] = vp["post"][:]
  297. else:
  298. vp["post"] = vp["post"][:-len(lang) - 1]
  299. page_vpages[lang] = vp
  300. # Each virtual page has to know about its sister vpages
  301. for lang, vpage in page_vpages.iteritems():
  302. vpage["lang_links"] = dict([(l, v["url"]) for l, v in page_vpages.iteritems()])
  303. vpage["other_lang"] = langs # set other langs and link
  304. vpages += page_vpages.values()
  305. pages[:] = vpages
  306. # -----------------------------------------------------------------------------
  307. # compatibility redirect for old website URLs
  308. # -----------------------------------------------------------------------------
# PHP "case" branch of the redirect switch. Placeholders: the key that is
# compared against $_GET['p'], the site base URL, the URL of the page.
_COMPAT = """ case "%s":
$loc = "%s/%s";
break;
"""
# PHP "default" branch of the redirect switch. Placeholder: the redirect
# target used when no case matches.
_COMPAT_404 = """ default:
$loc = "%s";
break;
"""
  317. def hook_preconvert_compat():
  318. fp = open(os.path.join(options.project, "output", "index.php"), 'w')
  319. fp.write("<?\n")
  320. fp.write("// Auto generated xyCMS compatibility index.php\n")
  321. fp.write("$loc = 'https://www.xythobuz.de/index.de.html';\n")
  322. fp.write("if (isset($_GET['p'])) {\n")
  323. fp.write(" if (isset($_GET['lang'])) {\n")
  324. fp.write(" $_GET['p'] .= 'EN';\n")
  325. fp.write(" }\n")
  326. fp.write(" switch($_GET['p']) {\n")
  327. for p in pages:
  328. if p.get("compat", "") != "":
  329. tmp = p["compat"]
  330. if p.get("lang", DEFAULT_LANG) == DEFAULT_LANG:
  331. tmp = tmp + "EN"
  332. fp.write(_COMPAT % (tmp, "https://www.xythobuz.de", p.url))
  333. fp.write("\n")
  334. fp.write(_COMPAT_404 % "/404.html")
  335. fp.write(" }\n")
  336. fp.write("}\n")
  337. fp.write("if ($_SERVER['SERVER_PROTOCOL'] == 'HTTP/1.1') {\n")
  338. fp.write(" if (php_sapi_name() == 'cgi') {\n")
  339. fp.write(" header('Status: 301 Moved Permanently');\n")
  340. fp.write(" } else {\n")
  341. fp.write(" header('HTTP/1.1 301 Moved Permanently');\n")
  342. fp.write(" }\n")
  343. fp.write("}\n");
  344. fp.write("header('Location: '.$loc);\n")
  345. fp.write("?>")
  346. fp.close()
  347. # -----------------------------------------------------------------------------
  348. # sitemap generation
  349. # -----------------------------------------------------------------------------
# Skeleton of sitemap.xml. Placeholder: the concatenated <url> entries.
_SITEMAP = """<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
%s
</urlset>
"""
# One sitemap entry. Placeholders: site base URL, page URL, last
# modification date, change frequency, priority.
_SITEMAP_URL = """
<url>
<loc>%s/%s</loc>
<lastmod>%s</lastmod>
<changefreq>%s</changefreq>
<priority>%s</priority>
</url>
"""
  363. def hook_preconvert_sitemap():
  364. date = datetime.strftime(datetime.now(), "%Y-%m-%d")
  365. urls = []
  366. for p in pages:
  367. urls.append(_SITEMAP_URL % (BASE_URL, p.url, date, p.get("changefreq", "monthly"), p.get("priority", "0.5")))
  368. fname = os.path.join(options.project, "output", "sitemap.xml")
  369. fp = open(fname, 'w')
  370. fp.write(_SITEMAP % "".join(urls))
  371. fp.close()
  372. # -----------------------------------------------------------------------------
  373. # postconvert hooks
  374. # -----------------------------------------------------------------------------
  375. # -----------------------------------------------------------------------------
  376. # rss feed generation
  377. # -----------------------------------------------------------------------------
# Skeleton of rss.xml. Placeholders: channel title, site link, feed URL,
# channel description, publication date, last build date, concatenated items.
_RSS = """<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
<channel>
<title>%s</title>
<link>%s</link>
<atom:link href="%s" rel="self" type="application/rss+xml" />
<description>%s</description>
<language>en-us</language>
<pubDate>%s</pubDate>
<lastBuildDate>%s</lastBuildDate>
<docs>http://blogs.law.harvard.edu/tech/rss</docs>
<generator>Poole</generator>
<ttl>720</ttl>
%s
</channel>
</rss>
"""
# One feed item. Placeholders: title, link, escaped HTML description,
# publication date, update date, guid.
_RSS_ITEM = """
<item>
<title>%s</title>
<link>%s</link>
<description>%s</description>
<pubDate>%s</pubDate>
<atom:updated>%s</atom:updated>
<guid>%s</guid>
</item>
"""
  405. def hook_postconvert_rss():
  406. items = []
  407. # all pages with "date" get put into feed
  408. posts = [p for p in pages if "date" in p]
  409. # sort by update if available, date else
  410. posts.sort(key=lambda p: p.get("update", p.date), reverse=True)
  411. # only put 20 most recent items in feed
  412. posts = posts[:20]
  413. for p in posts:
  414. title = p.title
  415. if "post" in p:
  416. title = p.post
  417. link = "%s/%s" % (BASE_URL, p.url)
  418. desc = p.html.replace("href=\"img", "%s%s%s" % ("href=\"", BASE_URL, "/img"))
  419. desc = desc.replace("src=\"img", "%s%s%s" % ("src=\"", BASE_URL, "/img"))
  420. desc = desc.replace("href=\"/img", "%s%s%s" % ("href=\"", BASE_URL, "/img"))
  421. desc = desc.replace("src=\"/img", "%s%s%s" % ("src=\"", BASE_URL, "/img"))
  422. desc = htmlspecialchars(desc)
  423. date = time.mktime(time.strptime("%s 12" % p.date, "%Y-%m-%d %H"))
  424. date = email.utils.formatdate(date)
  425. update = time.mktime(time.strptime("%s 12" % p.get("update", p.date), "%Y-%m-%d %H"))
  426. update = email.utils.formatdate(update)
  427. items.append(_RSS_ITEM % (title, link, desc, date, update, link))
  428. items = "".join(items)
  429. title = "xythobuz.de Blog"
  430. link = "%s" % BASE_URL
  431. feed = "%s/rss.xml" % BASE_URL
  432. desc = htmlspecialchars("xythobuz Electronics & Software Projects")
  433. date = email.utils.formatdate()
  434. rss = _RSS % (title, link, feed, desc, date, date, items)
  435. fp = codecs.open(os.path.join(output, "rss.xml"), "w", "utf-8")
  436. fp.write(rss)
  437. fp.close()
  438. # -----------------------------------------------------------------------------
  439. # compatibility redirect for old mobile pages
  440. # -----------------------------------------------------------------------------
# PHP "case" branch of the mobile redirect switch. Placeholders: the key
# that is compared against $_GET['p'], the site base URL, the page URL.
_COMPAT_MOB = """ case "%s":
$loc = "%s/%s";
break;
"""
# PHP "default" branch of the mobile redirect switch. Placeholder: the
# redirect target used when no case matches.
_COMPAT_404_MOB = """ default:
$loc = "%s";
break;
"""
  449. def hook_postconvert_mobilecompat():
  450. directory = os.path.join(output, "mobile")
  451. if not os.path.exists(directory):
  452. os.makedirs(directory)
  453. fp = codecs.open(os.path.join(directory, "index.php"), "w", "utf-8")
  454. fp.write("<?\n")
  455. fp.write("// Auto generated xyCMS compatibility mobile/index.php\n")
  456. fp.write("$loc = 'https://www.xythobuz.de/index.de.html';\n")
  457. fp.write("if (isset($_GET['p'])) {\n")
  458. fp.write(" if (isset($_GET['lang'])) {\n")
  459. fp.write(" $_GET['p'] .= 'EN';\n")
  460. fp.write(" }\n")
  461. fp.write(" switch($_GET['p']) {\n")
  462. for p in pages:
  463. if p.get("compat", "") != "":
  464. tmp = p["compat"]
  465. if p.get("lang", DEFAULT_LANG) == DEFAULT_LANG:
  466. tmp = tmp + "EN"
  467. fp.write(_COMPAT_MOB % (tmp, "https://www.xythobuz.de", re.sub(".html", ".html", p.url)))
  468. fp.write("\n")
  469. fp.write(_COMPAT_404_MOB % "/404.mob.html")
  470. fp.write(" }\n")
  471. fp.write("}\n")
  472. fp.write("if ($_SERVER['SERVER_PROTOCOL'] == 'HTTP/1.1') {\n")
  473. fp.write(" if (php_sapi_name() == 'cgi') {\n")
  474. fp.write(" header('Status: 301 Moved Permanently');\n")
  475. fp.write(" } else {\n")
  476. fp.write(" header('HTTP/1.1 301 Moved Permanently');\n")
  477. fp.write(" }\n")
  478. fp.write("}\n");
  479. fp.write("header('Location: '.$loc);\n")
  480. fp.write("?>")
  481. fp.close()
  482. # -----------------------------------------------------------------------------
  483. # displaying filesize for download links
  484. # -----------------------------------------------------------------------------
  485. def hook_postconvert_size():
  486. file_ext = '|'.join(['pdf', 'zip', 'rar', 'ods', 'odt', 'odp', 'doc', 'xls', 'ppt', 'docx', 'xlsx', 'pptx', 'exe', 'brd', 'plist'])
  487. def matched_link(matchobj):
  488. try:
  489. path = matchobj.group(1)
  490. if path.startswith("http") or path.startswith("//") or path.startswith("ftp"):
  491. return '<a href=\"%s\">%s</a>' % (matchobj.group(1), matchobj.group(3))
  492. elif path.startswith("/"):
  493. path = path.strip("/")
  494. path = os.path.join("static/", path)
  495. size = os.path.getsize(path)
  496. if size >= (1024 * 1024):
  497. return "<a href=\"%s\">%s</a>&nbsp;(%.1f MiB)" % (matchobj.group(1), matchobj.group(3), size / (1024.0 * 1024.0))
  498. elif size >= 1024:
  499. return "<a href=\"%s\">%s</a>&nbsp;(%d KiB)" % (matchobj.group(1), matchobj.group(3), size // 1024)
  500. else:
  501. return "<a href=\"%s\">%s</a>&nbsp;(%d Byte)" % (matchobj.group(1), matchobj.group(3), size)
  502. except:
  503. print "Unable to estimate file size for %s" % matchobj.group(1)
  504. return '<a href=\"%s\">%s</a>' % (matchobj.group(1), matchobj.group(3))
  505. _re_url = '<a href=\"([^\"]*?\.(%s))\">(.*?)<\/a>' % file_ext
  506. for p in pages:
  507. p.html = re.sub(_re_url, matched_link, p.html)