namu.py 44 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030
  1. from . import tool
  2. import datetime
  3. import html
  4. import re
  5. def table_parser(data, cel_data, start_data, num = 0):
  6. table_class = 'class="'
  7. all_table = 'style="'
  8. cel_style = 'style="'
  9. row_style = 'style="'
  10. row = ''
  11. cel = ''
  12. table_width = re.search("<table ?width=((?:(?!>).)*)>", data)
  13. if table_width:
  14. if re.search('^[0-9]+$', table_width.groups()[0]):
  15. all_table += 'width: ' + table_width.groups()[0] + 'px;'
  16. else:
  17. all_table += 'width: ' + table_width.groups()[0] + ';'
  18. table_height = re.search("<table ?height=((?:(?!>).)*)>", data)
  19. if table_height:
  20. if re.search('^[0-9]+$', table_height.groups()[0]):
  21. all_table += 'height: ' + table_height.groups()[0] + 'px;'
  22. else:
  23. all_table += 'height: ' + table_height.groups()[0] + ';'
  24. table_align = re.search("<table ?align=((?:(?!>).)*)>", data)
  25. if table_align:
  26. if table_align.groups()[0] == 'right':
  27. all_table += 'float: right;'
  28. elif table_align.groups()[0] == 'center':
  29. all_table += 'margin: auto;'
  30. table_text_align = re.search("<table ?textalign=((?:(?!>).)*)>", data)
  31. if table_text_align:
  32. num = 1
  33. if table_text_align.groups()[0] == 'right':
  34. all_table += 'text-align: right;'
  35. elif table_text_align.groups()[0] == 'center':
  36. all_table += 'text-align: center;'
  37. row_table_align = re.search("<row ?textalign=((?:(?!>).)*)>", data)
  38. if row_table_align:
  39. if row_table_align.groups()[0] == 'right':
  40. row_style += 'text-align: right;'
  41. elif row_table_align.groups()[0] == 'center':
  42. row_style += 'text-align: center;'
  43. else:
  44. row_style += 'text-align: left;'
  45. table_cel = re.search("<-((?:(?!>).)*)>", data)
  46. if table_cel:
  47. cel = 'colspan="' + table_cel.groups()[0] + '"'
  48. else:
  49. cel = 'colspan="' + str(round(len(start_data) / 2)) + '"'
  50. table_row = re.search("<\|((?:(?!>).)*)>", data)
  51. if table_row:
  52. row = 'rowspan="' + table_row.groups()[0] + '"'
  53. row_bgcolor = re.search("<rowbgcolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  54. if row_bgcolor:
  55. row_style += 'background: ' + row_bgcolor.groups()[0] + ';'
  56. table_border = re.search("<table ?bordercolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  57. if table_border:
  58. all_table += 'border: ' + table_border.groups()[0] + ' 2px solid;'
  59. table_bgcolor = re.search("<table ?bgcolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  60. if table_bgcolor:
  61. all_table += 'background: ' + table_bgcolor.groups()[0] + ';'
  62. bgcolor = re.search("<bgcolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  63. if bgcolor:
  64. cel_style += 'background: ' + bgcolor.groups()[0] + ';'
  65. cel_width = re.search("<width=((?:(?!>).)*)>", data)
  66. if cel_width:
  67. cel_style += 'width: ' + cel_width.groups()[0] + 'px;'
  68. cel_height = re.search("<height=((?:(?!>).)*)>", data)
  69. if cel_height:
  70. cel_style += 'height: ' + cel_height.groups()[0] + 'px;'
  71. text_right = re.search("<\)>", data)
  72. text_center = re.search("<:>", data)
  73. text_left = re.search("<\(>", data)
  74. if text_right:
  75. cel_style += 'text-align: right;'
  76. elif text_center:
  77. cel_style += 'text-align: center;'
  78. elif text_left:
  79. cel_style += 'text-align: left;'
  80. elif num == 0:
  81. if re.search('^ ', cel_data) and re.search(' $', cel_data):
  82. cel_style += 'text-align: center;'
  83. elif re.search('^ ', cel_data):
  84. cel_style += 'text-align: right;'
  85. elif re.search(' $', cel_data):
  86. cel_style += 'text-align: left;'
  87. text_class = re.search("<table ?class=((?:(?!>).)+)>", data)
  88. if text_class:
  89. table_class += text_class.groups()[0]
  90. all_table += '"'
  91. cel_style += '"'
  92. row_style += '"'
  93. table_class += '"'
  94. return [all_table, row_style, cel_style, row, cel, table_class, num]
  95. def table_start(data):
  96. while 1:
  97. table = re.search('\n((?:(?:(?:(?:\|\|)+(?:(?:(?!\|\|).(?:\n)*)*))+)\|\|(?:\n)?)+)', data)
  98. if table:
  99. table = table.groups()[0]
  100. while 1:
  101. all_table = re.search('^((?:\|\|)+)((?:<(?:(?:(?!>).)+)>)*)\n*((?:(?!\|\|).\n*)*)', table)
  102. if all_table:
  103. all_table = all_table.groups()
  104. return_table = table_parser(all_table[1], all_table[2], all_table[0])
  105. number = return_table[6]
  106. table = re.sub('^((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*', '\n<table ' + return_table[5] + ' ' + return_table[0] + '><tbody><tr ' + return_table[1] + '><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  107. else:
  108. break
  109. table = re.sub('\|\|\n?$', '</td></tr></tbody></table>', table)
  110. while 1:
  111. row_table = re.search('\|\|\n((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*((?:(?!\|\||<\/td>).\n*)*)', table)
  112. if row_table:
  113. row_table = row_table.groups()
  114. return_table = table_parser(row_table[1], row_table[2], row_table[0], number)
  115. table = re.sub('\|\|\n((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*', '</td></tr><tr ' + return_table[1] + '><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  116. else:
  117. break
  118. while 1:
  119. cel_table = re.search('((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*((?:(?:(?!\|\||<\/td>).)|\n)*\n*)', table)
  120. if cel_table:
  121. cel_table = cel_table.groups()
  122. return_table = table_parser(cel_table[1], re.sub('\n', ' ', cel_table[2]), cel_table[0], number)
  123. table = re.sub('((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*', '</td><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  124. else:
  125. break
  126. data = re.sub('\n((?:(?:(?:(?:\|\|)+(?:(?:(?!\|\|).(?:\n)*)*))+)\|\|(?:\n)?)+)', table, data, 1)
  127. else:
  128. break
  129. return data
  130. def middle_parser(data, fol_num, syntax_num, folding_num):
  131. global end_data
  132. global plus_data
  133. middle_stack = 0
  134. middle_list = []
  135. middle_number = 0
  136. middle_re = re.compile('(?:{{{((?:(?! |{{{|}}}|&lt;).)*) ?|(}}}))')
  137. while 1:
  138. middle_data = middle_re.search(data)
  139. if middle_data:
  140. middle_data = middle_data.groups()
  141. if not middle_data[1]:
  142. if middle_stack > 0:
  143. middle_stack += 1
  144. data = re.sub('(?:{{{((?:(?! |{{{|}}}|&lt;).)*)(?P<in> ?)|(}}}))', '&#123;&#123;&#123;' + middle_data[0] + '\g<in>', data, 1)
  145. else:
  146. if re.search('^(#|@|\+|\-)', middle_data[0]) and not re.search('^(#|@|\+|\-){2}', middle_data[0]):
  147. middle_search = re.search('^(#(?:[0-9a-f-A-F]{3}){1,2})', middle_data[0])
  148. if middle_search:
  149. middle_list += ['span']
  150. data = middle_re.sub('<span style="color: ' + middle_search.groups()[0] + ';">', data, 1)
  151. else:
  152. middle_search = re.search('^(?:#(\w+))', middle_data[0])
  153. if middle_search:
  154. middle_list += ['span']
  155. data = middle_re.sub('<span style="color: ' + middle_search.groups()[0] + ';">', data, 1)
  156. else:
  157. middle_search = re.search('^(?:@((?:[0-9a-f-A-F]{3}){1,2}))', middle_data[0])
  158. if middle_search:
  159. middle_list += ['span']
  160. data = middle_re.sub('<span style="background: #' + middle_search.groups()[0] + ';">', data, 1)
  161. else:
  162. middle_search = re.search('^(?:@(\w+))', middle_data[0])
  163. if middle_search:
  164. middle_list += ['span']
  165. data = middle_re.sub('<span style="background: ' + middle_search.groups()[0] + ';">', data, 1)
  166. else:
  167. middle_search = re.search('^(\+|-)([1-5])', middle_data[0])
  168. if middle_search:
  169. middle_search = middle_search.groups()
  170. if middle_search[0] == '+':
  171. font_size = str(int(middle_search[1]) * 20 + 100)
  172. else:
  173. font_size = str(100 - int(middle_search[1]) * 10)
  174. middle_list += ['span']
  175. data = middle_re.sub('<span style="font-size: ' + font_size + '%;">', data, 1)
  176. else:
  177. middle_search = re.search('^#!wiki', middle_data[0])
  178. if middle_search:
  179. middle_data_2 = re.search('{{{#!wiki(?: style=(?:&quot;|&#x27;)((?:(?!&quot;|&#x27;).)*)(?:&quot;|&#x27;))?\n?', data)
  180. if middle_data_2:
  181. middle_data_2 = middle_data_2.groups()
  182. else:
  183. middle_data_2 = ['']
  184. middle_list += ['div_end']
  185. data = re.sub('{{{#!wiki(?: style=(?:&quot;|&#x27;)((?:(?!&quot;|&#x27;).)*)(?:&quot;|&#x27;))?\n?', '<div id="wiki_div" style="' + str(middle_data_2[0]) + '">', data, 1)
  186. else:
  187. middle_search = re.search('^#!syntax', middle_data[0])
  188. if middle_search:
  189. middle_data_2 = re.search('{{{#!syntax ((?:(?!\n).)+)\n?', data)
  190. if middle_data_2:
  191. middle_data_2 = middle_data_2.groups()
  192. else:
  193. middle_data_2 = ['python']
  194. if syntax_num == 0:
  195. plus_data += '''
  196. <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/9.12.0/styles/default.min.css">
  197. <script src="//cdnjs.cloudflare.com/ajax/libs/highlight.js/9.12.0/highlight.min.js"></script>
  198. '''
  199. syntax_num = 1
  200. middle_list += ['pre']
  201. data = re.sub('{{{#!syntax ?((?:(?!\n).)*)\n?', '<pre id="syntax"><code class="' + middle_data_2[0] + '">', data, 1)
  202. else:
  203. middle_search = re.search('^#!folding', middle_data[0])
  204. if middle_search:
  205. middle_list += ['2div']
  206. folding_data = re.search('{{{#!folding ?((?:(?!\n).)*)\n?', data)
  207. if folding_data:
  208. folding_data = folding_data.groups()
  209. else:
  210. folding_data = ['Test']
  211. if folding_num == 0:
  212. plus_data += '<script src="/views/main_css/parser.js"></script>'
  213. folding_num = 1
  214. data = re.sub('{{{#!folding ?((?:(?!\n).)*)\n?', '<div>' + str(folding_data[0]) + ' <div style="display: inline-block;"><a href="javascript:void(0);" onclick="folding(' + str(fol_num) + ');">[do]</a></div_end><div id="folding_' + str(fol_num) + '" style="display: none;"><div id="wiki_div" style="">', data, 1)
  215. fol_num += 1
  216. else:
  217. middle_list += ['span']
  218. data = middle_re.sub('<span>', data, 1)
  219. else:
  220. middle_list += ['code']
  221. middle_stack += 1
  222. data = middle_re.sub('<code>' + middle_data[0].replace('\\', '\\\\'), data, 1)
  223. middle_number += 1
  224. else:
  225. if middle_list == []:
  226. data = middle_re.sub('&#125;&#125;&#125;', data, 1)
  227. else:
  228. if middle_stack > 0:
  229. middle_stack -= 1
  230. if middle_stack > 0:
  231. data = middle_re.sub('&#125;&#125;&#125;', data, 1)
  232. else:
  233. if middle_number > 0:
  234. middle_number -= 1
  235. if middle_list[middle_number] == '2div':
  236. data = middle_re.sub('</div_end></div_end></div_end>', data, 1)
  237. elif middle_list[middle_number] == 'pre':
  238. data = middle_re.sub('</code></pre>', data, 1)
  239. else:
  240. data = middle_re.sub('</' + middle_list[middle_number] + '>', data, 1)
  241. del(middle_list[middle_number])
  242. else:
  243. break
  244. num = 0
  245. while 1:
  246. nowiki_data = re.search('<code>((?:(?:(?!<\/code>).)*\n*)*)<\/code>', data)
  247. if nowiki_data:
  248. nowiki_data = nowiki_data.groups()
  249. num += 1
  250. end_data += [['nowiki_' + str(num), nowiki_data[0], 'code']]
  251. data = re.sub('<code>((?:(?:(?!<\/code>).)*\n*)*)<\/code>', '<span id="nowiki_' + str(num) + '"></span>', data, 1)
  252. else:
  253. break
  254. num = 0
  255. while 1:
  256. syntax_data = re.search('<code class="((?:(?!").)+)">((?:(?:(?:(?!<\/code>|<span id="syntax_)).)+\n*)+)<\/code>', data)
  257. if syntax_data:
  258. syntax_data = syntax_data.groups()
  259. num += 1
  260. end_data += [['syntax_' + str(num), syntax_data[1], 'normal']]
  261. data = re.sub('<code class="((?:(?!").)+)">((?:(?:(?:(?!<\/code>|<span id="syntax_)).)+\n*)+)<\/code>', '<code class="' + syntax_data[0] + '"><span id="syntax_' + str(num) + '"></span></code>', data, 1)
  262. else:
  263. break
  264. return [data, [fol_num, syntax_num, folding_num]]
  265. def link_fix(main_link):
  266. if re.search('^:', main_link):
  267. main_link = re.sub('^:', '', main_link)
  268. main_link = re.sub('^사용자:', 'user:', main_link)
  269. main_link = re.sub('^파일:', 'file:', main_link)
  270. main_link = re.sub('^분류:', 'category:', main_link)
  271. other_link = re.search('(#.+)$', main_link)
  272. if other_link:
  273. other_link = other_link.groups()[0]
  274. main_link = re.sub('(#.+)$', '', main_link)
  275. else:
  276. other_link = ''
  277. return [main_link, other_link]
  278. def namu(conn, data, title, main_num):
  279. curs = conn.cursor()
  280. global plus_data
  281. global end_data
  282. data = '\n' + data + '\n'
  283. plus_data = ''
  284. backlink = []
  285. end_data = []
  286. data = html.escape(data)
  287. data = re.sub('\r\n', '\n', data)
  288. t_data = middle_parser(data, 0, 0, 0)
  289. data = t_data[0]
  290. include_re = re.compile('\[include\(((?:(?!\)\]).)+)\)\]', re.I)
  291. while 1:
  292. include = include_re.search(data)
  293. if include:
  294. include = include.groups()[0]
  295. include_data = re.search('^((?:(?!,).)+)', include)
  296. if include_data:
  297. include_data = include_data.groups()[0]
  298. else:
  299. include_data = 'Test'
  300. include_link = include_data
  301. backlink += [[title, include_link, 'include']]
  302. include = re.sub('^((?:(?!,).)+)', '', include)
  303. num = 0
  304. while 1:
  305. include_one_nowiki = re.search('(?:\\\\){2}(.)', include)
  306. if include_one_nowiki:
  307. include_one_nowiki = include_one_nowiki.groups()
  308. num += 1
  309. end_data += [['include_one_nowiki_' + str(num), include_one_nowiki[0], 'normal']]
  310. include = re.sub('(?:\\\\){2}(.)', '<span id="include_one_nowiki_' + str(num) + '"></span>', include, 1)
  311. else:
  312. break
  313. curs.execute("select data from data where title = ?", [include_data])
  314. include_data = curs.fetchall()
  315. if include_data:
  316. include_parser = include_re.sub('', include_data[0][0])
  317. include_parser = html.escape(include_parser)
  318. while 1:
  319. include_plus = re.search(', ?((?:(?!=).)+)=((?:(?!,).)+)', include)
  320. if include_plus:
  321. include_plus = include_plus.groups()
  322. include_parser = include_parser.replace('@' + include_plus[0] + '@', include_plus[1])
  323. include = re.sub(', ?((?:(?!=).)+)=((?:(?!,).)+)', '', include, 1)
  324. else:
  325. break
  326. include_parser = re.sub('\[\[(?:category|분류):(((?!\]\]|#include).)+)\]\]', '', include_parser)
  327. data = include_re.sub('<include>\n<a id="include_link" href="/w/' + tool.url_pas(include_link) + '">[' + include_link + ']</a>\n' + include_parser + '\n</include>', data, 1)
  328. else:
  329. data = include_re.sub('<a id="not_thing" href="/w/' + tool.url_pas(include_link) + '">' + include_link + '</a>', data, 1)
  330. else:
  331. break
  332. data = re.sub('\r\n', '\n', data)
  333. t_data = middle_parser(data, t_data[1][0], t_data[1][1], t_data[1][2])
  334. data = t_data[0]
  335. data = re.sub('&amp;', '&', data)
  336. data = re.sub('\n( +)\|\|', '\n||', data)
  337. data = re.sub('\|\|( +)\n', '||\n', data)
  338. data = re.sub('\n##(((?!\n).)+)', '', data)
  339. while 1:
  340. wiki_table_data = re.search('<div id="wiki_div" ((?:(?!>).)+)>((?:(?!<div id="wiki_div"|<\/div_end>).\n*)+)<\/div_end>', data)
  341. if wiki_table_data:
  342. wiki_table_data = wiki_table_data.groups()
  343. if re.search('\|\|', wiki_table_data[1]):
  344. end_parser = re.sub('\n$', '', re.sub('^\n', '', table_start('\n' + wiki_table_data[1] + '\n')))
  345. else:
  346. end_parser = wiki_table_data[1]
  347. data = re.sub('<div id="wiki_div" ((?:(?!>).)+)>((?:(?!<div id="wiki_div"|<\/div_end>).\n*)+)<\/div_end>', '<div ' + wiki_table_data[0] + '>' + end_parser + '</div>', data, 1)
  348. else:
  349. break
  350. data = re.sub('<\/div_end>', '</div>', data)
  351. data = re.sub('<\/td>', '</td_end>', data)
  352. first = 0
  353. math_re = re.compile('\[math\(((?:(?!\)\]).)+)\)\]', re.I)
  354. while 1:
  355. math = math_re.search(data)
  356. if math:
  357. if first == 0:
  358. plus_data += '''
  359. <link rel="stylesheet" href="/views/main_css/katex/katex.min.css">
  360. <script src="/views/main_css/katex/katex.min.js"></script>
  361. '''
  362. math = math.groups()[0]
  363. first += 1
  364. data = math_re.sub('<span id="math_' + str(first) + '"></span>', data, 1)
  365. plus_data += '<script>katex.render("' + math.replace('\\', '\\\\').replace('&lt;', '<').replace('&gt;', '>') +'", document.getElementById("math_' + str(first) + '"));</script>'
  366. else:
  367. break
  368. num = 0
  369. while 1:
  370. one_nowiki = re.search('(?:\\\\)(.)', data)
  371. if one_nowiki:
  372. one_nowiki = one_nowiki.groups()
  373. num += 1
  374. end_data += [['one_nowiki_' + str(num), one_nowiki[0], 'normal']]
  375. data = re.sub('(?:\\\\)(.)', '<span id="one_nowiki_' + str(num) + '"></span>', data, 1)
  376. else:
  377. break
  378. while 1:
  379. hr = re.search('\n-{4,9}\n', data)
  380. if hr:
  381. data = re.sub('\n-{4,9}\n', '\n<hr>\n', data, 1)
  382. else:
  383. break
  384. data += '\n'
  385. data = data.replace('\\', '&#92;')
  386. data = re.sub('&#x27;&#x27;&#x27;(?P<in>((?!&#x27;&#x27;&#x27;).)+)&#x27;&#x27;&#x27;', '<b>\g<in></b>', data)
  387. data = re.sub('&#x27;&#x27;(?P<in>((?!&#x27;&#x27;).)+)&#x27;&#x27;', '<i>\g<in></i>', data)
  388. data = re.sub('~~(?P<in>(?:(?!~~).)+)~~', '<s>\g<in></s>', data)
  389. data = re.sub('--(?P<in>(?:(?!--).)+)--', '<s>\g<in></s>', data)
  390. data = re.sub('__(?P<in>(?:(?!__).)+)__', '<u>\g<in></u>', data)
  391. data = re.sub('\^\^(?P<in>(?:(?!\^\^).)+)\^\^', '<sup>\g<in></sup>', data)
  392. data = re.sub(',,(?P<in>(?:(?!,,).)+),,', '<sub>\g<in></sub>', data)
  393. redirect_re = re.compile('\n#(?:redirect|넘겨주기) ((?:(?!\n).)+)\n', re.I)
  394. redirect = redirect_re.search(data)
  395. if redirect:
  396. redirect = redirect.groups()[0]
  397. return_link = link_fix(redirect)
  398. main_link = return_link[0]
  399. other_link = return_link[1]
  400. backlink += [[title, main_link, 'redirect']]
  401. data = redirect_re.sub('\n * ' + title + ' - [[' + main_link + ']]\n', data, 1)
  402. no_toc_re = re.compile('\[(?:목차|toc)\((?:no)\)\]\n', re.I)
  403. toc_re = re.compile('\[(?:목차|toc)\]', re.I)
  404. if not no_toc_re.search(data):
  405. if not toc_re.search(data):
  406. data = re.sub('\n(?P<in>={1,6}) ?(?P<out>(?:(?!=).)+) ?={1,6}\n', '\n[toc]\n\g<in> \g<out> \g<in>\n', data, 1)
  407. else:
  408. data = no_toc_re.sub('', data)
  409. toc_full = 0
  410. toc_top_stack = 6
  411. toc_stack = [0, 0, 0, 0, 0, 0]
  412. edit_number = 0
  413. toc_data = '<div id="toc"><span style="font-size: 18px;">toc</span>\n\n'
  414. while 1:
  415. toc = re.search('\n(={1,6}) ?((?:(?!\n).)+) ?\n', data)
  416. if toc:
  417. toc = toc.groups()
  418. toc_number = len(toc[0])
  419. edit_number += 1
  420. if toc_full > toc_number:
  421. for i in range(toc_number, 6):
  422. toc_stack[i] = 0
  423. if toc_top_stack > toc_number:
  424. toc_top_stack = toc_number
  425. toc_full = toc_number
  426. toc_stack[toc_number - 1] += 1
  427. toc_number = str(toc_number)
  428. all_stack = ''
  429. for i in range(0, 6):
  430. all_stack += str(toc_stack[i]) + '.'
  431. while 1:
  432. if re.search('[^0-9]0\.', all_stack):
  433. all_stack = re.sub('[^0-9]0\.', '.', all_stack)
  434. else:
  435. break
  436. all_stack = re.sub('^0\.', '', all_stack)
  437. data = re.sub('\n(={1,6}) ?((?:(?!\n).)+) ?\n', '\n<h' + toc_number + ' id="s-' + re.sub('\.$', '', all_stack) + '"><a href="#toc">' + all_stack + '</a> ' + re.sub('=*$', '', toc[1]) + ' <span style="font-size: 12px"><a href="/edit/' + tool.url_pas(title) + '?section=' + str(edit_number) + '">(Edit)</a></span></h' + toc_number + '>\n', data, 1)
  438. toc_main_data = toc[1]
  439. toc_main_data = re.sub('=*$', '', toc_main_data)
  440. toc_main_data = re.sub('\[\*((?:(?! |\]).)*)(?: ((?:(?!(\[\*(?:(?:(?!\]).)+)\]|\])).)+))?\]', '', toc_main_data)
  441. toc_main_data = re.sub('<span id="math_[0-9]"><\/span>', '(수식)', toc_main_data)
  442. toc_data += '<span style="margin-left: ' + str((toc_full - toc_top_stack) * 10) + 'px;"><a href="#s-' + re.sub('\.$', '', all_stack) + '">' + all_stack + '</a> ' + toc_main_data + '</span>\n'
  443. else:
  444. break
  445. toc_data += '</div>'
  446. data = toc_re.sub(toc_data, data)
  447. data = tool.savemark(data)
  448. anchor_re = re.compile("\[anchor\((?P<in>(?:(?!\)\]).)+)\)\]", re.I)
  449. data = anchor_re.sub('<span id="\g<in>"></span>', data)
  450. ruby_re = re.compile("\[ruby\((?P<in>(?:(?!,).)+)\, ?(?P<out>(?:(?!\)\]).)+)\)\]", re.I)
  451. data = ruby_re.sub('<ruby>\g<in><rp>(</rp><rt>\g<out></rt><rp>)</rp></ruby>', data)
  452. now_time = tool.get_time()
  453. date_re = re.compile('\[date\]', re.I)
  454. data = date_re.sub(now_time, data)
  455. time_data = re.search('^([0-9]{4}-[0-9]{2}-[0-9]{2})', now_time)
  456. time = time_data.groups()
  457. age_re = re.compile('\[age\(([0-9]{4}-[0-9]{2}-[0-9]{2})\)\]', re.I)
  458. while 1:
  459. age_data = age_re.search(data)
  460. if age_data:
  461. age = age_data.groups()[0]
  462. old = datetime.datetime.strptime(time[0], '%Y-%m-%d')
  463. will = datetime.datetime.strptime(age, '%Y-%m-%d')
  464. e_data = old - will
  465. data = age_re.sub(str(int(e_data.days / 365)), data, 1)
  466. else:
  467. break
  468. dday_re = re.compile('\[dday\(([0-9]{4}-[0-9]{2}-[0-9]{2})\)\]', re.I)
  469. while 1:
  470. dday_data = dday_re.search(data)
  471. if dday_data:
  472. dday = dday_data.groups()[0]
  473. old = datetime.datetime.strptime(time[0], '%Y-%m-%d')
  474. will = datetime.datetime.strptime(dday, '%Y-%m-%d')
  475. e_data = old - will
  476. if re.search('^-', str(e_data.days)):
  477. e_day = str(e_data.days)
  478. else:
  479. e_day = '+' + str(e_data.days)
  480. data = dday_re.sub(e_day, data, 1)
  481. else:
  482. break
  483. video_re = re.compile('\[(youtube|kakaotv|nicovideo)\(((?:(?!\)\]).)+)\)\]', re.I)
  484. youtube_re = re.compile('youtube', re.I)
  485. kakaotv_re = re.compile('kakaotv', re.I)
  486. while 1:
  487. video = video_re.search(data)
  488. if video:
  489. video = video.groups()
  490. width = re.search(', ?width=((?:(?!,).)+)', video[1])
  491. if width:
  492. video_width = width.groups()[0]
  493. else:
  494. video_width = '560'
  495. height = re.search(', ?height=((?:(?!,).)+)', video[1])
  496. if height:
  497. video_height = height.groups()[0]
  498. else:
  499. video_height = '315'
  500. code = re.search('^((?:(?!,).)+)', video[1])
  501. if code:
  502. video_code = code.groups()[0]
  503. else:
  504. video_code = ''
  505. if youtube_re.search(video[0]):
  506. video_code = re.sub('^https:\/\/www\.youtube\.com\/watch\?v=', '', video_code)
  507. video_code = re.sub('^https:\/\/youtu\.be\/', '', video_code)
  508. video_src = 'https://www.youtube.com/embed/' + video_code
  509. elif kakaotv_re.search(video[0]):
  510. video_code = re.sub('^https:\/\/tv\.kakao\.com\/channel\/9262\/cliplink\/', '', video_code)
  511. video_code = re.sub('^http:\/\/tv\.kakao\.com\/v\/', '', video_code)
  512. video_src = 'https://tv.kakao.com/embed/player/cliplink/' + video_code +'?service=kakao_tv'
  513. else:
  514. video_src = 'https://embed.nicovideo.jp/watch/' + video_code
  515. data = video_re.sub('<iframe width="' + video_width + '" height="' + video_height + '" src="' + video_src + '" allowfullscreen frameborder="0"></iframe>', data, 1)
  516. else:
  517. break
  518. while 1:
  519. block = re.search('(\n(?:&gt; ?(?:(?:(?!\n).)+)?\n)+)', data)
  520. if block:
  521. block = block.groups()[0]
  522. block = re.sub('^\n&gt; ?', '', block)
  523. block = re.sub('\n&gt; ?', '\n', block)
  524. block = re.sub('\n$', '', block)
  525. data = re.sub('(\n(?:&gt; ?(?:(?:(?!\n).)+)?\n)+)', '\n<blockquote>' + block + '</blockquote>\n', data, 1)
  526. else:
  527. break
  528. data = re.sub('(?P<in>\n +\* ?(?:(?:(?!\|\|).)+))\|\|', '\g<in>\n ||', data)
  529. while 1:
  530. li = re.search('(\n(?:(?: *)\* ?(?:(?:(?!\n).)+)\n)+)', data)
  531. if li:
  532. li = li.groups()[0]
  533. while 1:
  534. sub_li = re.search('\n(?:( *)\* ?((?:(?!\n).)+))', li)
  535. if sub_li:
  536. sub_li = sub_li.groups()
  537. if len(sub_li[0]) == 0:
  538. margin = 20
  539. else:
  540. margin = len(sub_li[0]) * 20
  541. li = re.sub('\n(?:( *)\* ?((?:(?!\n).)+))', '<li style="margin-left: ' + str(margin) + 'px;">' + sub_li[1] + '</li>', li, 1)
  542. else:
  543. break
  544. data = re.sub('(\n(?:(?: *)\* ?(?:(?:(?!\n).)+)\n)+)', '\n\n<ul>' + li + '</ul>\n', data, 1)
  545. else:
  546. break
  547. data = re.sub('<\/ul>\n \|\|', '</ul>||', data)
  548. while 1:
  549. indent = re.search('\n( +)', data)
  550. if indent:
  551. indent = len(indent.groups()[0])
  552. margin = '<span style="margin-left: 20px;"></span>' * indent
  553. data = re.sub('\n( +)', '\n' + margin, data, 1)
  554. else:
  555. break
  556. data = table_start(data)
  557. category = '\n<hr><div id="cate">category : '
  558. category_re = re.compile('^(?:category|분류):', re.I)
  559. while 1:
  560. link = re.search('\[\[((?:(?!\[\[|\]\]).)+)\]\]', data)
  561. if link:
  562. link = link.groups()[0]
  563. link_split = re.search('((?:(?!\|).)+)(?:\|((?:(?!\|).)+))', link)
  564. if link_split:
  565. link_split = link_split.groups()
  566. main_link = link_split[0]
  567. see_link = link_split[1]
  568. else:
  569. main_link = link
  570. see_link = link
  571. if re.search('^((?:file|파일)|(?:out|외부)):', main_link):
  572. file_style = ''
  573. width = re.search('width=((?:(?!&).)+)', see_link)
  574. if width:
  575. file_width = width.groups()[0]
  576. if re.search('px$', file_width):
  577. file_style += 'width: ' + file_width + ';'
  578. else:
  579. file_style += 'width: ' + file_width + 'px;'
  580. height = re.search('height=((?:(?!&).)+)', see_link)
  581. if height:
  582. file_height = height.groups()[0]
  583. if re.search('px$', file_height):
  584. file_style += 'height: ' + file_height + ';'
  585. else:
  586. file_style += 'height: ' + file_height + 'px;'
  587. align = re.search('align=((?:(?!&).)+)', see_link)
  588. if align:
  589. file_align = align.groups()[0]
  590. if file_align == 'center':
  591. file_align = 'display: block; text-align: center;'
  592. else:
  593. file_align = 'float: ' + file_align + ';'
  594. else:
  595. file_align = ''
  596. if re.search('^(?:out|외부):', main_link):
  597. file_src = re.sub('^(?:out|외부):', '', main_link)
  598. file_alt = main_link
  599. exist = 'Yes'
  600. else:
  601. file_data = re.search('^(?:file|파일):((?:(?!\.).)+)\.(.+)$', main_link)
  602. if file_data:
  603. file_data = file_data.groups()
  604. file_name = file_data[0]
  605. file_end = file_data[1]
  606. backlink += [[title, main_link, 'file']]
  607. else:
  608. file_name = 'TEST'
  609. file_end = 'jpg'
  610. file_src = '/image/' + tool.sha224(file_name) + '.' + file_end
  611. file_alt = 'file:' + file_name + '.' + file_end
  612. curs.execute("select title from data where title = ?", [file_alt])
  613. exist = curs.fetchall()
  614. if exist:
  615. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<span style="' + file_align + '"><img style="' + file_style + '" alt="' + file_alt + '" src="' + file_src + '"></span>', data, 1)
  616. else:
  617. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="not_thing" href="/w/' + tool.url_pas(file_alt) + '">' + file_alt + '</a>', data, 1)
  618. elif category_re.search(main_link):
  619. see_link = re.sub('#include', '', see_link)
  620. main_link = re.sub('#include', '', category_re.sub('category:', main_link))
  621. if re.search('#blur', main_link):
  622. see_link = 'Hidden'
  623. link_id = 'id="inside"'
  624. main_link = re.sub('#blur', '', main_link)
  625. else:
  626. link_id = ''
  627. backlink += [[title, main_link, 'cat']]
  628. category += '<a ' + link_id + ' href="' + tool.url_pas(main_link) + '">' + category_re.sub('', see_link) + '</a> / '
  629. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '', data, 1)
  630. elif re.search('^wiki:', main_link):
  631. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="inside" href="/' + tool.url_pas(re.sub('^wiki:', '', main_link)) + '">' + see_link + '</a>', data, 1)
  632. elif re.search('^inter:((?:(?!:).)+):', main_link):
  633. inter_data = re.search('^inter:((?:(?!:).)+):((?:(?!\]\]|\|).)+)', main_link)
  634. inter_data = inter_data.groups()
  635. curs.execute('select link from inter where title = ?', [inter_data[0]])
  636. inter = curs.fetchall()
  637. if inter:
  638. if see_link != main_link:
  639. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="inside" href="' + inter[0][0] + inter_data[1] + '">' + inter_data[0] + ':' + see_link + '</a>', data, 1)
  640. else:
  641. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="inside" href="' + inter[0][0] + inter_data[1] + '">' + inter_data[0] + ':' + inter_data[1] + '</a>', data, 1)
  642. else:
  643. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', 'Not exist', data, 1)
  644. elif re.search('^\/', main_link):
  645. under_title = re.search('^(\/(?:.+))$', main_link)
  646. under_title = under_title.groups()[0]
  647. if see_link != main_link:
  648. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '[[' + title + under_title + '|' + see_link + ']]', data, 1)
  649. else:
  650. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '[[' + title + under_title + ']]', data, 1)
  651. elif re.search('^http(s)?:\/\/', main_link):
  652. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="out_link" rel="nofollow" href="' + main_link + '">' + see_link + '</a>', data, 1)
  653. else:
  654. return_link = link_fix(main_link)
  655. main_link = return_link[0]
  656. other_link = return_link[1]
  657. if re.search('^\/', main_link):
  658. main_link = re.sub('^\/', title + '/', main_link)
  659. elif re.search('\.\.\/\/', main_link):
  660. main_link = re.sub('\.\.\/\/', '/', main_link)
  661. elif re.search('^\.\.\/', main_link):
  662. main_link = re.sub('^\.\.\/', re.sub('(?P<in>.+)\/.*$', '\g<in>', title), main_link)
  663. if not re.search('^\|', main_link):
  664. if main_link != title:
  665. if main_link != '':
  666. curs.execute("select title from data where title = ?", [main_link])
  667. if not curs.fetchall():
  668. link_id = 'id="not_thing"'
  669. backlink += [[title, main_link, 'no']]
  670. else:
  671. link_id = ''
  672. backlink += [[title, main_link, '']]
  673. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a ' + link_id + ' href="/w/' + tool.url_pas(main_link) + other_link + '">' + see_link + '</a>', data, 1)
  674. else:
  675. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a href="' + other_link + '">' + see_link + '</a>', data, 1)
  676. else:
  677. if re.search('^#', other_link):
  678. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a href="' + other_link + '">' + other_link + '</a>', data, 1)
  679. else:
  680. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<b>' + see_link + '</b>', data, 1)
  681. else:
  682. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '&#91;&#91;' + link + '&#93;&#93;', data, 1)
  683. else:
  684. break
  685. br_re = re.compile('\[br\]', re.I)
  686. data = br_re.sub('<br>', data)
  687. footnote_number = 0
  688. footnote_all = []
  689. footnote_dict = {}
  690. footnote_re = {}
  691. footdata_all = '\n<hr><ul id="footnote_data">'
  692. re_footnote = re.compile('(?:\[\*((?:(?! |\]).)*)(?: ((?:(?!(?:\[\*|\])).)+))?\]|(\[(?:각주|footnote)\]))')
  693. while 1:
  694. footnote = re_footnote.search(data)
  695. if footnote:
  696. footnote_data = footnote.groups()
  697. if footnote_data[2]:
  698. footnote_all.sort()
  699. for footdata in footnote_all:
  700. if footdata[2] == 0:
  701. footdata_in = ''
  702. else:
  703. footdata_in = footdata[2]
  704. footdata_all += '<li><a href="#rfn-' + str(footdata[0]) + '" id="fn-' + str(footdata[0]) + '">(' + footdata[1] + ')</a> ' + footdata_in + '</li>'
  705. data = re_footnote.sub(footdata_all + '</ul>', data, 1)
  706. footnote_all = []
  707. footdata_all = '\n<hr><ul id="footnote_data">'
  708. else:
  709. footnote = footnote_data[1]
  710. footnote_name = footnote_data[0]
  711. if footnote_name and not footnote:
  712. if footnote_name in footnote_dict:
  713. footnote_re[footnote_name] += 1
  714. foot_plus_num = str(footnote_re[footnote_name])
  715. footshort = footnote_dict[footnote_name] + '.' + foot_plus_num
  716. footnote_all += [[float(footshort), footshort, 0]]
  717. data = re_footnote.sub('<sup><a href="#fn-' + footshort + '" id="rfn-' + footshort + '">(' + footshort + ')</a></sup>', data, 1)
  718. else:
  719. data = re_footnote.sub('<sup><a href="#">(' + footnote_name + ')</a></sup>', data, 1)
  720. else:
  721. footnote_number += 1
  722. if not footnote_name:
  723. footnote_name = str(footnote_number)
  724. footnote_dict.update({ footnote_name : str(footnote_number) })
  725. if not footnote_name in footnote_re:
  726. footnote_re.update({ footnote_name : 0 })
  727. else:
  728. footnote_re[footnote_name] += 1
  729. footnote_all += [[footnote_number, footnote_name, footnote]]
  730. data = re_footnote.sub('<sup><a href="#fn-' + str(footnote_number) + '" id="rfn-' + str(footnote_number) + '">(' + footnote_name + ')</a></sup>', data, 1)
  731. else:
  732. break
  733. data = re.sub('\n+$', '', data)
  734. footnote_all.sort()
  735. for footdata in footnote_all:
  736. if footdata[2] == 0:
  737. footdata_in = ''
  738. else:
  739. footdata_in = footdata[2]
  740. footdata_all += '<li><a href="#rfn-' + str(footdata[0]) + '" id="fn-' + str(footdata[0]) + '">(' + footdata[1] + ')</a> ' + footdata_in + '</li>'
  741. footdata_all += '</ul>'
  742. if footdata_all == '\n<hr><ul id="footnote_data"></ul>':
  743. footdata_all = ''
  744. data = re.sub('\n$', footdata_all, data + '\n', 1)
  745. category += '</div>'
  746. category = re.sub(' / <\/div>$', '</div>', category)
  747. if category == '\n<hr><div id="cate">category : </div>':
  748. category = ''
  749. data += category
  750. i = 0
  751. while 1:
  752. try:
  753. _ = end_data[i][0]
  754. except:
  755. break
  756. if end_data[i][2] == 'normal':
  757. data = data.replace('<span id="' + end_data[i][0] + '"></span>', end_data[i][1])
  758. data = data.replace(tool.url_pas('<span id="' + end_data[i][0] + '"></span>'), tool.url_pas(end_data[i][1]))
  759. else:
  760. if re.search('\n', end_data[i][1]):
  761. data = data.replace('<span id="' + end_data[i][0] + '"></span>', '\n<pre>' + re.sub('^\n', '', end_data[i][1]) + '</pre>')
  762. else:
  763. data = data.replace('<span id="' + end_data[i][0] + '"></span>', '<code>' + end_data[i][1] + '</code>')
  764. i += 1
  765. if main_num == 1:
  766. i = 0
  767. while 1:
  768. try:
  769. _ = backlink[i][0]
  770. except:
  771. break
  772. find_data = re.search('<span id="(one_nowiki_[0-9]+)">', backlink[i][1])
  773. if find_data:
  774. j = 0
  775. find_data = find_data.groups()[0]
  776. while 1:
  777. try:
  778. _ = end_data[j][0]
  779. except:
  780. break
  781. if end_data[j][0] == find_data:
  782. backlink[i][1] = backlink[i][1].replace('<span id="' + end_data[j][0] + '"></span>', end_data[j][1])
  783. j += 1
  784. i += 1
  785. data = re.sub('<\/td_end>', '</td>', data)
  786. data = re.sub('<include>\n', '', data)
  787. data = re.sub('\n<\/include>', '', data)
  788. data = re.sub('(?P<in><\/h[0-9]>)(\n)+', '\g<in>', data)
  789. data = re.sub('\n\n<ul>', '\n<ul>', data)
  790. data = re.sub('<\/ul>\n\n', '</ul>', data)
  791. data = re.sub('^(\n)+', '', data)
  792. data = re.sub('(\n)+<hr><ul id="footnote_data">', '<hr><ul id="footnote_data">', data)
  793. data = re.sub('(?P<in><td(((?!>).)*)>)\n', '\g<in>', data)
  794. data = re.sub('(\n)?<hr>(\n)?', '<hr>', data)
  795. data = re.sub('<\/ul>\n\n<ul>', '</ul>\n<ul>', data)
  796. data = re.sub('\n', '<br>', data)
  797. return [data, plus_data, backlink]