namu.py 45 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063
  1. from . import tool
  2. import datetime
  3. import html
  4. import re
  5. def table_parser(data, cel_data, start_data, num = 0):
  6. table_class = 'class="'
  7. all_table = 'style="'
  8. cel_style = 'style="'
  9. row_style = 'style="'
  10. row = ''
  11. cel = ''
  12. table_width = re.search("<table ?width=((?:(?!>).)*)>", data)
  13. if table_width:
  14. if re.search('^[0-9]+$', table_width.groups()[0]):
  15. all_table += 'width: ' + table_width.groups()[0] + 'px;'
  16. else:
  17. all_table += 'width: ' + table_width.groups()[0] + ';'
  18. table_height = re.search("<table ?height=((?:(?!>).)*)>", data)
  19. if table_height:
  20. if re.search('^[0-9]+$', table_height.groups()[0]):
  21. all_table += 'height: ' + table_height.groups()[0] + 'px;'
  22. else:
  23. all_table += 'height: ' + table_height.groups()[0] + ';'
  24. table_align = re.search("<table ?align=((?:(?!>).)*)>", data)
  25. if table_align:
  26. if table_align.groups()[0] == 'right':
  27. all_table += 'float: right;'
  28. elif table_align.groups()[0] == 'center':
  29. all_table += 'margin: auto;'
  30. table_text_align = re.search("<table ?textalign=((?:(?!>).)*)>", data)
  31. if table_text_align:
  32. num = 1
  33. if table_text_align.groups()[0] == 'right':
  34. all_table += 'text-align: right;'
  35. elif table_text_align.groups()[0] == 'center':
  36. all_table += 'text-align: center;'
  37. row_table_align = re.search("<row ?textalign=((?:(?!>).)*)>", data)
  38. if row_table_align:
  39. if row_table_align.groups()[0] == 'right':
  40. row_style += 'text-align: right;'
  41. elif row_table_align.groups()[0] == 'center':
  42. row_style += 'text-align: center;'
  43. else:
  44. row_style += 'text-align: left;'
  45. table_cel = re.search("<-((?:(?!>).)*)>", data)
  46. if table_cel:
  47. cel = 'colspan="' + table_cel.groups()[0] + '"'
  48. else:
  49. cel = 'colspan="' + str(round(len(start_data) / 2)) + '"'
  50. table_row = re.search("<\|((?:(?!>).)*)>", data)
  51. if table_row:
  52. row = 'rowspan="' + table_row.groups()[0] + '"'
  53. row_bgcolor = re.search("<rowbgcolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  54. if row_bgcolor:
  55. row_style += 'background: ' + row_bgcolor.groups()[0] + ';'
  56. table_border = re.search("<table ?bordercolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  57. if table_border:
  58. all_table += 'border: ' + table_border.groups()[0] + ' 2px solid;'
  59. table_bgcolor = re.search("<table ?bgcolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  60. if table_bgcolor:
  61. all_table += 'background: ' + table_bgcolor.groups()[0] + ';'
  62. bgcolor = re.search("<(?:bgcolor=)?(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  63. if bgcolor:
  64. cel_style += 'background: ' + bgcolor.groups()[0] + ';'
  65. cel_width = re.search("<width=((?:(?!>).)*)>", data)
  66. if cel_width:
  67. cel_style += 'width: ' + cel_width.groups()[0] + 'px;'
  68. cel_height = re.search("<height=((?:(?!>).)*)>", data)
  69. if cel_height:
  70. cel_style += 'height: ' + cel_height.groups()[0] + 'px;'
  71. text_right = re.search("<\)>", data)
  72. text_center = re.search("<:>", data)
  73. text_left = re.search("<\(>", data)
  74. if text_right:
  75. cel_style += 'text-align: right;'
  76. elif text_center:
  77. cel_style += 'text-align: center;'
  78. elif text_left:
  79. cel_style += 'text-align: left;'
  80. elif num == 0:
  81. if re.search('^ ', cel_data) and re.search(' $', cel_data):
  82. cel_style += 'text-align: center;'
  83. elif re.search('^ ', cel_data):
  84. cel_style += 'text-align: right;'
  85. elif re.search(' $', cel_data):
  86. cel_style += 'text-align: left;'
  87. text_class = re.search("<table ?class=((?:(?!>).)+)>", data)
  88. if text_class:
  89. table_class += text_class.groups()[0]
  90. all_table += '"'
  91. cel_style += '"'
  92. row_style += '"'
  93. table_class += '"'
  94. return [all_table, row_style, cel_style, row, cel, table_class, num]
  95. def table_start(data):
  96. while 1:
  97. table = re.search('\n((?:(?:(?:(?:\|\|)+(?:(?:(?!\|\|).(?:\n)*)*))+)\|\|(?:\n)?)+)', data)
  98. if table:
  99. table = table.groups()[0]
  100. while 1:
  101. all_table = re.search('^((?:\|\|)+)((?:<(?:(?:(?!>).)+)>)*)\n*((?:(?!\|\|).\n*)*)', table)
  102. if all_table:
  103. all_table = all_table.groups()
  104. return_table = table_parser(all_table[1], all_table[2], all_table[0])
  105. number = return_table[6]
  106. table = re.sub('^((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*', '\n<table ' + return_table[5] + ' ' + return_table[0] + '><tbody><tr ' + return_table[1] + '><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  107. else:
  108. break
  109. table = re.sub('\|\|\n?$', '</td></tr></tbody></table>', table)
  110. while 1:
  111. row_table = re.search('\|\|\n((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*((?:(?!\|\||<\/td>).\n*)*)', table)
  112. if row_table:
  113. row_table = row_table.groups()
  114. return_table = table_parser(row_table[1], row_table[2], row_table[0], number)
  115. table = re.sub('\|\|\n((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*', '</td></tr><tr ' + return_table[1] + '><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  116. else:
  117. break
  118. while 1:
  119. cel_table = re.search('((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*((?:(?:(?!\|\||<\/td>).)|\n)*\n*)', table)
  120. if cel_table:
  121. cel_table = cel_table.groups()
  122. return_table = table_parser(cel_table[1], re.sub('\n', ' ', cel_table[2]), cel_table[0], number)
  123. table = re.sub('((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*', '</td><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  124. else:
  125. break
  126. data = re.sub('\n((?:(?:(?:(?:\|\|)+(?:(?:(?!\|\|).(?:\n)*)*))+)\|\|(?:\n)?)+)', table, data, 1)
  127. else:
  128. break
  129. return data
  130. def middle_parser(data, fol_num, syntax_num, folding_num):
  131. global end_data
  132. global plus_data
  133. middle_stack = 0
  134. middle_list = []
  135. middle_number = 0
  136. middle_re = re.compile('(?:{{{((?:(?:(?! |{{{|}}}|&lt;).)*) ?)|(}}}))')
  137. while 1:
  138. middle_data = middle_re.search(data)
  139. if middle_data:
  140. middle_data = middle_data.groups()
  141. if not middle_data[1]:
  142. if middle_stack > 0:
  143. middle_stack += 1
  144. data = re.sub('(?:{{{((?:(?! |{{{|}}}|&lt;).)*)(?P<in> ?)|(}}}))', '&#123;&#123;&#123;' + middle_data[0] + '\g<in>', data, 1)
  145. else:
  146. if re.search('^(#|@|\+|\-)', middle_data[0]) and not re.search('^(#|@|\+|\-){2}', middle_data[0]):
  147. middle_search = re.search('^(#(?:[0-9a-f-A-F]{3}){1,2})', middle_data[0])
  148. if middle_search:
  149. middle_list += ['span']
  150. data = middle_re.sub('<span style="color: ' + middle_search.groups()[0] + ';">', data, 1)
  151. else:
  152. middle_search = re.search('^(?:#(\w+))', middle_data[0])
  153. if middle_search:
  154. middle_list += ['span']
  155. data = middle_re.sub('<span style="color: ' + middle_search.groups()[0] + ';">', data, 1)
  156. else:
  157. middle_search = re.search('^(?:@((?:[0-9a-f-A-F]{3}){1,2}))', middle_data[0])
  158. if middle_search:
  159. middle_list += ['span']
  160. data = middle_re.sub('<span style="background: #' + middle_search.groups()[0] + ';">', data, 1)
  161. else:
  162. middle_search = re.search('^(?:@(\w+))', middle_data[0])
  163. if middle_search:
  164. middle_list += ['span']
  165. data = middle_re.sub('<span style="background: ' + middle_search.groups()[0] + ';">', data, 1)
  166. else:
  167. middle_search = re.search('^(\+|-)([1-5])', middle_data[0])
  168. if middle_search:
  169. middle_search = middle_search.groups()
  170. if middle_search[0] == '+':
  171. font_size = str(int(middle_search[1]) * 20 + 100)
  172. else:
  173. font_size = str(100 - int(middle_search[1]) * 10)
  174. middle_list += ['span']
  175. data = middle_re.sub('<span style="font-size: ' + font_size + '%;">', data, 1)
  176. else:
  177. middle_search = re.search('^#!wiki', middle_data[0])
  178. if middle_search:
  179. middle_data_2 = re.search('{{{#!wiki(?: style=(?:&quot;|&#x27;)((?:(?!&quot;|&#x27;).)*)(?:&quot;|&#x27;))?\n?', data)
  180. if middle_data_2:
  181. middle_data_2 = middle_data_2.groups()
  182. else:
  183. middle_data_2 = ['']
  184. middle_list += ['div_end']
  185. data = re.sub('{{{#!wiki(?: style=(?:&quot;|&#x27;)((?:(?!&quot;|&#x27;).)*)(?:&quot;|&#x27;))?\n?', '<div id="wiki_div" style="' + str(middle_data_2[0]) + '">', data, 1)
  186. else:
  187. middle_search = re.search('^#!syntax', middle_data[0])
  188. if middle_search:
  189. middle_data_2 = re.search('{{{#!syntax ((?:(?!\n).)+)\n?', data)
  190. if middle_data_2:
  191. middle_data_2 = middle_data_2.groups()
  192. else:
  193. middle_data_2 = ['python']
  194. if syntax_num == 0:
  195. plus_data += '''
  196. <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/9.12.0/styles/default.min.css">
  197. <script src="//cdnjs.cloudflare.com/ajax/libs/highlight.js/9.12.0/highlight.min.js"></script>
  198. <script>hljs.initHighlightingOnLoad();</script>
  199. '''
  200. syntax_num = 1
  201. middle_list += ['pre']
  202. data = re.sub('{{{#!syntax ?((?:(?!\n).)*)\n?', '<pre id="syntax"><code class="' + middle_data_2[0] + '">', data, 1)
  203. else:
  204. middle_search = re.search('^#!folding', middle_data[0])
  205. if middle_search:
  206. middle_list += ['2div']
  207. folding_data = re.search('{{{#!folding ?((?:(?!\n).)*)\n?', data)
  208. if folding_data:
  209. folding_data = folding_data.groups()
  210. else:
  211. folding_data = ['Test']
  212. if folding_num == 0:
  213. folding_num = 1
  214. data = re.sub('{{{#!folding ?((?:(?!\n).)*)\n?', '<div>' + str(folding_data[0]) + ' <div style="display: inline-block;"><a href="javascript:void(0);" onclick="folding(' + str(fol_num) + ');">[do]</a></div_end><div id="folding_' + str(fol_num) + '" style="display: none;"><div id="wiki_div" style="">', data, 1)
  215. fol_num += 1
  216. else:
  217. middle_list += ['span']
  218. data = middle_re.sub('<span>', data, 1)
  219. else:
  220. middle_list += ['code']
  221. middle_stack += 1
  222. data = middle_re.sub('<code>' + middle_data[0].replace('\\', '\\\\'), data, 1)
  223. middle_number += 1
  224. else:
  225. if middle_list == []:
  226. data = middle_re.sub('&#125;&#125;&#125;', data, 1)
  227. else:
  228. if middle_stack > 0:
  229. middle_stack -= 1
  230. if middle_stack > 0:
  231. data = middle_re.sub('&#125;&#125;&#125;', data, 1)
  232. else:
  233. if middle_number > 0:
  234. middle_number -= 1
  235. if middle_list[middle_number] == '2div':
  236. data = middle_re.sub('</div_end></div_end></div_end>', data, 1)
  237. elif middle_list[middle_number] == 'pre':
  238. data = middle_re.sub('</code></pre>', data, 1)
  239. else:
  240. data = middle_re.sub('</' + middle_list[middle_number] + '>', data, 1)
  241. del(middle_list[middle_number])
  242. else:
  243. if middle_stack == 0:
  244. break
  245. else:
  246. if middle_list == []:
  247. data += '&#125;&#125;&#125;'
  248. else:
  249. if middle_stack > 0:
  250. middle_stack -= 1
  251. if middle_stack > 0:
  252. data += '&#125;&#125;&#125;'
  253. else:
  254. if middle_number > 0:
  255. middle_number -= 1
  256. if middle_list[middle_number] == '2div':
  257. data += '</div_end></div_end></div_end>'
  258. elif middle_list[middle_number] == 'pre':
  259. data += '</code></pre>'
  260. else:
  261. data += '</' + middle_list[middle_number] + '>'
  262. del(middle_list[middle_number])
  263. num = 0
  264. while 1:
  265. nowiki_data = re.search('<code>((?:(?:(?!<\/code>).)*\n*)*)<\/code>', data)
  266. if nowiki_data:
  267. nowiki_data = nowiki_data.groups()
  268. num += 1
  269. end_data += [['nowiki_' + str(num), nowiki_data[0], 'code']]
  270. data = re.sub('<code>((?:(?:(?!<\/code>).)*\n*)*)<\/code>', '<span id="nowiki_' + str(num) + '"></span>', data, 1)
  271. else:
  272. break
  273. num = 0
  274. while 1:
  275. syntax_data = re.search('<code class="((?:(?!").)+)">((?:(?:(?:(?!<\/code>|<span id="syntax_)).)+\n*)+)<\/code>', data)
  276. if syntax_data:
  277. syntax_data = syntax_data.groups()
  278. num += 1
  279. end_data += [['syntax_' + str(num), syntax_data[1], 'normal']]
  280. data = re.sub('<code class="((?:(?!").)+)">((?:(?:(?:(?!<\/code>|<span id="syntax_)).)+\n*)+)<\/code>', '<code class="' + syntax_data[0] + '"><span id="syntax_' + str(num) + '"></span></code>', data, 1)
  281. else:
  282. break
  283. return [data, [fol_num, syntax_num, folding_num]]
  284. def link_fix(main_link):
  285. if re.search('^:', main_link):
  286. main_link = re.sub('^:', '', main_link)
  287. main_link = re.sub('^사용자:', 'user:', main_link)
  288. main_link = re.sub('^파일:', 'file:', main_link)
  289. main_link = re.sub('^분류:', 'category:', main_link)
  290. other_link = re.search('(#.+)$', main_link)
  291. if other_link:
  292. other_link = other_link.groups()[0]
  293. main_link = re.sub('(#.+)$', '', main_link)
  294. else:
  295. other_link = ''
  296. return [main_link, other_link]
  297. def namu(conn, data, title, main_num):
  298. curs = conn.cursor()
  299. global plus_data
  300. global end_data
  301. data = '\n' + data + '\n'
  302. plus_data = ''
  303. backlink = []
  304. end_data = []
  305. data = html.escape(data)
  306. data = re.sub('\r\n', '\n', data)
  307. t_data = middle_parser(data, 0, 0, 0)
  308. data = t_data[0]
  309. include_re = re.compile('\[include\(((?:(?!\)\]).)+)\)\]', re.I)
  310. while 1:
  311. include = include_re.search(data)
  312. if include:
  313. include = include.groups()[0]
  314. include_data = re.search('^((?:(?!,).)+)', include)
  315. if include_data:
  316. include_data = include_data.groups()[0]
  317. else:
  318. include_data = 'Test'
  319. include_link = include_data
  320. backlink += [[title, include_link, 'include']]
  321. include = re.sub('^((?:(?!,).)+)', '', include)
  322. num = 0
  323. while 1:
  324. include_one_nowiki = re.search('(?:\\\\){2}(.)', include)
  325. if include_one_nowiki:
  326. include_one_nowiki = include_one_nowiki.groups()
  327. num += 1
  328. end_data += [['include_one_nowiki_' + str(num), include_one_nowiki[0], 'normal']]
  329. include = re.sub('(?:\\\\){2}(.)', '<span id="include_one_nowiki_' + str(num) + '"></span>', include, 1)
  330. else:
  331. break
  332. curs.execute("select data from data where title = ?", [include_data])
  333. include_data = curs.fetchall()
  334. if include_data:
  335. include_parser = include_re.sub('', include_data[0][0])
  336. include_parser = html.escape(include_parser)
  337. while 1:
  338. include_plus = re.search(', ?((?:(?!=).)+)=((?:(?!,).)+)', include)
  339. if include_plus:
  340. include_plus = include_plus.groups()
  341. include_parser = include_parser.replace('@' + include_plus[0] + '@', include_plus[1])
  342. include = re.sub(', ?((?:(?!=).)+)=((?:(?!,).)+)', '', include, 1)
  343. else:
  344. break
  345. include_parser = re.sub('\[\[(?:category|분류):(((?!\]\]|#include).)+)\]\]', '', include_parser)
  346. data = include_re.sub('<include>\n<a id="include_link" href="/w/' + tool.url_pas(include_link) + '">[' + include_link + ']</a>\n' + include_parser + '\n</include>', data, 1)
  347. else:
  348. data = include_re.sub('<a id="not_thing" href="/w/' + tool.url_pas(include_link) + '">' + include_link + '</a>', data, 1)
  349. else:
  350. break
  351. data = re.sub('\r\n', '\n', data)
  352. t_data = middle_parser(data, t_data[1][0], t_data[1][1], t_data[1][2])
  353. data = t_data[0]
  354. data = re.sub('&amp;', '&', data)
  355. data = re.sub('\n( +)\|\|', '\n||', data)
  356. data = re.sub('\|\|( +)\n', '||\n', data)
  357. data = re.sub('\n##(((?!\n).)+)', '', data)
  358. while 1:
  359. wiki_table_data = re.search('<div id="wiki_div" ((?:(?!>).)+)>((?:(?!<div id="wiki_div"|<\/div_end>).\n*)+)<\/div_end>', data)
  360. if wiki_table_data:
  361. wiki_table_data = wiki_table_data.groups()
  362. if re.search('\|\|', wiki_table_data[1]):
  363. end_parser = re.sub('\n$', '', re.sub('^\n', '', table_start('\n' + wiki_table_data[1] + '\n')))
  364. else:
  365. end_parser = wiki_table_data[1]
  366. data = re.sub('<div id="wiki_div" ((?:(?!>).)+)>((?:(?!<div id="wiki_div"|<\/div_end>).\n*)+)<\/div_end>', '<div ' + wiki_table_data[0] + '>' + end_parser + '</div>', data, 1)
  367. else:
  368. break
  369. data = re.sub('<\/div_end>', '</div>', data)
  370. data = re.sub('<\/td>', '</td_end>', data)
  371. first = 0
  372. math_re = re.compile('\[math\(((?:(?!\)\]).)+)\)\]', re.I)
  373. while 1:
  374. math = math_re.search(data)
  375. if math:
  376. if first == 0:
  377. plus_data += '''
  378. <link rel="stylesheet"
  379. href="https://cdn.jsdelivr.net/npm/katex@0.10.1/dist/katex.min.css"
  380. integrity="sha384-dbVIfZGuN1Yq7/1Ocstc1lUEm+AT+/rCkibIcC/OmWo5f0EA48Vf8CytHzGrSwbQ"
  381. crossorigin="anonymous">
  382. <script src="https://cdn.jsdelivr.net/npm/katex@0.10.1/dist/katex.min.js"
  383. integrity="sha384-2BKqo+exmr9su6dir+qCw08N2ZKRucY4PrGQPPWU1A7FtlCGjmEGFqXCv5nyM5Ij"
  384. crossorigin="anonymous"></script>
  385. '''
  386. math = math.groups()[0]
  387. first += 1
  388. data = math_re.sub('<span id="math_' + str(first) + '"></span>', data, 1)
  389. plus_data += '''
  390. <script>
  391. katex.render(
  392. "''' + math.replace('\\', '\\\\').replace('&lt;', '<').replace('&gt;', '>') + '''",
  393. document.getElementById("math_''' + str(first) + '''")
  394. );
  395. </script>
  396. '''
  397. else:
  398. break
  399. num = 0
  400. while 1:
  401. one_nowiki = re.search('(?:\\\\)(.)', data)
  402. if one_nowiki:
  403. one_nowiki = one_nowiki.groups()
  404. num += 1
  405. end_data += [['one_nowiki_' + str(num), one_nowiki[0], 'normal']]
  406. data = re.sub('(?:\\\\)(.)', '<span id="one_nowiki_' + str(num) + '"></span>', data, 1)
  407. else:
  408. break
  409. while 1:
  410. hr = re.search('\n-{4,9}\n', data)
  411. if hr:
  412. data = re.sub('\n-{4,9}\n', '\n<hr>\n', data, 1)
  413. else:
  414. break
  415. data += '\n'
  416. data = data.replace('\\', '&#92;')
  417. data = re.sub('&#x27;&#x27;&#x27;(?P<in>((?!&#x27;&#x27;&#x27;).)+)&#x27;&#x27;&#x27;', '<b>\g<in></b>', data)
  418. data = re.sub('&#x27;&#x27;(?P<in>((?!&#x27;&#x27;).)+)&#x27;&#x27;', '<i>\g<in></i>', data)
  419. data = re.sub('~~(?P<in>(?:(?!~~).)+)~~', '<s>\g<in></s>', data)
  420. data = re.sub('--(?P<in>(?:(?!--).)+)--', '<s>\g<in></s>', data)
  421. data = re.sub('__(?P<in>(?:(?!__).)+)__', '<u>\g<in></u>', data)
  422. data = re.sub('\^\^(?P<in>(?:(?!\^\^).)+)\^\^', '<sup>\g<in></sup>', data)
  423. data = re.sub(',,(?P<in>(?:(?!,,).)+),,', '<sub>\g<in></sub>', data)
  424. redirect_re = re.compile('\n#(?:redirect|넘겨주기) ((?:(?!\n).)+)\n', re.I)
  425. redirect = redirect_re.search(data)
  426. if redirect:
  427. redirect = redirect.groups()[0]
  428. return_link = link_fix(redirect)
  429. main_link = return_link[0]
  430. other_link = return_link[1]
  431. backlink += [[title, main_link, 'redirect']]
  432. data = redirect_re.sub('\n * ' + title + ' - [[' + main_link + ']]\n', data, 1)
  433. no_toc_re = re.compile('\[(?:목차|toc)\((?:no)\)\]\n', re.I)
  434. toc_re = re.compile('\[(?:목차|toc)\]', re.I)
  435. if not no_toc_re.search(data):
  436. if not toc_re.search(data):
  437. data = re.sub('\n(?P<in>={1,6}) ?(?P<out>(?:(?!=).)+) ?={1,6}\n', '\n[toc]\n\g<in> \g<out> \g<in>\n', data, 1)
  438. else:
  439. data = no_toc_re.sub('', data)
  440. toc_full = 0
  441. toc_top_stack = 6
  442. toc_stack = [0, 0, 0, 0, 0, 0]
  443. edit_number = 0
  444. toc_data = '<div id="toc"><span style="font-size: 18px;">toc</span>\n\n'
  445. while 1:
  446. toc = re.search('\n(={1,6}) ?((?:(?!\n).)+) ?\n', data)
  447. if toc:
  448. toc = toc.groups()
  449. toc_number = len(toc[0])
  450. edit_number += 1
  451. if toc_full > toc_number:
  452. for i in range(toc_number, 6):
  453. toc_stack[i] = 0
  454. if toc_top_stack > toc_number:
  455. toc_top_stack = toc_number
  456. toc_full = toc_number
  457. toc_stack[toc_number - 1] += 1
  458. toc_number = str(toc_number)
  459. all_stack = ''
  460. for i in range(0, 6):
  461. all_stack += str(toc_stack[i]) + '.'
  462. while 1:
  463. if re.search('[^0-9]0\.', all_stack):
  464. all_stack = re.sub('[^0-9]0\.', '.', all_stack)
  465. else:
  466. break
  467. all_stack = re.sub('^0\.', '', all_stack)
  468. data = re.sub('\n(={1,6}) ?((?:(?!\n).)+) ?\n', '\n<h' + toc_number + ' id="s-' + re.sub('\.$', '', all_stack) + '"><a href="#toc">' + all_stack + '</a> ' + re.sub('=*$', '', toc[1]) + ' <span style="font-size: 12px"><a href="/edit/' + tool.url_pas(title) + '?section=' + str(edit_number) + '">(Edit)</a></span></h' + toc_number + '>\n', data, 1)
  469. toc_main_data = toc[1]
  470. toc_main_data = re.sub('=*$', '', toc_main_data)
  471. toc_main_data = re.sub('\[\*((?:(?! |\]).)*)(?: ((?:(?!(\[\*(?:(?:(?!\]).)+)\]|\])).)+))?\]', '', toc_main_data)
  472. toc_main_data = re.sub('<span id="math_[0-9]"><\/span>', '(수식)', toc_main_data)
  473. toc_data += '<span style="margin-left: ' + str((toc_full - toc_top_stack) * 10) + 'px;"><a href="#s-' + re.sub('\.$', '', all_stack) + '">' + all_stack + '</a> ' + toc_main_data + '</span>\n'
  474. else:
  475. break
  476. toc_data += '</div>'
  477. data = toc_re.sub(toc_data, data)
  478. data = tool.savemark(data)
  479. anchor_re = re.compile("\[anchor\((?P<in>(?:(?!\)\]).)+)\)\]", re.I)
  480. data = anchor_re.sub('<span id="\g<in>"></span>', data)
  481. ruby_re = re.compile("\[ruby\((?P<in>(?:(?!,).)+)\, ?ruby=(?P<out>(?:(?!\)\]|,).)+)(?:\, ?color=(?P<under>(?:(?!\)\]).)+))?\)\]", re.I)
  482. data = ruby_re.sub('<ruby>\g<in><rp>(</rp><rt style="color: \g<under>">\g<out></rt><rp>)</rp></ruby>', data)
  483. now_time = tool.get_time()
  484. date_re = re.compile('\[date\]', re.I)
  485. data = date_re.sub(now_time, data)
  486. time_data = re.search('^([0-9]{4}-[0-9]{2}-[0-9]{2})', now_time)
  487. time = time_data.groups()
  488. age_re = re.compile('\[age\(([0-9]{4}-[0-9]{2}-[0-9]{2})\)\]', re.I)
  489. while 1:
  490. age_data = age_re.search(data)
  491. if age_data:
  492. age = age_data.groups()[0]
  493. old = datetime.datetime.strptime(time[0], '%Y-%m-%d')
  494. will = datetime.datetime.strptime(age, '%Y-%m-%d')
  495. e_data = old - will
  496. data = age_re.sub(str(int(e_data.days / 365)), data, 1)
  497. else:
  498. break
  499. dday_re = re.compile('\[dday\(([0-9]{4}-[0-9]{2}-[0-9]{2})\)\]', re.I)
  500. while 1:
  501. dday_data = dday_re.search(data)
  502. if dday_data:
  503. dday = dday_data.groups()[0]
  504. old = datetime.datetime.strptime(time[0], '%Y-%m-%d')
  505. will = datetime.datetime.strptime(dday, '%Y-%m-%d')
  506. e_data = old - will
  507. if re.search('^-', str(e_data.days)):
  508. e_day = str(e_data.days)
  509. else:
  510. e_day = '+' + str(e_data.days)
  511. data = dday_re.sub(e_day, data, 1)
  512. else:
  513. break
  514. video_re = re.compile('\[(youtube|kakaotv|nicovideo)\(((?:(?!\)\]).)+)\)\]', re.I)
  515. youtube_re = re.compile('youtube', re.I)
  516. kakaotv_re = re.compile('kakaotv', re.I)
  517. while 1:
  518. video = video_re.search(data)
  519. if video:
  520. video = video.groups()
  521. width = re.search(', ?width=((?:(?!,).)+)', video[1])
  522. if width:
  523. video_width = width.groups()[0]
  524. else:
  525. video_width = '560'
  526. height = re.search(', ?height=((?:(?!,).)+)', video[1])
  527. if height:
  528. video_height = height.groups()[0]
  529. else:
  530. video_height = '315'
  531. code = re.search('^((?:(?!,).)+)', video[1])
  532. if code:
  533. video_code = code.groups()[0]
  534. else:
  535. video_code = ''
  536. if youtube_re.search(video[0]):
  537. video_code = re.sub('^https:\/\/www\.youtube\.com\/watch\?v=', '', video_code)
  538. video_code = re.sub('^https:\/\/youtu\.be\/', '', video_code)
  539. video_src = 'https://www.youtube.com/embed/' + video_code
  540. elif kakaotv_re.search(video[0]):
  541. video_code = re.sub('^https:\/\/tv\.kakao\.com\/channel\/9262\/cliplink\/', '', video_code)
  542. video_code = re.sub('^http:\/\/tv\.kakao\.com\/v\/', '', video_code)
  543. video_src = 'https://tv.kakao.com/embed/player/cliplink/' + video_code +'?service=kakao_tv'
  544. else:
  545. video_src = 'https://embed.nicovideo.jp/watch/' + video_code
  546. data = video_re.sub('<iframe width="' + video_width + '" height="' + video_height + '" src="' + video_src + '" allowfullscreen frameborder="0"></iframe>', data, 1)
  547. else:
  548. break
  549. while 1:
  550. block = re.search('(\n(?:&gt; ?(?:(?:(?!\n).)+)?\n)+)', data)
  551. if block:
  552. block = block.groups()[0]
  553. block = re.sub('^\n&gt; ?', '', block)
  554. block = re.sub('\n&gt; ?', '\n', block)
  555. block = re.sub('\n$', '', block)
  556. data = re.sub('(\n(?:&gt; ?(?:(?:(?!\n).)+)?\n)+)', '\n<blockquote>' + block + '</blockquote>\n', data, 1)
  557. else:
  558. break
  559. data = re.sub('(?P<in>\n +\* ?(?:(?:(?!\|\|).)+))\|\|', '\g<in>\n ||', data)
  560. while 1:
  561. li = re.search('(\n(?:(?: *)\* ?(?:(?:(?!\n).)+)\n)+)', data)
  562. if li:
  563. li = li.groups()[0]
  564. while 1:
  565. sub_li = re.search('\n(?:( *)\* ?((?:(?!\n).)+))', li)
  566. if sub_li:
  567. sub_li = sub_li.groups()
  568. if len(sub_li[0]) == 0:
  569. margin = 20
  570. else:
  571. margin = len(sub_li[0]) * 20
  572. li = re.sub('\n(?:( *)\* ?((?:(?!\n).)+))', '<li style="margin-left: ' + str(margin) + 'px;">' + sub_li[1] + '</li>', li, 1)
  573. else:
  574. break
  575. data = re.sub('(\n(?:(?: *)\* ?(?:(?:(?!\n).)+)\n)+)', '\n\n<ul>' + li + '</ul>\n', data, 1)
  576. else:
  577. break
  578. data = re.sub('<\/ul>\n \|\|', '</ul>||', data)
  579. while 1:
  580. indent = re.search('\n( +)', data)
  581. if indent:
  582. indent = len(indent.groups()[0])
  583. margin = '<span style="margin-left: 20px;"></span>' * indent
  584. data = re.sub('\n( +)', '\n' + margin, data, 1)
  585. else:
  586. break
  587. data = table_start(data)
  588. category = '\n<hr><div id="cate">Category : '
  589. category_re = re.compile('^(?:category|분류):', re.I)
  590. while 1:
  591. link = re.search('\[\[((?:(?!\[\[|\]\]).)+)\]\]', data)
  592. if link:
  593. link = link.groups()[0]
  594. link_split = re.search('((?:(?!\|).)+)(?:\|((?:(?!\|).)+))', link)
  595. if link_split:
  596. link_split = link_split.groups()
  597. main_link = link_split[0]
  598. see_link = link_split[1]
  599. else:
  600. main_link = link
  601. see_link = link
  602. if re.search('^((?:file|파일)|(?:out|외부)):', main_link):
  603. file_style = ''
  604. width = re.search('width=((?:(?!&).)+)', see_link)
  605. if width:
  606. file_width = width.groups()[0]
  607. if re.search('px$', file_width):
  608. file_style += 'width: ' + file_width + ';'
  609. else:
  610. file_style += 'width: ' + file_width + 'px;'
  611. height = re.search('height=((?:(?!&).)+)', see_link)
  612. if height:
  613. file_height = height.groups()[0]
  614. if re.search('px$', file_height):
  615. file_style += 'height: ' + file_height + ';'
  616. else:
  617. file_style += 'height: ' + file_height + 'px;'
  618. align = re.search('align=((?:(?!&).)+)', see_link)
  619. if align:
  620. file_align = align.groups()[0]
  621. if file_align == 'center':
  622. file_align = 'display: block; text-align: center;'
  623. else:
  624. file_align = 'float: ' + file_align + ';'
  625. else:
  626. file_align = ''
  627. if re.search('^(?:out|외부):', main_link):
  628. file_src = re.sub('^(?:out|외부):', '', main_link)
  629. file_alt = main_link
  630. exist = 'Yes'
  631. else:
  632. file_data = re.search('^(?:file|파일):((?:(?!\.).)+)\.(.+)$', main_link)
  633. if file_data:
  634. file_data = file_data.groups()
  635. file_name = file_data[0]
  636. file_end = file_data[1]
  637. backlink += [[title, main_link, 'file']]
  638. else:
  639. file_name = 'TEST'
  640. file_end = 'jpg'
  641. file_src = '/image/' + tool.sha224(file_name) + '.' + file_end
  642. file_alt = 'file:' + file_name + '.' + file_end
  643. curs.execute("select title from data where title = ?", [file_alt])
  644. exist = curs.fetchall()
  645. if exist:
  646. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<span style="' + file_align + '"><img style="' + file_style + '" alt="' + file_alt + '" src="' + file_src + '"></span>', data, 1)
  647. else:
  648. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="not_thing" href="/w/' + tool.url_pas(file_alt) + '">' + file_alt + '</a>', data, 1)
  649. elif category_re.search(main_link):
  650. see_link = re.sub('#include', '', see_link)
  651. main_link = re.sub('#include', '', category_re.sub('category:', main_link))
  652. if re.search('#blur', main_link):
  653. see_link = 'Hidden'
  654. link_id = 'id="inside"'
  655. main_link = re.sub('#blur', '', main_link)
  656. else:
  657. link_id = ''
  658. backlink += [[title, main_link, 'cat']]
  659. category += '<a ' + link_id + ' href="' + tool.url_pas(main_link) + '">' + category_re.sub('', see_link) + '</a> / '
  660. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '', data, 1)
  661. elif re.search('^wiki:', main_link):
  662. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="inside" href="/' + tool.url_pas(re.sub('^wiki:', '', main_link)) + '">' + see_link + '</a>', data, 1)
  663. elif re.search('^inter:((?:(?!:).)+):', main_link):
  664. inter_data = re.search('^inter:((?:(?!:).)+):((?:(?!\]\]|\|).)+)', main_link)
  665. inter_data = inter_data.groups()
  666. curs.execute('select link from inter where title = ?', [inter_data[0]])
  667. inter = curs.fetchall()
  668. if inter:
  669. if see_link != main_link:
  670. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="inside" href="' + inter[0][0] + inter_data[1] + '">' + inter_data[0] + ':' + see_link + '</a>', data, 1)
  671. else:
  672. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="inside" href="' + inter[0][0] + inter_data[1] + '">' + inter_data[0] + ':' + inter_data[1] + '</a>', data, 1)
  673. else:
  674. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', 'Not exist', data, 1)
  675. elif re.search('^\/', main_link):
  676. under_title = re.search('^(\/(?:.+))$', main_link)
  677. under_title = under_title.groups()[0]
  678. if see_link != main_link:
  679. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '[[' + title + under_title + '|' + see_link + ']]', data, 1)
  680. else:
  681. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '[[' + title + under_title + ']]', data, 1)
  682. elif re.search('^http(s)?:\/\/', main_link):
  683. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="out_link" rel="nofollow" href="' + main_link + '">' + see_link + '</a>', data, 1)
  684. else:
  685. return_link = link_fix(main_link)
  686. main_link = return_link[0]
  687. other_link = return_link[1]
  688. if re.search('^\/', main_link):
  689. main_link = re.sub('^\/', title + '/', main_link)
  690. elif re.search('\.\.\/\/', main_link):
  691. main_link = re.sub('\.\.\/\/', '/', main_link)
  692. elif re.search('^\.\.\/', main_link):
  693. main_link = re.sub('^\.\.\/', re.sub('(?P<in>.+)\/.*$', '\g<in>', title), main_link)
  694. if not re.search('^\|', main_link):
  695. if main_link != title:
  696. if main_link != '':
  697. curs.execute("select title from data where title = ?", [main_link])
  698. if not curs.fetchall():
  699. link_id = 'id="not_thing"'
  700. backlink += [[title, main_link, 'no']]
  701. else:
  702. link_id = ''
  703. backlink += [[title, main_link, '']]
  704. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a ' + link_id + ' href="/w/' + tool.url_pas(main_link) + other_link + '">' + see_link + '</a>', data, 1)
  705. else:
  706. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a href="' + other_link + '">' + see_link + '</a>', data, 1)
  707. else:
  708. if re.search('^#', other_link):
  709. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a href="' + other_link + '">' + other_link + '</a>', data, 1)
  710. else:
  711. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<b>' + see_link + '</b>', data, 1)
  712. else:
  713. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '&#91;&#91;' + link + '&#93;&#93;', data, 1)
  714. else:
  715. break
  716. br_re = re.compile('\[br\]', re.I)
  717. data = br_re.sub('<br>', data)
  718. footnote_number = 0
  719. footnote_all = []
  720. footnote_dict = {}
  721. footnote_re = {}
  722. footdata_all = '\n<hr><ul id="footnote_data">'
  723. re_footnote = re.compile('(?:\[\*((?:(?! |\]).)*)(?: ((?:(?!(?:\[\*|\])).)+))?\]|(\[(?:각주|footnote)\]))')
  724. while 1:
  725. footnote = re_footnote.search(data)
  726. if footnote:
  727. footnote_data = footnote.groups()
  728. if footnote_data[2]:
  729. footnote_all.sort()
  730. for footdata in footnote_all:
  731. if footdata[2] == 0:
  732. footdata_in = ''
  733. else:
  734. footdata_in = footdata[2]
  735. footdata_all += '<li><a href="#rfn-' + str(footdata[0]) + '">(' + footdata[1] + ')</a> <span id="fn-' + str(footdata[0]) + '">' + footdata_in + '</span></li>'
  736. data = re_footnote.sub(footdata_all + '</ul>', data, 1)
  737. footnote_all = []
  738. footdata_all = '\n<hr><ul id="footnote_data">'
  739. else:
  740. footnote = footnote_data[1]
  741. footnote_name = footnote_data[0]
  742. if footnote_name and not footnote:
  743. if footnote_name in footnote_dict:
  744. footnote_re[footnote_name] += 1
  745. foot_plus_num = str(footnote_re[footnote_name])
  746. footshort = footnote_dict[footnote_name] + '.' + foot_plus_num
  747. footnote_all += [[float(footshort), footshort, 0]]
  748. data = re_footnote.sub('<sup><a href="javascript:open_foot(\'fn-' + footshort + '\')" id="rfn-' + footshort + '">(' + footnote_name + ')</a></sup><span class="foot_plus" id="cfn-' + footshort + '"></span>', data, 1)
  749. else:
  750. data = re_footnote.sub('<sup><a href="#">(' + footnote_name + ')</a></sup>', data, 1)
  751. else:
  752. footnote_number += 1
  753. if not footnote_name:
  754. footnote_name = str(footnote_number)
  755. footnote_dict.update({ footnote_name : str(footnote_number) })
  756. if not footnote_name in footnote_re:
  757. footnote_re.update({ footnote_name : 0 })
  758. else:
  759. footnote_re[footnote_name] += 1
  760. footnote_all += [[footnote_number, footnote_name, footnote]]
  761. data = re_footnote.sub('<sup><a href="javascript:open_foot(\'fn-' + str(footnote_number) + '\')" id="rfn-' + str(footnote_number) + '">(' + footnote_name + ')</a></sup><span class="foot_plus" id="cfn-' + str(footnote_number) + '"></span>', data, 1)
  762. else:
  763. break
  764. data = re.sub('\n+$', '', data)
  765. footnote_all.sort()
  766. for footdata in footnote_all:
  767. if footdata[2] == 0:
  768. footdata_in = ''
  769. else:
  770. footdata_in = footdata[2]
  771. footdata_all += '<li><a href="#rfn-' + str(footdata[0]) + '">(' + footdata[1] + ')</a> <span id="fn-' + str(footdata[0]) + '">' + footdata_in + '</span></li>'
  772. footdata_all += '</ul>'
  773. if footdata_all == '\n<hr><ul id="footnote_data"></ul>':
  774. footdata_all = ''
  775. data = re.sub('\n$', footdata_all, data + '\n', 1)
  776. category += '</div>'
  777. category = re.sub(' / <\/div>$', '</div>', category)
  778. if category == '\n<hr><div id="cate">Category : </div>':
  779. category = ''
  780. data += category
  781. i = 0
  782. while 1:
  783. try:
  784. _ = end_data[i][0]
  785. except:
  786. break
  787. if end_data[i][2] == 'normal':
  788. data = data.replace('<span id="' + end_data[i][0] + '"></span>', end_data[i][1])
  789. data = data.replace(tool.url_pas('<span id="' + end_data[i][0] + '"></span>'), tool.url_pas(end_data[i][1]))
  790. else:
  791. if re.search('\n', end_data[i][1]):
  792. data = data.replace('<span id="' + end_data[i][0] + '"></span>', '\n<pre>' + re.sub('^\n', '', end_data[i][1]) + '</pre>')
  793. else:
  794. data = data.replace('<span id="' + end_data[i][0] + '"></span>', '<code>' + end_data[i][1] + '</code>')
  795. i += 1
  796. if main_num == 1:
  797. i = 0
  798. while 1:
  799. try:
  800. _ = backlink[i][0]
  801. except:
  802. break
  803. find_data = re.search('<span id="(one_nowiki_[0-9]+)">', backlink[i][1])
  804. if find_data:
  805. j = 0
  806. find_data = find_data.groups()[0]
  807. while 1:
  808. try:
  809. _ = end_data[j][0]
  810. except:
  811. break
  812. if end_data[j][0] == find_data:
  813. backlink[i][1] = backlink[i][1].replace('<span id="' + end_data[j][0] + '"></span>', end_data[j][1])
  814. j += 1
  815. i += 1
  816. data = re.sub('<\/td_end>', '</td>', data)
  817. data = re.sub('<include>\n', '', data)
  818. data = re.sub('\n<\/include>', '', data)
  819. data = re.sub('(?P<in><\/h[0-9]>)(\n)+', '\g<in>', data)
  820. data = re.sub('\n\n<ul>', '\n<ul>', data)
  821. data = re.sub('<\/ul>\n\n', '</ul>', data)
  822. data = re.sub('^(\n)+', '', data)
  823. data = re.sub('(\n)+<hr><ul id="footnote_data">', '<hr><ul id="footnote_data">', data)
  824. data = re.sub('(?P<in><td(((?!>).)*)>)\n', '\g<in>', data)
  825. data = re.sub('(\n)?<hr>(\n)?', '<hr>', data)
  826. data = re.sub('<\/ul>\n\n<ul>', '</ul>\n<ul>', data)
  827. data = re.sub('\n', '<br>', data)
  828. return [data, plus_data, backlink]