# namu.py
  1. from . import tool
  2. import datetime
  3. import html
  4. import re
  5. def table_parser(data, cel_data, start_data, num = 0):
  6. table_class = 'class="'
  7. all_table = 'style="'
  8. cel_style = 'style="'
  9. row_style = 'style="'
  10. row = ''
  11. cel = ''
  12. table_width = re.search("<table ?width=((?:(?!>).)*)>", data)
  13. if table_width:
  14. if re.search('^[0-9]+$', table_width.groups()[0]):
  15. all_table += 'width: ' + table_width.groups()[0] + 'px;'
  16. else:
  17. all_table += 'width: ' + table_width.groups()[0] + ';'
  18. table_height = re.search("<table ?height=((?:(?!>).)*)>", data)
  19. if table_height:
  20. if re.search('^[0-9]+$', table_height.groups()[0]):
  21. all_table += 'height: ' + table_height.groups()[0] + 'px;'
  22. else:
  23. all_table += 'height: ' + table_height.groups()[0] + ';'
  24. table_align = re.search("<table ?align=((?:(?!>).)*)>", data)
  25. if table_align:
  26. if table_align.groups()[0] == 'right':
  27. all_table += 'float: right;'
  28. elif table_align.groups()[0] == 'center':
  29. all_table += 'margin: auto;'
  30. table_text_align = re.search("<table ?textalign=((?:(?!>).)*)>", data)
  31. if table_text_align:
  32. num = 1
  33. if table_text_align.groups()[0] == 'right':
  34. all_table += 'text-align: right;'
  35. elif table_text_align.groups()[0] == 'center':
  36. all_table += 'text-align: center;'
  37. row_table_align = re.search("<row ?textalign=((?:(?!>).)*)>", data)
  38. if row_table_align:
  39. if row_table_align.groups()[0] == 'right':
  40. row_style += 'text-align: right;'
  41. elif row_table_align.groups()[0] == 'center':
  42. row_style += 'text-align: center;'
  43. else:
  44. row_style += 'text-align: left;'
  45. table_cel = re.search("<-((?:(?!>).)*)>", data)
  46. if table_cel:
  47. cel = 'colspan="' + table_cel.groups()[0] + '"'
  48. else:
  49. cel = 'colspan="' + str(round(len(start_data) / 2)) + '"'
  50. table_row = re.search("<\|((?:(?!>).)*)>", data)
  51. if table_row:
  52. row = 'rowspan="' + table_row.groups()[0] + '"'
  53. row_bgcolor = re.search("<rowbgcolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  54. if row_bgcolor:
  55. row_style += 'background: ' + row_bgcolor.groups()[0] + ';'
  56. table_border = re.search("<table ?bordercolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  57. if table_border:
  58. all_table += 'border: ' + table_border.groups()[0] + ' 2px solid;'
  59. table_bgcolor = re.search("<table ?bgcolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  60. if table_bgcolor:
  61. all_table += 'background: ' + table_bgcolor.groups()[0] + ';'
  62. bgcolor = re.search("<(?:bgcolor=)?(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  63. if bgcolor:
  64. cel_style += 'background: ' + bgcolor.groups()[0] + ';'
  65. cel_width = re.search("<width=((?:(?!>).)*)>", data)
  66. if cel_width:
  67. cel_style += 'width: ' + cel_width.groups()[0] + 'px;'
  68. cel_height = re.search("<height=((?:(?!>).)*)>", data)
  69. if cel_height:
  70. cel_style += 'height: ' + cel_height.groups()[0] + 'px;'
  71. text_right = re.search("<\)>", data)
  72. text_center = re.search("<:>", data)
  73. text_left = re.search("<\(>", data)
  74. if text_right:
  75. cel_style += 'text-align: right;'
  76. elif text_center:
  77. cel_style += 'text-align: center;'
  78. elif text_left:
  79. cel_style += 'text-align: left;'
  80. elif num == 0:
  81. if re.search('^ ', cel_data) and re.search(' $', cel_data):
  82. cel_style += 'text-align: center;'
  83. elif re.search('^ ', cel_data):
  84. cel_style += 'text-align: right;'
  85. elif re.search(' $', cel_data):
  86. cel_style += 'text-align: left;'
  87. text_class = re.search("<table ?class=((?:(?!>).)+)>", data)
  88. if text_class:
  89. table_class += text_class.groups()[0]
  90. all_table += '"'
  91. cel_style += '"'
  92. row_style += '"'
  93. table_class += '"'
  94. return [all_table, row_style, cel_style, row, cel, table_class, num]
  95. def table_start(data):
  96. data = re.sub('\|\|\n(?P<in>(?:(?:(?:(?!\|\|).)+)\n?)+)\n\|\|', '|| \n\g<in> ||', data)
  97. while 1:
  98. table = re.search('\n((?:(?:(?:(?:\|\|)+(?:(?:(?!\|\|).(?:\n)*)*))+)\|\|(?:\n)?)+)', data)
  99. if table:
  100. table = table.groups()[0]
  101. while 1:
  102. all_table = re.search('^((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*((?:(?!\|\|).\n*)*)', table)
  103. if all_table:
  104. all_table = all_table.groups()
  105. return_table = table_parser(all_table[1], all_table[2], all_table[0])
  106. number = return_table[6]
  107. table = re.sub('^((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*', '\n<table ' + return_table[5] + ' ' + return_table[0] + '><tbody><tr ' + return_table[1] + '><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  108. else:
  109. break
  110. table = re.sub('\|\|\n?$', '</td></tr></tbody></table>', table)
  111. while 1:
  112. row_table = re.search('\|\|\n((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*((?:(?!\|\||<\/td>).\n*)*)', table)
  113. if row_table:
  114. row_table = row_table.groups()
  115. return_table = table_parser(row_table[1], row_table[2], row_table[0], number)
  116. table = re.sub('\|\|\n((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*', '</td></tr><tr ' + return_table[1] + '><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  117. else:
  118. break
  119. while 1:
  120. cel_table = re.search('((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*((?:(?:(?!\|\||<\/td>).)|\n)*\n*)', table)
  121. if cel_table:
  122. cel_table = cel_table.groups()
  123. return_table = table_parser(cel_table[1], re.sub('\n', ' ', cel_table[2]), cel_table[0], number)
  124. table = re.sub('((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*', '</td><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  125. else:
  126. break
  127. data = re.sub('\n((?:(?:(?:(?:\|\|)+(?:(?:(?!\|\|).(?:\n)*)*))+)\|\|(?:\n)?)+)', table, data, 1)
  128. else:
  129. break
  130. return data
  131. def middle_parser(data, fol_num, syntax_num, folding_num):
  132. global end_data
  133. global plus_data
  134. middle_stack = 0
  135. middle_list = []
  136. middle_number = 0
  137. middle_re = re.compile('(?:{{{((?:(?:(?! |{{{|}}}|&lt;).)*) ?)|(}}}))')
  138. while 1:
  139. middle_data = middle_re.search(data)
  140. if middle_data:
  141. middle_data = middle_data.groups()
  142. if not middle_data[1]:
  143. if middle_stack > 0:
  144. middle_stack += 1
  145. data = re.sub('(?:{{{((?:(?! |{{{|}}}|&lt;).)*)(?P<in> ?)|(}}}))', '&#123;&#123;&#123;' + middle_data[0] + '\g<in>', data, 1)
  146. else:
  147. if re.search('^(#|@|\+|\-)', middle_data[0]) and not re.search('^(#|@|\+|\-){2}|(#|@|\+|\-)\\\\', middle_data[0]):
  148. middle_search = re.search('^(#(?:[0-9a-f-A-F]{3}){1,2})', middle_data[0])
  149. if middle_search:
  150. middle_list += ['span']
  151. data = middle_re.sub('<span style="color: ' + middle_search.groups()[0] + ';">', data, 1)
  152. else:
  153. middle_search = re.search('^(?:#(\w+))', middle_data[0])
  154. if middle_search:
  155. middle_list += ['span']
  156. data = middle_re.sub('<span style="color: ' + middle_search.groups()[0] + ';">', data, 1)
  157. else:
  158. middle_search = re.search('^(?:@((?:[0-9a-f-A-F]{3}){1,2}))', middle_data[0])
  159. if middle_search:
  160. middle_list += ['span']
  161. data = middle_re.sub('<span style="background: #' + middle_search.groups()[0] + ';">', data, 1)
  162. else:
  163. middle_search = re.search('^(?:@(\w+))', middle_data[0])
  164. if middle_search:
  165. middle_list += ['span']
  166. data = middle_re.sub('<span style="background: ' + middle_search.groups()[0] + ';">', data, 1)
  167. else:
  168. middle_search = re.search('^(\+|-)([1-5])', middle_data[0])
  169. if middle_search:
  170. middle_search = middle_search.groups()
  171. if middle_search[0] == '+':
  172. font_size = str(int(middle_search[1]) * 20 + 100)
  173. else:
  174. font_size = str(100 - int(middle_search[1]) * 10)
  175. middle_list += ['span']
  176. data = middle_re.sub('<span style="font-size: ' + font_size + '%;">', data, 1)
  177. else:
  178. middle_search = re.search('^#!wiki', middle_data[0])
  179. if middle_search:
  180. middle_data_2 = re.search('{{{#!wiki(?: style=(?:&quot;|&#x27;)((?:(?!&quot;|&#x27;).)*)(?:&quot;|&#x27;))?\n?', data)
  181. if middle_data_2:
  182. middle_data_2 = middle_data_2.groups()
  183. else:
  184. middle_data_2 = ['']
  185. middle_list += ['div_end']
  186. data = re.sub('{{{#!wiki(?: style=(?:&quot;|&#x27;)((?:(?!&quot;|&#x27;).)*)(?:&quot;|&#x27;))?\n?', '<div id="wiki_div" style="' + str(middle_data_2[0]) + '">', data, 1)
  187. else:
  188. middle_search = re.search('^#!syntax', middle_data[0])
  189. if middle_search:
  190. middle_data_2 = re.search('{{{#!syntax ((?:(?!\n).)+)\n?', data)
  191. if middle_data_2:
  192. middle_data_2 = middle_data_2.groups()
  193. else:
  194. middle_data_2 = ['python']
  195. if syntax_num == 0:
  196. plus_data += '<script>hljs.initHighlightingOnLoad();</script>'
  197. syntax_num = 1
  198. middle_list += ['pre']
  199. data = re.sub('{{{#!syntax ?((?:(?!\n).)*)\n?', '<pre id="syntax"><code class="' + middle_data_2[0] + '">', data, 1)
  200. else:
  201. middle_search = re.search('^#!folding', middle_data[0])
  202. if middle_search:
  203. middle_list += ['2div']
  204. folding_data = re.search('{{{#!folding ?((?:(?!\n).)*)\n?', data)
  205. if folding_data:
  206. folding_data = folding_data.groups()
  207. else:
  208. folding_data = ['Test']
  209. if folding_num == 0:
  210. folding_num = 1
  211. data = re.sub('{{{#!folding ?((?:(?!\n).)*)\n?', '<div>' + str(folding_data[0]) + ' <div style="display: inline-block;"><a href="javascript:void(0);" onclick="folding(' + str(fol_num) + ');">[do]</a></div_end><div id="folding_' + str(fol_num) + '" style="display: none;"><div id="wiki_div" style="">', data, 1)
  212. fol_num += 1
  213. else:
  214. middle_list += ['span']
  215. data = middle_re.sub('<span>', data, 1)
  216. else:
  217. middle_list += ['code']
  218. middle_stack += 1
  219. data = middle_re.sub('<code>' + middle_data[0].replace('\\', '\\\\'), data, 1)
  220. middle_number += 1
  221. else:
  222. if middle_list == []:
  223. data = middle_re.sub('&#125;&#125;&#125;', data, 1)
  224. else:
  225. if middle_stack > 0:
  226. middle_stack -= 1
  227. if middle_stack > 0:
  228. data = middle_re.sub('&#125;&#125;&#125;', data, 1)
  229. else:
  230. if middle_number > 0:
  231. middle_number -= 1
  232. if middle_list[middle_number] == '2div':
  233. data = middle_re.sub('</div_end></div_end></div_end>', data, 1)
  234. elif middle_list[middle_number] == 'pre':
  235. data = middle_re.sub('</code></pre>', data, 1)
  236. else:
  237. data = middle_re.sub('</' + middle_list[middle_number] + '>', data, 1)
  238. del(middle_list[middle_number])
  239. else:
  240. if middle_stack == 0:
  241. break
  242. else:
  243. if middle_list == []:
  244. data += '&#125;&#125;&#125;'
  245. else:
  246. if middle_stack > 0:
  247. middle_stack -= 1
  248. if middle_stack > 0:
  249. data += '&#125;&#125;&#125;'
  250. else:
  251. if middle_number > 0:
  252. middle_number -= 1
  253. if middle_list[middle_number] == '2div':
  254. data += '</div_end></div_end></div_end>'
  255. elif middle_list[middle_number] == 'pre':
  256. data += '</code></pre>'
  257. else:
  258. data += '</' + middle_list[middle_number] + '>'
  259. del(middle_list[middle_number])
  260. num = 0
  261. while 1:
  262. nowiki_data = re.search('<code>((?:(?:(?!<\/code>).)*\n*)*)<\/code>', data)
  263. if nowiki_data:
  264. nowiki_data = nowiki_data.groups()
  265. num += 1
  266. end_data += [['nowiki_' + str(num), nowiki_data[0], 'code']]
  267. data = re.sub('<code>((?:(?:(?!<\/code>).)*\n*)*)<\/code>', '<span id="nowiki_' + str(num) + '"></span>', data, 1)
  268. else:
  269. break
  270. num = 0
  271. while 1:
  272. syntax_data = re.search('<code class="((?:(?!").)+)">((?:(?:(?:(?!<\/code>|<span id="syntax_)).)+\n*)+)<\/code>', data)
  273. if syntax_data:
  274. syntax_data = syntax_data.groups()
  275. num += 1
  276. end_data += [['syntax_' + str(num), syntax_data[1], 'normal']]
  277. data = re.sub('<code class="((?:(?!").)+)">((?:(?:(?:(?!<\/code>|<span id="syntax_)).)+\n*)+)<\/code>', '<code class="' + syntax_data[0] + '"><span id="syntax_' + str(num) + '"></span></code>', data, 1)
  278. else:
  279. break
  280. return [data, [fol_num, syntax_num, folding_num]]
  281. def link_fix(main_link):
  282. if re.search('^:', main_link):
  283. main_link = re.sub('^:', '', main_link)
  284. main_link = re.sub('^사용자:', 'user:', main_link)
  285. main_link = re.sub('^파일:', 'file:', main_link)
  286. main_link = re.sub('^분류:', 'category:', main_link)
  287. other_link = re.search('(#.+)$', main_link)
  288. if other_link:
  289. other_link = other_link.groups()[0]
  290. main_link = re.sub('(#.+)$', '', main_link)
  291. else:
  292. other_link = ''
  293. return [main_link, other_link]
  294. def namu(conn, data, title, main_num):
  295. curs = conn.cursor()
  296. global plus_data
  297. global end_data
  298. data = '\n' + data + '\n'
  299. plus_data = ''
  300. backlink = []
  301. end_data = []
  302. data = re.sub('<math>(?P<in>(?:(?!<\/math>).)+)<\/math>', '[math(\g<in>)]', data)
  303. data = html.escape(data)
  304. data = re.sub('\r\n', '\n', data)
  305. t_data = middle_parser(data, 0, 0, 0)
  306. data = t_data[0]
  307. include_re = re.compile('\[include\(((?:(?!\)\]).)+)\)\]', re.I)
  308. while 1:
  309. include = include_re.search(data)
  310. if include:
  311. include = include.groups()[0]
  312. include_data = re.search('^((?:(?!,).)+)', include)
  313. if include_data:
  314. include_data = include_data.groups()[0]
  315. else:
  316. include_data = 'Test'
  317. include_link = include_data
  318. backlink += [[title, include_link, 'include']]
  319. include = re.sub('^((?:(?!,).)+)', '', include)
  320. num = 0
  321. while 1:
  322. include_one_nowiki = re.search('(?:\\\\){2}(.)', include)
  323. if include_one_nowiki:
  324. include_one_nowiki = include_one_nowiki.groups()
  325. num += 1
  326. end_data += [['include_one_nowiki_' + str(num), include_one_nowiki[0], 'normal']]
  327. include = re.sub('(?:\\\\){2}(.)', '<span id="include_one_nowiki_' + str(num) + '"></span>', include, 1)
  328. else:
  329. break
  330. curs.execute("select data from data where title = ?", [include_data])
  331. include_data = curs.fetchall()
  332. if include_data:
  333. include_parser = include_re.sub('', include_data[0][0])
  334. include_parser = html.escape(include_parser)
  335. while 1:
  336. include_plus = re.search(', ?((?:(?!=).)+)=((?:(?!,).)+)', include)
  337. if include_plus:
  338. include_plus = include_plus.groups()
  339. include_parser = include_parser.replace('@' + include_plus[0] + '@', include_plus[1])
  340. include = re.sub(', ?((?:(?!=).)+)=((?:(?!,).)+)', '', include, 1)
  341. else:
  342. break
  343. include_parser = re.sub('\[\[(?:category|분류):(((?!\]\]|#include).)+)\]\]', '', include_parser)
  344. data = include_re.sub('<include>\n<a id="include_link" href="/w/' + tool.url_pas(include_link) + '">[' + include_link + ']</a>\n' + include_parser + '\n</include>', data, 1)
  345. else:
  346. data = include_re.sub('<a id="not_thing" href="/w/' + tool.url_pas(include_link) + '">' + include_link + '</a>', data, 1)
  347. else:
  348. break
  349. data = re.sub('\r\n', '\n', data)
  350. t_data = middle_parser(data, t_data[1][0], t_data[1][1], t_data[1][2])
  351. data = t_data[0]
  352. data = re.sub('&amp;', '&', data)
  353. data = re.sub('\n( +)\|\|', '\n||', data)
  354. data = re.sub('\|\|( +)\n', '|| \n', data)
  355. data = re.sub('\n##(((?!\n).)+)', '', data)
  356. while 1:
  357. wiki_table_data = re.search('<div id="wiki_div" ((?:(?!>).)+)>((?:(?!<div id="wiki_div"|<\/div_end>).\n*)+)<\/div_end>', data)
  358. if wiki_table_data:
  359. wiki_table_data = wiki_table_data.groups()
  360. if re.search('\|\|', wiki_table_data[1]):
  361. end_parser = re.sub('\n$', '', re.sub('^\n', '', table_start('\n' + wiki_table_data[1] + '\n')))
  362. else:
  363. end_parser = wiki_table_data[1]
  364. data = re.sub('<div id="wiki_div" ((?:(?!>).)+)>((?:(?!<div id="wiki_div"|<\/div_end>).\n*)+)<\/div_end>', '<div ' + wiki_table_data[0] + '>' + end_parser + '</div>', data, 1)
  365. else:
  366. break
  367. data = re.sub('<\/div_end>', '</div>', data)
  368. data = re.sub('<\/td>', '</td_end>', data)
  369. first = 0
  370. math_re = re.compile('\[math\(((?:(?!\)\]).)+)\)\]', re.I)
  371. while 1:
  372. math = math_re.search(data)
  373. if math:
  374. math = math.groups()[0]
  375. first += 1
  376. data = math_re.sub('<span id="math_' + str(first) + '"></span>', data, 1)
  377. plus_data += '''
  378. <script>
  379. katex.render(
  380. "''' + math.replace('\\', '\\\\').replace('&lt;', '<').replace('&gt;', '>') + '''",
  381. document.getElementById("math_''' + str(first) + '''")
  382. );
  383. </script>
  384. '''
  385. else:
  386. break
  387. num = 0
  388. while 1:
  389. one_nowiki = re.search('(?:\\\\)(.)', data)
  390. if one_nowiki:
  391. one_nowiki = one_nowiki.groups()
  392. num += 1
  393. end_data += [['one_nowiki_' + str(num), one_nowiki[0], 'normal']]
  394. data = re.sub('(?:\\\\)(.)', '<span id="one_nowiki_' + str(num) + '"></span>', data, 1)
  395. else:
  396. break
  397. while 1:
  398. hr = re.search('\n-{4,9}\n', data)
  399. if hr:
  400. data = re.sub('\n-{4,9}\n', '\n<hr>\n', data, 1)
  401. else:
  402. break
  403. data += '\n'
  404. data = data.replace('\\', '&#92;')
  405. data = re.sub('&#x27;&#x27;&#x27;(?P<in>((?!&#x27;&#x27;&#x27;).)+)&#x27;&#x27;&#x27;', '<b>\g<in></b>', data)
  406. data = re.sub('&#x27;&#x27;(?P<in>((?!&#x27;&#x27;).)+)&#x27;&#x27;', '<i>\g<in></i>', data)
  407. data = re.sub('~~(?P<in>(?:(?!~~).)+)~~', '<s>\g<in></s>', data)
  408. data = re.sub('--(?P<in>(?:(?!--).)+)--', '<s>\g<in></s>', data)
  409. data = re.sub('__(?P<in>(?:(?!__).)+)__', '<u>\g<in></u>', data)
  410. data = re.sub('\^\^(?P<in>(?:(?!\^\^).)+)\^\^', '<sup>\g<in></sup>', data)
  411. data = re.sub(',,(?P<in>(?:(?!,,).)+),,', '<sub>\g<in></sub>', data)
  412. redirect_re = re.compile('\n#(?:redirect|넘겨주기) ((?:(?!\n).)+)\n', re.I)
  413. redirect = redirect_re.search(data)
  414. if redirect:
  415. redirect = redirect.groups()[0]
  416. return_link = link_fix(redirect)
  417. main_link = return_link[0]
  418. other_link = return_link[1]
  419. backlink += [[title, main_link, 'redirect']]
  420. data = redirect_re.sub('\n * ' + title + ' - [[' + main_link + ']]\n', data, 1)
  421. no_toc_re = re.compile('\[(?:목차|toc)\((?:no)\)\]\n', re.I)
  422. toc_re = re.compile('\[(?:목차|toc)\]', re.I)
  423. if not no_toc_re.search(data):
  424. if not toc_re.search(data):
  425. data = re.sub('\n(?P<in>={1,6}) ?(?P<out>(?:(?!=).)+) ?={1,6}\n', '\n[toc]\n\g<in> \g<out> \g<in>\n', data, 1)
  426. else:
  427. data = no_toc_re.sub('', data)
  428. toc_full = 0
  429. toc_top_stack = 6
  430. toc_stack = [0, 0, 0, 0, 0, 0]
  431. edit_number = 0
  432. toc_data = '<div id="toc"><span id="toc_title">TOC</span>\n\n'
  433. while 1:
  434. toc = re.search('\n(={1,6}) ?((?:(?!\n).)+) ?\n', data)
  435. if toc:
  436. toc = toc.groups()
  437. toc_number = len(toc[0])
  438. edit_number += 1
  439. if toc_full > toc_number:
  440. for i in range(toc_number, 6):
  441. toc_stack[i] = 0
  442. if toc_top_stack > toc_number:
  443. toc_top_stack = toc_number
  444. toc_full = toc_number
  445. toc_stack[toc_number - 1] += 1
  446. toc_number = str(toc_number)
  447. all_stack = ''
  448. for i in range(0, 6):
  449. all_stack += str(toc_stack[i]) + '.'
  450. while 1:
  451. if re.search('[^0-9]0\.', all_stack):
  452. all_stack = re.sub('[^0-9]0\.', '.', all_stack)
  453. else:
  454. break
  455. all_stack = re.sub('^0\.', '', all_stack)
  456. data = re.sub('\n(={1,6}) ?((?:(?!\n).)+) ?\n', '\n<h' + toc_number + ' id="s-' + re.sub('\.$', '', all_stack) + '"><a href="#toc">' + all_stack + '</a> ' + re.sub('=*$', '', toc[1]) + ' <span style="font-size: 12px"><a href="/edit/' + tool.url_pas(title) + '?section=' + str(edit_number) + '">(Edit)</a></span></h' + toc_number + '>\n', data, 1)
  457. toc_main_data = toc[1]
  458. toc_main_data = re.sub('=*$', '', toc_main_data)
  459. toc_main_data = re.sub('\[\*((?:(?! |\]).)*)(?: ((?:(?!(\[\*(?:(?:(?!\]).)+)\]|\])).)+))?\]', '', toc_main_data)
  460. toc_main_data = re.sub('<span id="math_[0-9]"><\/span>', '(수식)', toc_main_data)
  461. toc_data += '<span style="margin-left: ' + str((toc_full - toc_top_stack) * 10) + 'px;"><a href="#s-' + re.sub('\.$', '', all_stack) + '">' + all_stack + '</a> ' + toc_main_data + '</span>\n'
  462. else:
  463. break
  464. toc_data += '</div>'
  465. data = toc_re.sub(toc_data, data)
  466. data = tool.savemark(data)
  467. anchor_re = re.compile("\[anchor\((?P<in>(?:(?!\)\]).)+)\)\]", re.I)
  468. data = anchor_re.sub('<span id="\g<in>"></span>', data)
  469. ruby_re = re.compile("\[ruby\((?P<in>(?:(?!,).)+)\, ?ruby=(?P<out>(?:(?!\)\]|,).)+)(?:\, ?color=(?P<under>(?:(?!\)\]).)+))?\)\]", re.I)
  470. data = ruby_re.sub('<ruby>\g<in><rp>(</rp><rt style="color: \g<under>">\g<out></rt><rp>)</rp></ruby>', data)
  471. now_time = tool.get_time()
  472. date_re = re.compile('\[date\]', re.I)
  473. data = date_re.sub(now_time, data)
  474. time_data = re.search('^([0-9]{4}-[0-9]{2}-[0-9]{2})', now_time)
  475. time = time_data.groups()
  476. age_re = re.compile('\[age\(([0-9]{4}-[0-9]{2}-[0-9]{2})\)\]', re.I)
  477. while 1:
  478. age_data = age_re.search(data)
  479. if age_data:
  480. age = age_data.groups()[0]
  481. old = datetime.datetime.strptime(time[0], '%Y-%m-%d')
  482. will = datetime.datetime.strptime(age, '%Y-%m-%d')
  483. e_data = old - will
  484. data = age_re.sub(str(int(e_data.days / 365)), data, 1)
  485. else:
  486. break
  487. dday_re = re.compile('\[dday\(([0-9]{4}-[0-9]{2}-[0-9]{2})\)\]', re.I)
  488. while 1:
  489. dday_data = dday_re.search(data)
  490. if dday_data:
  491. dday = dday_data.groups()[0]
  492. old = datetime.datetime.strptime(time[0], '%Y-%m-%d')
  493. will = datetime.datetime.strptime(dday, '%Y-%m-%d')
  494. e_data = old - will
  495. if re.search('^-', str(e_data.days)):
  496. e_day = str(e_data.days)
  497. else:
  498. e_day = '+' + str(e_data.days)
  499. data = dday_re.sub(e_day, data, 1)
  500. else:
  501. break
  502. video_re = re.compile('\[(youtube|kakaotv|nicovideo)\(((?:(?!\)\]).)+)\)\]', re.I)
  503. youtube_re = re.compile('youtube', re.I)
  504. kakaotv_re = re.compile('kakaotv', re.I)
  505. while 1:
  506. video = video_re.search(data)
  507. if video:
  508. video = video.groups()
  509. width = re.search(', ?width=((?:(?!,).)+)', video[1])
  510. if width:
  511. video_width = width.groups()[0]
  512. else:
  513. video_width = '560'
  514. height = re.search(', ?height=((?:(?!,).)+)', video[1])
  515. if height:
  516. video_height = height.groups()[0]
  517. else:
  518. video_height = '315'
  519. code = re.search('^((?:(?!,).)+)', video[1])
  520. if code:
  521. video_code = code.groups()[0]
  522. else:
  523. video_code = ''
  524. if youtube_re.search(video[0]):
  525. video_code = re.sub('^https:\/\/www\.youtube\.com\/watch\?v=', '', video_code)
  526. video_code = re.sub('^https:\/\/youtu\.be\/', '', video_code)
  527. video_src = 'https://www.youtube.com/embed/' + video_code
  528. elif kakaotv_re.search(video[0]):
  529. video_code = re.sub('^https:\/\/tv\.kakao\.com\/channel\/9262\/cliplink\/', '', video_code)
  530. video_code = re.sub('^http:\/\/tv\.kakao\.com\/v\/', '', video_code)
  531. video_src = 'https://tv.kakao.com/embed/player/cliplink/' + video_code +'?service=kakao_tv'
  532. else:
  533. video_src = 'https://embed.nicovideo.jp/watch/' + video_code
  534. data = video_re.sub('<iframe width="' + video_width + '" height="' + video_height + '" src="' + video_src + '" allowfullscreen frameborder="0"></iframe>', data, 1)
  535. else:
  536. break
  537. while 1:
  538. block = re.search('(\n(?:&gt; ?(?:(?:(?!\n).)+)?\n)+)', data)
  539. if block:
  540. block = block.groups()[0]
  541. block = re.sub('^\n&gt; ?', '', block)
  542. block = re.sub('\n&gt; ?', '\n', block)
  543. block = re.sub('\n$', '', block)
  544. data = re.sub('(\n(?:&gt; ?(?:(?:(?!\n).)+)?\n)+)', '\n<blockquote>' + block + '</blockquote>\n', data, 1)
  545. else:
  546. break
  547. data = re.sub('(?P<in>\n +\* ?(?:(?:(?!\|\|).)+))\|\|', '\g<in>\n ||', data)
  548. while 1:
  549. li = re.search('(\n(?:(?: *)\* ?(?:(?:(?!\n).)+)\n)+)', data)
  550. if li:
  551. li = li.groups()[0]
  552. while 1:
  553. sub_li = re.search('\n(?:( *)\* ?((?:(?!\n).)+))', li)
  554. if sub_li:
  555. sub_li = sub_li.groups()
  556. if len(sub_li[0]) == 0:
  557. margin = 20
  558. else:
  559. margin = len(sub_li[0]) * 20
  560. li = re.sub('\n(?:( *)\* ?((?:(?!\n).)+))', '<li style="margin-left: ' + str(margin) + 'px;">' + sub_li[1] + '</li>', li, 1)
  561. else:
  562. break
  563. data = re.sub('(\n(?:(?: *)\* ?(?:(?:(?!\n).)+)\n)+)', '\n\n<ul>' + li + '</ul>\n', data, 1)
  564. else:
  565. break
  566. data = re.sub('<\/ul>\n \|\|', '</ul>||', data)
  567. while 1:
  568. indent = re.search('\n( +)', data)
  569. if indent:
  570. indent = len(indent.groups()[0])
  571. margin = '<span style="margin-left: 20px;"></span>' * indent
  572. data = re.sub('\n( +)', '\n' + margin, data, 1)
  573. else:
  574. break
  575. data = table_start(data)
  576. category = '\n<div id="cate_all"><hr><div id="cate">Category : '
  577. category_re = re.compile('^(?:category|분류):', re.I)
  578. while 1:
  579. link = re.search('\[\[((?:(?!\[\[|\]\]).)+)\]\]', data)
  580. if link:
  581. link = link.groups()[0]
  582. link_split = re.search('((?:(?!\|).)+)(?:\|((?:(?!\|).)+))', link)
  583. if link_split:
  584. link_split = link_split.groups()
  585. main_link = link_split[0]
  586. see_link = link_split[1]
  587. else:
  588. main_link = link
  589. see_link = link
  590. if re.search('^((?:file|파일)|(?:out|외부)):', main_link):
  591. file_style = ''
  592. width = re.search('width=((?:(?!&).)+)', see_link)
  593. if width:
  594. file_width = width.groups()[0]
  595. if re.search('px$', file_width):
  596. file_style += 'width: ' + file_width + ';'
  597. else:
  598. file_style += 'width: ' + file_width + 'px;'
  599. height = re.search('height=((?:(?!&).)+)', see_link)
  600. if height:
  601. file_height = height.groups()[0]
  602. if re.search('px$', file_height):
  603. file_style += 'height: ' + file_height + ';'
  604. else:
  605. file_style += 'height: ' + file_height + 'px;'
  606. align = re.search('align=((?:(?!&).)+)', see_link)
  607. if align:
  608. file_align = align.groups()[0]
  609. if file_align == 'center':
  610. file_align = 'display: block; text-align: center;'
  611. else:
  612. file_align = 'float: ' + file_align + ';'
  613. else:
  614. file_align = ''
  615. if re.search('^(?:out|외부):', main_link):
  616. file_src = re.sub('^(?:out|외부):', '', main_link)
  617. file_alt = main_link
  618. exist = 'Yes'
  619. else:
  620. file_data = re.search('^(?:file|파일):((?:(?!\.).)+)\.(.+)$', main_link)
  621. if file_data:
  622. file_data = file_data.groups()
  623. file_name = file_data[0]
  624. file_end = file_data[1]
  625. backlink += [[title, main_link, 'file']]
  626. else:
  627. file_name = 'TEST'
  628. file_end = 'jpg'
  629. file_src = '/image/' + tool.sha224(file_name) + '.' + file_end
  630. file_alt = 'file:' + file_name + '.' + file_end
  631. curs.execute("select title from data where title = ?", [file_alt])
  632. exist = curs.fetchall()
  633. if exist:
  634. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<span style="' + file_align + '"><img style="' + file_style + '" alt="' + file_alt + '" src="' + file_src + '"></span>', data, 1)
  635. else:
  636. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="not_thing" href="/w/' + tool.url_pas(file_alt) + '">' + file_alt + '</a>', data, 1)
  637. elif category_re.search(main_link):
  638. see_link = re.sub('#include', '', see_link)
  639. main_link = re.sub('#include', '', category_re.sub('category:', main_link))
  640. if re.search('#blur', main_link):
  641. see_link = 'Hidden'
  642. link_id = 'id="inside"'
  643. main_link = re.sub('#blur', '', main_link)
  644. else:
  645. link_id = ''
  646. backlink += [[title, main_link, 'cat']]
  647. category += '<a ' + link_id + ' href="' + tool.url_pas(main_link) + '">' + category_re.sub('', see_link) + '</a> | '
  648. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '', data, 1)
  649. elif re.search('^wiki:', main_link):
  650. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="inside" href="/' + tool.url_pas(re.sub('^wiki:', '', main_link)) + '">' + see_link + '</a>', data, 1)
  651. elif re.search('^inter:((?:(?!:).)+):', main_link):
  652. inter_data = re.search('^inter:((?:(?!:).)+):((?:(?!\]\]|\|).)+)', main_link)
  653. inter_data = inter_data.groups()
  654. curs.execute('select link from inter where title = ?', [inter_data[0]])
  655. inter = curs.fetchall()
  656. if inter:
  657. if see_link != main_link:
  658. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="inside" href="' + inter[0][0] + inter_data[1] + '">' + inter_data[0] + ':' + see_link + '</a>', data, 1)
  659. else:
  660. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="inside" href="' + inter[0][0] + inter_data[1] + '">' + inter_data[0] + ':' + inter_data[1] + '</a>', data, 1)
  661. else:
  662. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', 'Not exist', data, 1)
  663. elif re.search('^\/', main_link):
  664. under_title = re.search('^(\/(?:.+))$', main_link)
  665. under_title = under_title.groups()[0]
  666. if see_link != main_link:
  667. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '[[' + title + under_title + '|' + see_link + ']]', data, 1)
  668. else:
  669. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '[[' + title + under_title + ']]', data, 1)
  670. elif re.search('^http(s)?:\/\/', main_link):
  671. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="out_link" rel="nofollow" href="' + main_link + '">' + see_link + '</a>', data, 1)
  672. else:
  673. return_link = link_fix(main_link)
  674. main_link = return_link[0]
  675. other_link = return_link[1]
  676. if re.search('^\/', main_link):
  677. main_link = re.sub('^\/', title + '/', main_link)
  678. elif re.search('\.\.\/\/', main_link):
  679. main_link = re.sub('\.\.\/\/', '/', main_link)
  680. elif re.search('^\.\.\/', main_link):
  681. main_link = re.sub('^\.\.\/', re.sub('(?P<in>.+)\/.*$', '\g<in>', title), main_link)
  682. if not re.search('^\|', main_link):
  683. if main_link != title:
  684. if main_link != '':
  685. curs.execute("select title from data where title = ?", [main_link])
  686. if not curs.fetchall():
  687. link_id = 'id="not_thing"'
  688. backlink += [[title, main_link, 'no']]
  689. else:
  690. link_id = ''
  691. backlink += [[title, main_link, '']]
  692. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a ' + link_id + ' href="/w/' + tool.url_pas(main_link) + other_link + '">' + see_link + '</a>', data, 1)
  693. else:
  694. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a href="' + other_link + '">' + see_link + '</a>', data, 1)
  695. else:
  696. if re.search('^#', other_link):
  697. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a href="' + other_link + '">' + other_link + '</a>', data, 1)
  698. else:
  699. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<b>' + see_link + '</b>', data, 1)
  700. else:
  701. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '&#91;&#91;' + link + '&#93;&#93;', data, 1)
  702. else:
  703. break
  704. br_re = re.compile('\[br\]', re.I)
  705. data = br_re.sub('<br>', data)
  706. footnote_number = 0
  707. footnote_all = []
  708. footnote_dict = {}
  709. footnote_re = {}
  710. footdata_all = '\n<hr><ul id="footnote_data">'
  711. re_footnote = re.compile('(?:\[\*((?:(?! |\]).)*)(?: ((?:(?!(?:\[\*|\])).)+))?\]|(\[(?:각주|footnote)\]))')
  712. while 1:
  713. footnote = re_footnote.search(data)
  714. if footnote:
  715. footnote_data = footnote.groups()
  716. if footnote_data[2]:
  717. footnote_all.sort()
  718. for footdata in footnote_all:
  719. if footdata[2] == 0:
  720. footdata_in = ''
  721. else:
  722. footdata_in = footdata[2]
  723. footdata_all += '<li><a href="#rfn-' + str(footdata[0]) + '">(' + footdata[1] + ')</a> <span id="fn-' + str(footdata[0]) + '">' + footdata_in + '</span></li>'
  724. data = re_footnote.sub(footdata_all + '</ul>', data, 1)
  725. footnote_all = []
  726. footdata_all = '\n<hr><ul id="footnote_data">'
  727. else:
  728. footnote = footnote_data[1]
  729. footnote_name = footnote_data[0]
  730. if footnote_name and not footnote:
  731. if footnote_name in footnote_dict:
  732. footnote_re[footnote_name] += 1
  733. foot_plus_num = str(footnote_re[footnote_name])
  734. footshort = footnote_dict[footnote_name] + '.' + foot_plus_num
  735. footnote_all += [[float(footshort), footshort, 0]]
  736. data = re_footnote.sub('<sup><a href="javascript:open_foot(\'fn-' + footshort + '\')" id="rfn-' + footshort + '">(' + footnote_name + ')</a></sup><span class="foot_plus" id="cfn-' + footshort + '"></span>', data, 1)
  737. else:
  738. data = re_footnote.sub('<sup><a href="#">(' + footnote_name + ')</a></sup>', data, 1)
  739. else:
  740. footnote_number += 1
  741. if not footnote_name:
  742. footnote_name = str(footnote_number)
  743. footnote_dict.update({ footnote_name : str(footnote_number) })
  744. if not footnote_name in footnote_re:
  745. footnote_re.update({ footnote_name : 0 })
  746. else:
  747. footnote_re[footnote_name] += 1
  748. footnote_all += [[footnote_number, footnote_name, footnote]]
  749. data = re_footnote.sub('<sup><a href="javascript:open_foot(\'fn-' + str(footnote_number) + '\')" id="rfn-' + str(footnote_number) + '">(' + footnote_name + ')</a></sup><span class="foot_plus" id="cfn-' + str(footnote_number) + '"></span>', data, 1)
  750. else:
  751. break
  752. data = re.sub('\n+$', '', data)
  753. footnote_all.sort()
  754. for footdata in footnote_all:
  755. if footdata[2] == 0:
  756. footdata_in = ''
  757. else:
  758. footdata_in = footdata[2]
  759. footdata_all += '<li><a href="#rfn-' + str(footdata[0]) + '">(' + footdata[1] + ')</a> <span id="fn-' + str(footdata[0]) + '">' + footdata_in + '</span></li>'
  760. footdata_all += '</ul>'
  761. if footdata_all == '\n<hr><ul id="footnote_data"></ul>':
  762. footdata_all = ''
  763. data = re.sub('\n$', footdata_all, data + '\n', 1)
  764. category += '</div></div>'
  765. if category == '\n<div id="cate_all"><hr><div id="cate">Category : </div></div>':
  766. category = ''
  767. data += category
  768. i = 0
  769. while 1:
  770. try:
  771. _ = end_data[i][0]
  772. except:
  773. break
  774. if end_data[i][2] == 'normal':
  775. data = data.replace('<span id="' + end_data[i][0] + '"></span>', end_data[i][1])
  776. data = data.replace(tool.url_pas('<span id="' + end_data[i][0] + '"></span>'), tool.url_pas(end_data[i][1]))
  777. else:
  778. if re.search('\n', end_data[i][1]):
  779. data = data.replace('<span id="' + end_data[i][0] + '"></span>', '\n<pre>' + re.sub('^\n', '', end_data[i][1]) + '</pre>')
  780. else:
  781. data = data.replace('<span id="' + end_data[i][0] + '"></span>', '<code>' + end_data[i][1] + '</code>')
  782. i += 1
  783. if main_num == 1:
  784. i = 0
  785. while 1:
  786. try:
  787. _ = backlink[i][0]
  788. except:
  789. break
  790. find_data = re.search('<span id="(one_nowiki_[0-9]+)">', backlink[i][1])
  791. if find_data:
  792. j = 0
  793. find_data = find_data.groups()[0]
  794. while 1:
  795. try:
  796. _ = end_data[j][0]
  797. except:
  798. break
  799. if end_data[j][0] == find_data:
  800. backlink[i][1] = backlink[i][1].replace('<span id="' + end_data[j][0] + '"></span>', end_data[j][1])
  801. j += 1
  802. i += 1
  803. data = re.sub('<\/td_end>', '</td>', data)
  804. data = re.sub('<include>\n', '', data)
  805. data = re.sub('\n<\/include>', '', data)
  806. data = re.sub('(?P<in><\/h[0-9]>)(\n)+', '\g<in>', data)
  807. data = re.sub('\n\n<ul>', '\n<ul>', data)
  808. data = re.sub('<\/ul>\n\n', '</ul>', data)
  809. data = re.sub('^(\n)+', '', data)
  810. data = re.sub('(\n)+<hr><ul id="footnote_data">', '<hr><ul id="footnote_data">', data)
  811. data = re.sub('(?P<in><td(((?!>).)*)>)\n', '\g<in>', data)
  812. data = re.sub('(\n)?<hr>(\n)?', '<hr>', data)
  813. data = re.sub('<\/ul>\n\n<ul>', '</ul>\n<ul>', data)
  814. data = re.sub('\n', '<br>', data)
  815. return [data, plus_data, backlink]