namu.py 44 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026
  1. from . import tool
  2. import datetime
  3. import html
  4. import re
  5. def table_parser(data, cel_data, start_data, num = 0):
  6. table_class = 'class="'
  7. all_table = 'style="'
  8. cel_style = 'style="'
  9. row_style = 'style="'
  10. row = ''
  11. cel = ''
  12. table_width = re.search("<table ?width=((?:(?!>).)*)>", data)
  13. if table_width:
  14. if re.search('^[0-9]+$', table_width.groups()[0]):
  15. all_table += 'width: ' + table_width.groups()[0] + 'px;'
  16. else:
  17. all_table += 'width: ' + table_width.groups()[0] + ';'
  18. table_height = re.search("<table ?height=((?:(?!>).)*)>", data)
  19. if table_height:
  20. if re.search('^[0-9]+$', table_height.groups()[0]):
  21. all_table += 'height: ' + table_height.groups()[0] + 'px;'
  22. else:
  23. all_table += 'height: ' + table_height.groups()[0] + ';'
  24. table_align = re.search("<table ?align=((?:(?!>).)*)>", data)
  25. if table_align:
  26. if table_align.groups()[0] == 'right':
  27. all_table += 'float: right;'
  28. elif table_align.groups()[0] == 'center':
  29. all_table += 'margin: auto;'
  30. table_text_align = re.search("<table ?textalign=((?:(?!>).)*)>", data)
  31. if table_text_align:
  32. num = 1
  33. if table_text_align.groups()[0] == 'right':
  34. all_table += 'text-align: right;'
  35. elif table_text_align.groups()[0] == 'center':
  36. all_table += 'text-align: center;'
  37. row_table_align = re.search("<row ?textalign=((?:(?!>).)*)>", data)
  38. if row_table_align:
  39. if row_table_align.groups()[0] == 'right':
  40. row_style += 'text-align: right;'
  41. elif row_table_align.groups()[0] == 'center':
  42. row_style += 'text-align: center;'
  43. else:
  44. row_style += 'text-align: left;'
  45. table_cel = re.search("<-((?:(?!>).)*)>", data)
  46. if table_cel:
  47. cel = 'colspan="' + table_cel.groups()[0] + '"'
  48. else:
  49. cel = 'colspan="' + str(round(len(start_data) / 2)) + '"'
  50. table_row = re.search("<\|((?:(?!>).)*)>", data)
  51. if table_row:
  52. row = 'rowspan="' + table_row.groups()[0] + '"'
  53. row_bgcolor = re.search("<rowbgcolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  54. if row_bgcolor:
  55. row_style += 'background: ' + row_bgcolor.groups()[0] + ';'
  56. table_border = re.search("<table ?bordercolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  57. if table_border:
  58. all_table += 'border: ' + table_border.groups()[0] + ' 2px solid;'
  59. table_bgcolor = re.search("<table ?bgcolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  60. if table_bgcolor:
  61. all_table += 'background: ' + table_bgcolor.groups()[0] + ';'
  62. bgcolor = re.search("<bgcolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  63. if bgcolor:
  64. cel_style += 'background: ' + bgcolor.groups()[0] + ';'
  65. cel_width = re.search("<width=((?:(?!>).)*)>", data)
  66. if cel_width:
  67. cel_style += 'width: ' + cel_width.groups()[0] + 'px;'
  68. cel_height = re.search("<height=((?:(?!>).)*)>", data)
  69. if cel_height:
  70. cel_style += 'height: ' + cel_height.groups()[0] + 'px;'
  71. text_right = re.search("<\)>", data)
  72. text_center = re.search("<:>", data)
  73. text_left = re.search("<\(>", data)
  74. if text_right:
  75. cel_style += 'text-align: right;'
  76. elif text_center:
  77. cel_style += 'text-align: center;'
  78. elif text_left:
  79. cel_style += 'text-align: left;'
  80. elif num == 0:
  81. if re.search('^ ', cel_data) and re.search(' $', cel_data):
  82. cel_style += 'text-align: center;'
  83. elif re.search('^ ', cel_data):
  84. cel_style += 'text-align: right;'
  85. elif re.search(' $', cel_data):
  86. cel_style += 'text-align: left;'
  87. text_class = re.search("<table ?class=((?:(?!>).)+)>", data)
  88. if text_class:
  89. table_class += text_class.groups()[0]
  90. all_table += '"'
  91. cel_style += '"'
  92. row_style += '"'
  93. table_class += '"'
  94. return [all_table, row_style, cel_style, row, cel, table_class, num]
  95. def table_start(data):
  96. while 1:
  97. table = re.search('\n((?:(?:(?:(?:\|\|)+(?:(?:(?!\|\|).(?:\n)*)*))+)\|\|(?:\n)?)+)', data)
  98. if table:
  99. table = table.groups()[0]
  100. while 1:
  101. all_table = re.search('^((?:\|\|)+)((?:<(?:(?:(?!>).)+)>)*)\n*((?:(?!\|\|).\n*)*)', table)
  102. if all_table:
  103. all_table = all_table.groups()
  104. return_table = table_parser(all_table[1], all_table[2], all_table[0])
  105. number = return_table[6]
  106. table = re.sub('^((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*', '\n<table ' + return_table[5] + ' ' + return_table[0] + '><tbody><tr ' + return_table[1] + '><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  107. else:
  108. break
  109. table = re.sub('\|\|\n?$', '</td></tr></tbody></table>', table)
  110. while 1:
  111. row_table = re.search('\|\|\n((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*((?:(?!\|\||<\/td>).\n*)*)', table)
  112. if row_table:
  113. row_table = row_table.groups()
  114. return_table = table_parser(row_table[1], row_table[2], row_table[0], number)
  115. table = re.sub('\|\|\n((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*', '</td></tr><tr ' + return_table[1] + '><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  116. else:
  117. break
  118. while 1:
  119. cel_table = re.search('((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*((?:(?:(?!\|\||<\/td>).)|\n)*\n*)', table)
  120. if cel_table:
  121. cel_table = cel_table.groups()
  122. return_table = table_parser(cel_table[1], re.sub('\n', ' ', cel_table[2]), cel_table[0], number)
  123. table = re.sub('((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*', '</td><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  124. else:
  125. break
  126. data = re.sub('\n((?:(?:(?:(?:\|\|)+(?:(?:(?!\|\|).(?:\n)*)*))+)\|\|(?:\n)?)+)', table, data, 1)
  127. else:
  128. break
  129. return data
  130. def middle_parser(data, fol_num, syntax_num, folding_num):
  131. global end_data
  132. global plus_data
  133. middle_stack = 0
  134. middle_list = []
  135. middle_number = 0
  136. middle_re = '(?:{{{((?:(?! |{{{|}}}|&lt;).)*) ?|(}}}))'
  137. while 1:
  138. middle_data = middle_re.search(data)
  139. if middle_data:
  140. middle_data = middle_data.groups()
  141. if not middle_data[1]:
  142. if middle_stack > 0:
  143. middle_stack += 1
  144. data = middle_re.sub('(?:{{{((?:(?! |{{{|}}}|&lt;).)*)(?P<in> ?)|(}}}))', '&#123;&#123;&#123;' + middle_data[0] + '\g<in>', data, 1)
  145. else:
  146. if re.search('^(#|@|\+|\-)', middle_data[0]) and not re.search('^(#|@|\+|\-){2}', middle_data[0]):
  147. middle_search = re.search('^(#(?:[0-9a-f-A-F]{3}){1,2})', middle_data[0])
  148. if middle_search:
  149. middle_list += ['span']
  150. data = middle_re.sub('<span style="color: ' + middle_search.groups()[0] + ';">', data, 1)
  151. else:
  152. middle_search = re.search('^(?:#(\w+))', middle_data[0])
  153. if middle_search:
  154. middle_list += ['span']
  155. data = middle_re.sub('<span style="color: ' + middle_search.groups()[0] + ';">', data, 1)
  156. else:
  157. middle_search = re.search('^(?:@((?:[0-9a-f-A-F]{3}){1,2}))', middle_data[0])
  158. if middle_search:
  159. middle_list += ['span']
  160. data = middle_re.sub('<span style="background: #' + middle_search.groups()[0] + ';">', data, 1)
  161. else:
  162. middle_search = re.search('^(?:@(\w+))', middle_data[0])
  163. if middle_search:
  164. middle_list += ['span']
  165. data = middle_re.sub('<span style="background: ' + middle_search.groups()[0] + ';">', data, 1)
  166. else:
  167. middle_search = re.search('^(\+|-)([1-5])', middle_data[0])
  168. if middle_search:
  169. middle_search = middle_search.groups()
  170. if middle_search[0] == '+':
  171. font_size = str(int(middle_search[1]) * 20 + 100)
  172. else:
  173. font_size = str(100 - int(middle_search[1]) * 10)
  174. middle_list += ['span']
  175. data = middle_re.sub('<span style="font-size: ' + font_size + '%;">', data, 1)
  176. else:
  177. middle_search = re.search('^#!wiki', middle_data[0])
  178. if middle_search:
  179. middle_data_2 = re.search('{{{#!wiki(?: style=(?:&quot;|&#x27;)((?:(?!&quot;|&#x27;).)*)(?:&quot;|&#x27;))?\n?', data)
  180. if middle_data_2:
  181. middle_data_2 = middle_data_2.groups()
  182. else:
  183. middle_data_2 = ['']
  184. middle_list += ['div_end']
  185. data = re.sub('{{{#!wiki(?: style=(?:&quot;|&#x27;)((?:(?!&quot;|&#x27;).)*)(?:&quot;|&#x27;))?\n?', '<div id="wiki_div" style="' + str(middle_data_2[0]) + '">', data, 1)
  186. else:
  187. middle_search = re.search('^#!syntax', middle_data[0])
  188. if middle_search:
  189. middle_data_2 = re.search('{{{#!syntax ((?:(?!\n).)+)\n?', data)
  190. if middle_data_2:
  191. middle_data_2 = middle_data_2.groups()
  192. else:
  193. middle_data_2 = ['python']
  194. if syntax_num == 0:
  195. plus_data += '''
  196. <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/9.12.0/styles/default.min.css">
  197. <script src="//cdnjs.cloudflare.com/ajax/libs/highlight.js/9.12.0/highlight.min.js"></script>
  198. '''
  199. syntax_num = 1
  200. middle_list += ['pre']
  201. data = re.sub('{{{#!syntax ?((?:(?!\n).)*)\n?', '<pre id="syntax"><code class="' + middle_data_2[0] + '">', data, 1)
  202. else:
  203. middle_search = re.search('^#!folding', middle_data[0])
  204. if middle_search:
  205. middle_list += ['2div']
  206. folding_data = re.search('{{{#!folding ?((?:(?!\n).)*)\n?', data)
  207. if folding_data:
  208. folding_data = folding_data.groups()
  209. else:
  210. folding_data = ['Test']
  211. if folding_num == 0:
  212. plus_data += '<script src="/views/main_css/parser.js"></script>'
  213. folding_num = 1
  214. data = re.sub('{{{#!folding ?((?:(?!\n).)*)\n?', '<div>' + str(folding_data[0]) + ' <div style="display: inline-block;"><a href="javascript:void(0);" onclick="folding(' + str(fol_num) + ');">[do]</a></div_end><div id="folding_' + str(fol_num) + '" style="display: none;"><div id="wiki_div" style="">', data, 1)
  215. fol_num += 1
  216. else:
  217. middle_list += ['span']
  218. data = middle_re.sub('<span>', data, 1)
  219. else:
  220. middle_list += ['code']
  221. middle_stack += 1
  222. data = middle_re.sub('<code>' + middle_data[0].replace('\\', '\\\\'), data, 1)
  223. middle_number += 1
  224. else:
  225. if middle_list == []:
  226. data = middle_re.sub('&#125;&#125;&#125;', data, 1)
  227. else:
  228. if middle_stack > 0:
  229. middle_stack -= 1
  230. if middle_stack > 0:
  231. data = middle_re.sub('&#125;&#125;&#125;', data, 1)
  232. else:
  233. if middle_number > 0:
  234. middle_number -= 1
  235. if middle_list[middle_number] == '2div':
  236. data = middle_re.sub('</div_end></div_end></div_end>', data, 1)
  237. elif middle_list[middle_number] == 'pre':
  238. data = middle_re.sub('</code></pre>', data, 1)
  239. else:
  240. data = middle_re.sub('</' + middle_list[middle_number] + '>', data, 1)
  241. del(middle_list[middle_number])
  242. else:
  243. break
  244. num = 0
  245. while 1:
  246. nowiki_data = re.search('<code>((?:(?:(?!<\/code>).)*\n*)*)<\/code>', data)
  247. if nowiki_data:
  248. nowiki_data = nowiki_data.groups()
  249. num += 1
  250. end_data += [['nowiki_' + str(num), nowiki_data[0], 'code']]
  251. data = re.sub('<code>((?:(?:(?!<\/code>).)*\n*)*)<\/code>', '<span id="nowiki_' + str(num) + '"></span>', data, 1)
  252. else:
  253. break
  254. num = 0
  255. while 1:
  256. syntax_data = re.search('<code class="((?:(?!").)+)">((?:(?:(?:(?!<\/code>|<span id="syntax_)).)+\n*)+)<\/code>', data)
  257. if syntax_data:
  258. syntax_data = syntax_data.groups()
  259. num += 1
  260. end_data += [['syntax_' + str(num), syntax_data[1], 'normal']]
  261. data = re.sub('<code class="((?:(?!").)+)">((?:(?:(?:(?!<\/code>|<span id="syntax_)).)+\n*)+)<\/code>', '<code class="' + syntax_data[0] + '"><span id="syntax_' + str(num) + '"></span></code>', data, 1)
  262. else:
  263. break
  264. return [data, [fol_num, syntax_num, folding_num]]
  265. def link_fix(main_link):
  266. if re.search('^:', main_link):
  267. main_link = re.sub('^:', '', main_link)
  268. main_link = re.sub('^사용자:', 'user:', main_link)
  269. main_link = re.sub('^파일:', 'file:', main_link)
  270. main_link = re.sub('^분류:', 'category:', main_link)
  271. other_link = re.search('(#.+)$', main_link)
  272. if other_link:
  273. other_link = other_link.groups()[0]
  274. main_link = re.sub('(#.+)$', '', main_link)
  275. else:
  276. other_link = ''
  277. return [main_link, other_link]
  278. def namu(conn, data, title, main_num):
  279. curs = conn.cursor()
  280. global plus_data
  281. global end_data
  282. data = '\n' + data + '\n'
  283. plus_data = ''
  284. backlink = []
  285. end_data = []
  286. data = html.escape(data)
  287. data = re.sub('\r\n', '\n', data)
  288. t_data = middle_parser(data, 0, 0, 0)
  289. data = t_data[0]
  290. include_re = re.compile('\[include\(((?:(?!\)\]).)+)\)\]', re.I)
  291. while 1:
  292. include = include_re.search(data)
  293. if include:
  294. include = include.groups()[0]
  295. include_data = re.search('^((?:(?!,).)+)', include)
  296. if include_data:
  297. include_data = include_data.groups()[0]
  298. else:
  299. include_data = 'Test'
  300. include_link = include_data
  301. backlink += [[title, include_link, 'include']]
  302. include = re.sub('^((?:(?!,).)+)', '', include)
  303. num = 0
  304. while 1:
  305. include_one_nowiki = re.search('(?:\\\\){2}(.)', include)
  306. if include_one_nowiki:
  307. include_one_nowiki = include_one_nowiki.groups()
  308. num += 1
  309. end_data += [['include_one_nowiki_' + str(num), include_one_nowiki[0], 'normal']]
  310. include = re.sub('(?:\\\\){2}(.)', '<span id="include_one_nowiki_' + str(num) + '"></span>', include, 1)
  311. else:
  312. break
  313. curs.execute("select data from data where title = ?", [include_data])
  314. include_data = curs.fetchall()
  315. if include_data:
  316. include_parser = include_re.sub('', include_data[0][0])
  317. include_parser = html.escape(include_parser)
  318. while 1:
  319. include_plus = re.search(', ?((?:(?!=).)+)=((?:(?!,).)+)', include)
  320. if include_plus:
  321. include_plus = include_plus.groups()
  322. include_parser = include_parser.replace('@' + include_plus[0] + '@', include_plus[1])
  323. include = re.sub(', ?((?:(?!=).)+)=((?:(?!,).)+)', '', include, 1)
  324. else:
  325. break
  326. include_parser = re.sub('\[\[(?:category|분류):(((?!\]\]|#include).)+)\]\]', '', include_parser)
  327. data = include_re.sub('<include>\n<a id="include_link" href="/w/' + tool.url_pas(include_link) + '">[' + include_link + ']</a>\n' + include_parser + '\n</include>', data, 1)
  328. else:
  329. data = include_re.sub('<a id="not_thing" href="/w/' + tool.url_pas(include_link) + '">' + include_link + '</a>', data, 1)
  330. else:
  331. break
  332. data = re.sub('\r\n', '\n', data)
  333. t_data = middle_parser(data, t_data[1][0], t_data[1][1], t_data[1][2])
  334. data = t_data[0]
  335. data = re.sub('&amp;', '&', data)
  336. data = re.sub('\n( +)\|\|', '\n||', data)
  337. data = re.sub('\|\|( +)\n', '||\n', data)
  338. data = re.sub('\n##(((?!\n).)+)', '', data)
  339. while 1:
  340. wiki_table_data = re.search('<div id="wiki_div" ((?:(?!>).)+)>((?:(?!<div id="wiki_div"|<\/div_end>).\n*)+)<\/div_end>', data)
  341. if wiki_table_data:
  342. wiki_table_data = wiki_table_data.groups()
  343. if re.search('\|\|', wiki_table_data[1]):
  344. end_parser = re.sub('\n$', '', re.sub('^\n', '', table_start('\n' + wiki_table_data[1] + '\n')))
  345. else:
  346. end_parser = wiki_table_data[1]
  347. data = re.sub('<div id="wiki_div" ((?:(?!>).)+)>((?:(?!<div id="wiki_div"|<\/div_end>).\n*)+)<\/div_end>', '<div ' + wiki_table_data[0] + '>' + end_parser + '</div>', data, 1)
  348. else:
  349. break
  350. data = re.sub('<\/div_end>', '</div>', data)
  351. data = re.sub('<\/td>', '</td_end>', data)
  352. first = 0
  353. math_re = re.compile('\[math\(((?:(?!\)\]).)+)\)\]', re.I)
  354. while 1:
  355. math = math_re.search(data)
  356. if math:
  357. if first == 0:
  358. plus_data += '''
  359. <link rel="stylesheet" href="/views/main_css/katex/katex.min.css">
  360. <script src="/views/main_css/katex/katex.min.js"></script>
  361. '''
  362. math = math.groups()[0]
  363. first += 1
  364. data = math_re.sub('<span id="math_' + str(first) + '"></span>', data, 1)
  365. plus_data += '<script>katex.render("' + math.replace('\\', '\\\\').replace('&lt;', '<').replace('&gt;', '>') +'", document.getElementById("math_' + str(first) + '"));</script>'
  366. else:
  367. break
  368. num = 0
  369. while 1:
  370. one_nowiki = re.search('(?:\\\\)(.)', data)
  371. if one_nowiki:
  372. one_nowiki = one_nowiki.groups()
  373. num += 1
  374. end_data += [['one_nowiki_' + str(num), one_nowiki[0], 'normal']]
  375. data = re.sub('(?:\\\\)(.)', '<span id="one_nowiki_' + str(num) + '"></span>', data, 1)
  376. else:
  377. break
  378. while 1:
  379. hr = re.search('\n-{4,9}\n', data)
  380. if hr:
  381. data = re.sub('\n-{4,9}\n', '\n<hr>\n', data, 1)
  382. else:
  383. break
  384. data += '\n'
  385. data = data.replace('\\', '&#92;')
  386. data = re.sub('&#x27;&#x27;&#x27;(?P<in>((?!&#x27;&#x27;&#x27;).)+)&#x27;&#x27;&#x27;', '<b>\g<in></b>', data)
  387. data = re.sub('&#x27;&#x27;(?P<in>((?!&#x27;&#x27;).)+)&#x27;&#x27;', '<i>\g<in></i>', data)
  388. data = re.sub('~~(?P<in>(?:(?!~~).)+)~~', '<s>\g<in></s>', data)
  389. data = re.sub('--(?P<in>(?:(?!--).)+)--', '<s>\g<in></s>', data)
  390. data = re.sub('__(?P<in>(?:(?!__).)+)__', '<u>\g<in></u>', data)
  391. data = re.sub('\^\^(?P<in>(?:(?!\^\^).)+)\^\^', '<sup>\g<in></sup>', data)
  392. data = re.sub(',,(?P<in>(?:(?!,,).)+),,', '<sub>\g<in></sub>', data)
  393. redirect_re = re.compile('\n#(?:redirect|넘겨주기) ((?:(?!\n).)+)\n', re.I)
  394. redirect = redirect_re.search(data)
  395. if redirect:
  396. redirect = redirect.groups()[0]
  397. return_link = link_fix(redirect)
  398. main_link = return_link[0]
  399. other_link = return_link[1]
  400. backlink += [[title, main_link, 'redirect']]
  401. data = redirect_re.sub('\n * ' + title + ' - [[' + main_link + ']]\n', data, 1)
  402. no_toc_re = re.compile('\[(?:목차|toc)\((?:no)\)\]\n', re.I)
  403. toc_re = re.compile('\[(?:목차|toc)\]', re.I)
  404. if not no_toc_re.search(data):
  405. if not toc_re.search(data):
  406. data = re.sub('\n(?P<in>={1,6}) ?(?P<out>(?:(?!=).)+) ?={1,6}\n', '\n[toc]\n\g<in> \g<out> \g<in>\n', data, 1)
  407. else:
  408. data = no_toc_re.sub('', data)
  409. toc_full = 0
  410. toc_top_stack = 6
  411. toc_stack = [0, 0, 0, 0, 0, 0]
  412. edit_number = 0
  413. toc_data = '<div id="toc"><span style="font-size: 18px;">toc</span>\n\n'
  414. while 1:
  415. toc = re.search('\n(={1,6}) ?((?:(?!\n).)+) ?\n', data)
  416. if toc:
  417. toc = toc.groups()
  418. toc_number = len(toc[0])
  419. edit_number += 1
  420. if toc_full > toc_number:
  421. for i in range(toc_number, 6):
  422. toc_stack[i] = 0
  423. if toc_top_stack > toc_number:
  424. toc_top_stack = toc_number
  425. toc_full = toc_number
  426. toc_stack[toc_number - 1] += 1
  427. toc_number = str(toc_number)
  428. all_stack = ''
  429. for i in range(0, 6):
  430. all_stack += str(toc_stack[i]) + '.'
  431. while 1:
  432. if re.search('[^0-9]0\.', all_stack):
  433. all_stack = re.sub('[^0-9]0\.', '.', all_stack)
  434. else:
  435. break
  436. all_stack = re.sub('^0\.', '', all_stack)
  437. data = re.sub('\n(={1,6}) ?((?:(?!\n).)+) ?\n', '\n<h' + toc_number + ' id="s-' + re.sub('\.$', '', all_stack) + '"><a href="#toc">' + all_stack + '</a> ' + re.sub('=*$', '', toc[1]) + ' <span style="font-size: 12px"><a href="/edit/' + tool.url_pas(title) + '?section=' + str(edit_number) + '">(Edit)</a></span></h' + toc_number + '>\n', data, 1)
  438. toc_main_data = toc[1]
  439. toc_main_data = re.sub('=*$', '', toc_main_data)
  440. toc_main_data = re.sub('\[\*((?:(?! |\]).)*)(?: ((?:(?!(\[\*(?:(?:(?!\]).)+)\]|\])).)+))?\]', '', toc_main_data)
  441. toc_main_data = re.sub('<span id="math_[0-9]"><\/span>', '(수식)', toc_main_data)
  442. toc_data += '<span style="margin-left: ' + str((toc_full - toc_top_stack) * 10) + 'px;"><a href="#s-' + re.sub('\.$', '', all_stack) + '">' + all_stack + '</a> ' + toc_main_data + '</span>\n'
  443. else:
  444. break
  445. toc_data += '</div>'
  446. data = toc_re.sub(toc_data, data)
  447. data = tool.savemark(data)
  448. anchor_re = re.compile("\[anchor\((?P<in>(?:(?!\)\]).)+)\)\]", re.I)
  449. data = anchor_re.sub('<span id="\g<in>"></span>', data)
  450. ruby_re = re.compile("\[ruby\((?P<in>(?:(?!,).)+)\, ?(?P<out>(?:(?!\)\]).)+)\)\]", re.I)
  451. data = ruby_re.sub('<ruby>\g<in><rp>(</rp><rt>\g<out></rt><rp>)</rp></ruby>', data)
  452. now_time = tool.get_time()
  453. date_re = re.compile('\[date\]', re.I)
  454. data = date_re.sub(now_time, data)
  455. time_data = re.search('^([0-9]{4}-[0-9]{2}-[0-9]{2})', now_time)
  456. time = time_data.groups()
  457. age_re = re.compile('\[age\(([0-9]{4}-[0-9]{2}-[0-9]{2})\)\]', re.I)
  458. while 1:
  459. age_data = age_re.search(data)
  460. if age_data:
  461. age = age_data.groups()[0]
  462. old = datetime.datetime.strptime(time[0], '%Y-%m-%d')
  463. will = datetime.datetime.strptime(age, '%Y-%m-%d')
  464. e_data = old - will
  465. data = age_re.sub(str(int(e_data.days / 365)), data, 1)
  466. else:
  467. break
  468. dday_re = re.compile('\[dday\(([0-9]{4}-[0-9]{2}-[0-9]{2})\)\]', re.I)
  469. while 1:
  470. dday_data = dday_re.search(data)
  471. if dday_data:
  472. dday = dday_data.groups()[0]
  473. old = datetime.datetime.strptime(time[0], '%Y-%m-%d')
  474. will = datetime.datetime.strptime(dday, '%Y-%m-%d')
  475. e_data = old - will
  476. if re.search('^-', str(e_data.days)):
  477. e_day = str(e_data.days)
  478. else:
  479. e_day = '+' + str(e_data.days)
  480. data = dday_re.sub(e_day, data, 1)
  481. else:
  482. break
  483. video_re = re.compile('\[(youtube|kakaotv|nicovideo)\(((?:(?!\)\]).)+)\)\]', re.I)
  484. youtube_re = re.compile('youtube', re.I)
  485. kakaotv_re = re.compile('kakaotv', re.I)
  486. while 1:
  487. video = video_re.search(data)
  488. if video:
  489. video = video.groups()
  490. width = re.search(', ?width=((?:(?!,).)+)', video[1])
  491. if width:
  492. video_width = width.groups()[0]
  493. else:
  494. video_width = '560'
  495. height = re.search(', ?height=((?:(?!,).)+)', video[1])
  496. if height:
  497. video_height = height.groups()[0]
  498. else:
  499. video_height = '315'
  500. code = re.search('^((?:(?!,).)+)', video[1])
  501. if code:
  502. video_code = code.groups()[0]
  503. else:
  504. video_code = ''
  505. if youtube_re.search(video[0]):
  506. video_code = re.sub('^https:\/\/www\.youtube\.com\/watch\?v=', '', video_code)
  507. video_code = re.sub('^https:\/\/youtu\.be\/', '', video_code)
  508. video_src = 'https://www.youtube.com/embed/' + video_code
  509. elif kakaotv_re.search(video[0]):
  510. video_code = re.sub('^https:\/\/tv\.kakao\.com\/channel\/9262\/cliplink\/', '', video_code)
  511. video_code = re.sub('^http:\/\/tv\.kakao\.com\/v\/', '', video_code)
  512. video_src = 'https://tv.kakao.com/embed/player/cliplink/' + video_code +'?service=kakao_tv'
  513. else:
  514. video_src = 'https://embed.nicovideo.jp/watch/' + video_code
  515. data = video_re.sub('<iframe width="' + video_width + '" height="' + video_height + '" src="' + video_src + '" allowfullscreen frameborder="0"></iframe>', data, 1)
  516. else:
  517. break
  518. while 1:
  519. block = re.search('(\n(?:&gt; ?(?:(?:(?!\n).)+)?\n)+)', data)
  520. if block:
  521. block = block.groups()[0]
  522. block = re.sub('^\n&gt; ?', '', block)
  523. block = re.sub('\n&gt; ?', '\n', block)
  524. block = re.sub('\n$', '', block)
  525. data = re.sub('(\n(?:&gt; ?(?:(?:(?!\n).)+)?\n)+)', '\n<blockquote>' + block + '</blockquote>\n', data, 1)
  526. else:
  527. break
  528. data = re.sub('(?P<in>\n +\* ?(?:(?:(?!\|\|).)+))\|\|', '\g<in>\n ||', data)
  529. while 1:
  530. li = re.search('(\n(?:(?: *)\* ?(?:(?:(?!\n).)+)\n)+)', data)
  531. if li:
  532. li = li.groups()[0]
  533. while 1:
  534. sub_li = re.search('\n(?:( *)\* ?((?:(?!\n).)+))', li)
  535. if sub_li:
  536. sub_li = sub_li.groups()
  537. if len(sub_li[0]) == 0:
  538. margin = 20
  539. else:
  540. margin = len(sub_li[0]) * 20
  541. li = re.sub('\n(?:( *)\* ?((?:(?!\n).)+))', '<li style="margin-left: ' + str(margin) + 'px;">' + sub_li[1] + '</li>', li, 1)
  542. else:
  543. break
  544. data = re.sub('(\n(?:(?: *)\* ?(?:(?:(?!\n).)+)\n)+)', '\n\n<ul>' + li + '</ul>\n', data, 1)
  545. else:
  546. break
  547. data = re.sub('<\/ul>\n \|\|', '</ul>||', data)
  548. while 1:
  549. indent = re.search('\n( +)', data)
  550. if indent:
  551. indent = len(indent.groups()[0])
  552. margin = '<span style="margin-left: 20px;"></span>' * indent
  553. data = re.sub('\n( +)', '\n' + margin, data, 1)
  554. else:
  555. break
  556. data = table_start(data)
  557. category = '\n<hr><div id="cate">category : '
  558. category_re = re.compile('^(?:category|분류):', re.I)
  559. while 1:
  560. link = re.search('\[\[((?:(?!\[\[|\]\]).)+)\]\]', data)
  561. if link:
  562. link = link.groups()[0]
  563. link_split = re.search('((?:(?!\|).)+)(?:\|((?:(?!\|).)+))', link)
  564. if link_split:
  565. link_split = link_split.groups()
  566. main_link = link_split[0]
  567. see_link = link_split[1]
  568. else:
  569. main_link = link
  570. see_link = link
  571. if re.search('^((?:file|파일)|(?:out|외부)):', main_link):
  572. file_style = ''
  573. width = re.search('width=((?:(?!&).)+)', see_link)
  574. if width:
  575. file_width = width.groups()[0]
  576. if re.search('px$', file_width):
  577. file_style += 'width: ' + file_width + ';'
  578. else:
  579. file_style += 'width: ' + file_width + 'px;'
  580. height = re.search('height=((?:(?!&).)+)', see_link)
  581. if height:
  582. file_height = height.groups()[0]
  583. if re.search('px$', file_height):
  584. file_style += 'height: ' + file_height + ';'
  585. else:
  586. file_style += 'height: ' + file_height + 'px;'
  587. align = re.search('align=((?:(?!&).)+)', see_link)
  588. if align:
  589. file_align = align.groups()[0]
  590. if file_align == 'center':
  591. file_align = 'display: block; text-align: center;'
  592. else:
  593. file_align = 'float: ' + file_align + ';'
  594. else:
  595. file_align = ''
  596. if re.search('^(?:out|외부):', main_link):
  597. file_src = re.sub('^(?:out|외부):', '', main_link)
  598. file_alt = main_link
  599. exist = 'Yes'
  600. else:
  601. file_data = re.search('^(?:file|파일):((?:(?!\.).)+)\.(.+)$', main_link)
  602. if file_data:
  603. file_data = file_data.groups()
  604. file_name = file_data[0]
  605. file_end = file_data[1]
  606. backlink += [[title, main_link, 'file']]
  607. else:
  608. file_name = 'TEST'
  609. file_end = 'jpg'
  610. file_src = '/image/' + tool.sha224(file_name) + '.' + file_end
  611. file_alt = 'file:' + file_name + '.' + file_end
  612. curs.execute("select title from data where title = ?", [file_alt])
  613. exist = curs.fetchall()
  614. if exist:
  615. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<span style="' + file_align + '"><img style="' + file_style + '" alt="' + file_alt + '" src="' + file_src + '"></span>', data, 1)
  616. else:
  617. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="not_thing" href="/w/' + tool.url_pas(file_alt) + '">' + file_alt + '</a>', data, 1)
  618. elif category_re.search(main_link):
  619. see_link = re.sub('#include', '', see_link)
  620. main_link = re.sub('#include', '', category_re.sub('category:', main_link))
  621. if re.search('#blur', main_link):
  622. see_link = 'Hidden'
  623. link_id = 'id="inside"'
  624. main_link = re.sub('#blur', '', main_link)
  625. else:
  626. link_id = ''
  627. backlink += [[title, main_link, 'cat']]
  628. category += '<a ' + link_id + ' href="' + tool.url_pas(main_link) + '">' + category_re.sub('', see_link) + '</a> / '
  629. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '', data, 1)
  630. elif re.search('^wiki:', main_link):
  631. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="inside" href="/' + tool.url_pas(re.sub('^wiki:', '', main_link)) + '">' + see_link + '</a>', data, 1)
  632. elif re.search('^inter:((?:(?!:).)+):', main_link):
  633. inter_data = re.search('^inter:((?:(?!:).)+):((?:(?!\]\]|\|).)+)', main_link)
  634. inter_data = inter_data.groups()
  635. curs.execute('select link from inter where title = ?', [inter_data[0]])
  636. inter = curs.fetchall()
  637. if inter:
  638. if see_link != main_link:
  639. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="inside" href="' + inter[0][0] + inter_data[1] + '">' + inter_data[0] + ':' + see_link + '</a>', data, 1)
  640. else:
  641. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="inside" href="' + inter[0][0] + inter_data[1] + '">' + inter_data[0] + ':' + inter_data[1] + '</a>', data, 1)
  642. else:
  643. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', 'Not exist', data, 1)
  644. elif re.search('^\/', main_link):
  645. under_title = re.search('^(\/(?:.+))$', main_link)
  646. under_title = under_title.groups()[0]
  647. if see_link != main_link:
  648. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '[[' + title + under_title + '|' + see_link + ']]', data, 1)
  649. else:
  650. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '[[' + title + under_title + ']]', data, 1)
  651. elif re.search('^http(s)?:\/\/', main_link):
  652. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="out_link" rel="nofollow" href="' + main_link + '">' + see_link + '</a>', data, 1)
  653. else:
  654. return_link = link_fix(main_link)
  655. main_link = return_link[0]
  656. other_link = return_link[1]
  657. if re.search('^\/', main_link):
  658. main_link = re.sub('^\/', title + '/', main_link)
  659. elif re.search('\.\.\/\/', main_link):
  660. main_link = re.sub('\.\.\/\/', '/', main_link)
  661. elif re.search('^\.\.\/', main_link):
  662. main_link = re.sub('^\.\.\/', re.sub('(?P<in>.+)\/.*$', '\g<in>', title), main_link)
  663. if not re.search('^\|', main_link):
  664. if main_link != title:
  665. if main_link != '':
  666. curs.execute("select title from data where title = ?", [main_link])
  667. if not curs.fetchall():
  668. link_id = 'id="not_thing"'
  669. backlink += [[title, main_link, 'no']]
  670. else:
  671. link_id = ''
  672. backlink += [[title, main_link, '']]
  673. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a ' + link_id + ' href="/w/' + tool.url_pas(main_link) + other_link + '">' + see_link + '</a>', data, 1)
  674. else:
  675. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a href="' + other_link + '">' + see_link + '</a>', data, 1)
  676. else:
  677. if re.search('^#', other_link):
  678. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a href="' + other_link + '">' + other_link + '</a>', data, 1)
  679. else:
  680. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<b>' + see_link + '</b>', data, 1)
  681. else:
  682. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '&#91;&#91;' + link + '&#93;&#93;', data, 1)
  683. else:
  684. break
  685. br_re = re.compile('\[br\]', re.I)
  686. data = br_re.sub('<br>', data)
  687. footnote_number = 0
  688. footnote_all = []
  689. footnote_dict = {}
  690. footnote_re = {}
  691. footdata_all = '\n<hr><ul id="footnote_data">'
  692. while 1:
  693. footnote = re.search('(?:\[\*((?:(?! |\]).)*)(?: ((?:(?!(?:\[\*(?:(?:(?!\]).)+)\]|\])).)+))?\]|(\[(?:각주|footnote)\]))', data)
  694. if footnote:
  695. footnote_data = footnote.groups()
  696. if footnote_data[2]:
  697. footnote_all.sort()
  698. for footdata in footnote_all:
  699. if footdata[2] == 0:
  700. footdata_in = ''
  701. else:
  702. footdata_in = footdata[2]
  703. footdata_all += '<li><a href="#rfn-' + str(footdata[0]) + '" id="fn-' + str(footdata[0]) + '">(' + footdata[1] + ')</a> ' + footdata_in + '</li>'
  704. data = re.sub('(?:\[\*((?:(?! ).)*) ((?:(?!\]).)+)\]|(\[(?:각주|footnote)\]))', footdata_all + '</ul>', data, 1)
  705. footnote_all = []
  706. footdata_all = '\n<hr><ul id="footnote_data">'
  707. else:
  708. footnote = footnote_data[1]
  709. footnote_name = footnote_data[0]
  710. if footnote_name and not footnote:
  711. if footnote_name in footnote_dict:
  712. footnote_re[footnote_name] += 1
  713. foot_plus_num = str(footnote_re[footnote_name])
  714. footshort = footnote_dict[footnote_name] + '.' + foot_plus_num
  715. footnote_all += [[float(footshort), footshort, 0]]
  716. data = re.sub('(?:\[\*((?:(?! |\]).)*)(?: ((?:(?!(?:\[\*(?:(?:(?!\]).)+)\]|\])).)+))?\]|(\[(?:각주|footnote)\]))', '<sup><a href="#fn-' + footshort + '" id="rfn-' + footshort + '">(' + footshort + ')</a></sup>', data, 1)
  717. else:
  718. data = re.sub('(?:\[\*((?:(?! |\]).)*)(?: ((?:(?!(?:\[\*(?:(?:(?!\]).)+)\]|\])).)+))?\]|(\[(?:각주|footnote)\]))', '<sup><a href="#">(' + footnote_name + ')</a></sup>', data, 1)
  719. else:
  720. footnote_number += 1
  721. if not footnote_name:
  722. footnote_name = str(footnote_number)
  723. footnote_dict.update({ footnote_name : str(footnote_number) })
  724. if not footnote_name in footnote_re:
  725. footnote_re.update({ footnote_name : 0 })
  726. else:
  727. footnote_re[footnote_name] += 1
  728. footnote_all += [[footnote_number, footnote_name, footnote]]
  729. data = re.sub('(?:\[\*((?:(?! |\]).)*)(?: ((?:(?!(?:\[\*(?:(?:(?!\]).)+)\]|\])).)+))?\]|(\[(?:각주|footnote)\]))', '<sup><a href="#fn-' + str(footnote_number) + '" id="rfn-' + str(footnote_number) + '">(' + footnote_name + ')</a></sup>', data, 1)
  730. else:
  731. break
  732. data = re.sub('\n+$', '', data)
  733. footnote_all.sort()
  734. for footdata in footnote_all:
  735. if footdata[2] == 0:
  736. footdata_in = ''
  737. else:
  738. footdata_in = footdata[2]
  739. footdata_all += '<li><a href="#rfn-' + str(footdata[0]) + '" id="fn-' + str(footdata[0]) + '">(' + footdata[1] + ')</a> ' + footdata_in + '</li>'
  740. footdata_all += '</ul>'
  741. if footdata_all == '\n<hr><ul id="footnote_data"></ul>':
  742. footdata_all = ''
  743. data = re.sub('\n$', footdata_all, data + '\n', 1)
  744. category += '</div>'
  745. category = re.sub(' / <\/div>$', '</div>', category)
  746. if category == '\n<hr><div id="cate">category : </div>':
  747. category = ''
  748. data += category
  749. i = 0
  750. while 1:
  751. try:
  752. _ = end_data[i][0]
  753. except:
  754. break
  755. if end_data[i][2] == 'normal':
  756. data = data.replace('<span id="' + end_data[i][0] + '"></span>', end_data[i][1])
  757. data = data.replace(tool.url_pas('<span id="' + end_data[i][0] + '"></span>'), tool.url_pas(end_data[i][1]))
  758. else:
  759. if re.search('\n', end_data[i][1]):
  760. data = data.replace('<span id="' + end_data[i][0] + '"></span>', '\n<pre>' + re.sub('^\n', '', end_data[i][1]) + '</pre>')
  761. else:
  762. data = data.replace('<span id="' + end_data[i][0] + '"></span>', '<code>' + end_data[i][1] + '</code>')
  763. i += 1
  764. if main_num == 1:
  765. i = 0
  766. while 1:
  767. try:
  768. _ = backlink[i][0]
  769. except:
  770. break
  771. find_data = re.search('<span id="(one_nowiki_[0-9]+)">', backlink[i][1])
  772. if find_data:
  773. j = 0
  774. find_data = find_data.groups()[0]
  775. while 1:
  776. try:
  777. _ = end_data[j][0]
  778. except:
  779. break
  780. if end_data[j][0] == find_data:
  781. backlink[i][1] = backlink[i][1].replace('<span id="' + end_data[j][0] + '"></span>', end_data[j][1])
  782. j += 1
  783. i += 1
  784. data = re.sub('<\/td_end>', '</td>', data)
  785. data = re.sub('<include>\n', '', data)
  786. data = re.sub('\n<\/include>', '', data)
  787. data = re.sub('(?P<in><\/h[0-9]>)(\n)+', '\g<in>', data)
  788. data = re.sub('\n\n<ul>', '\n<ul>', data)
  789. data = re.sub('<\/ul>\n\n', '</ul>', data)
  790. data = re.sub('^(\n)+', '', data)
  791. data = re.sub('(\n)+<hr><ul id="footnote_data">', '<hr><ul id="footnote_data">', data)
  792. data = re.sub('(?P<in><td(((?!>).)*)>)\n', '\g<in>', data)
  793. data = re.sub('(\n)?<hr>(\n)?', '<hr>', data)
  794. data = re.sub('<\/ul>\n\n<ul>', '</ul>\n<ul>', data)
  795. data = re.sub('\n', '<br>', data)
  796. return [data, plus_data, backlink]