start.py 40 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902
  1. from . import tool
  2. import datetime
  3. import html
  4. import re
  5. def table_parser(data, cel_data, start_data, num = 0):
  6. table_class = 'class="'
  7. all_table = 'style="'
  8. cel_style = 'style="'
  9. row_style = 'style="'
  10. row = ''
  11. cel = ''
  12. table_width = re.search("<table ?width=((?:(?!>).)*)>", data)
  13. if table_width:
  14. if re.search('^[0-9]+$', table_width.groups()[0]):
  15. all_table += 'width: ' + table_width.groups()[0] + 'px;'
  16. else:
  17. all_table += 'width: ' + table_width.groups()[0] + ';'
  18. table_height = re.search("<table ?height=((?:(?!>).)*)>", data)
  19. if table_height:
  20. if re.search('^[0-9]+$', table_height.groups()[0]):
  21. all_table += 'height: ' + table_height.groups()[0] + 'px;'
  22. else:
  23. all_table += 'height: ' + table_height.groups()[0] + ';'
  24. table_align = re.search("<table ?align=((?:(?!>).)*)>", data)
  25. if table_align:
  26. if table_align.groups()[0] == 'right':
  27. all_table += 'float: right;'
  28. elif table_align.groups()[0] == 'center':
  29. all_table += 'margin: auto;'
  30. table_text_align = re.search("<table ?textalign=((?:(?!>).)*)>", data)
  31. if table_text_align:
  32. num = 1
  33. if table_text_align.groups()[0] == 'right':
  34. all_table += 'text-align: right;'
  35. elif table_text_align.groups()[0] == 'center':
  36. all_table += 'text-align: center;'
  37. row_table_align = re.search("<row ?textalign=((?:(?!>).)*)>", data)
  38. if row_table_align:
  39. if row_table_align.groups()[0] == 'right':
  40. row_style += 'text-align: right;'
  41. elif row_table_align.groups()[0] == 'center':
  42. row_style += 'text-align: center;'
  43. else:
  44. row_style += 'text-align: left;'
  45. table_cel = re.search("<-((?:(?!>).)*)>", data)
  46. if table_cel:
  47. cel = 'colspan="' + table_cel.groups()[0] + '"'
  48. else:
  49. cel = 'colspan="' + str(round(len(start_data) / 2)) + '"'
  50. table_row = re.search("<\|((?:(?!>).)*)>", data)
  51. if table_row:
  52. row = 'rowspan="' + table_row.groups()[0] + '"'
  53. row_bgcolor = re.search("<rowbgcolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  54. if row_bgcolor:
  55. row_style += 'background: ' + row_bgcolor.groups()[0] + ';'
  56. table_border = re.search("<table ?bordercolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  57. if table_border:
  58. all_table += 'border: ' + table_border.groups()[0] + ' 2px solid;'
  59. table_bgcolor = re.search("<table ?bgcolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  60. if table_bgcolor:
  61. all_table += 'background: ' + table_bgcolor.groups()[0] + ';'
  62. bgcolor = re.search("<(?:bgcolor=)?(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  63. if bgcolor:
  64. cel_style += 'background: ' + bgcolor.groups()[0] + ';'
  65. cel_width = re.search("<width=((?:(?!>).)*)>", data)
  66. if cel_width:
  67. cel_style += 'width: ' + cel_width.groups()[0] + 'px;'
  68. cel_height = re.search("<height=((?:(?!>).)*)>", data)
  69. if cel_height:
  70. cel_style += 'height: ' + cel_height.groups()[0] + 'px;'
  71. text_right = re.search("<\)>", data)
  72. text_center = re.search("<:>", data)
  73. text_left = re.search("<\(>", data)
  74. if text_right:
  75. cel_style += 'text-align: right;'
  76. elif text_center:
  77. cel_style += 'text-align: center;'
  78. elif text_left:
  79. cel_style += 'text-align: left;'
  80. elif num == 0:
  81. if re.search('^ (.*) $', cel_data):
  82. cel_style += 'text-align: center;'
  83. elif re.search('^ (.*)$', cel_data):
  84. cel_style += 'text-align: right;'
  85. elif re.search('^(.*) $', cel_data):
  86. cel_style += 'text-align: left;'
  87. text_class = re.search("<table ?class=((?:(?!>).)+)>", data)
  88. if text_class:
  89. table_class += text_class.groups()[0]
  90. all_table += '"'
  91. cel_style += '"'
  92. row_style += '"'
  93. table_class += '"'
  94. return [all_table, row_style, cel_style, row, cel, table_class, num]
  95. def link_fix(main_link):
  96. if re.search('^:', main_link):
  97. main_link = re.sub('^:', '', main_link)
  98. other_link = re.search('(#.+)$', main_link)
  99. if other_link:
  100. other_link = other_link.groups()[0]
  101. main_link = re.sub('(#.+)$', '', main_link)
  102. else:
  103. other_link = ''
  104. return [main_link, other_link]
  105. def start(conn, data, title):
  106. # DB 지정
  107. curs = conn.cursor()
  108. # 초기 설정
  109. data = '\n' + data + '\n'
  110. backlink = []
  111. plus_data = ''
  112. end_data= []
  113. # XSS 이스케이프
  114. data = html.escape(data)
  115. # 한 글자 NoWiki
  116. num = 0
  117. while 1:
  118. one_nowiki = re.search('(?:\\\\){1,2}(.)', data)
  119. if one_nowiki:
  120. one_nowiki = one_nowiki.groups()
  121. num += 1
  122. end_data += [['one_nowiki_' + str(num), one_nowiki[0]]]
  123. data = re.sub('(?:\\\\){1,2}(.)', '<span id="one_nowiki_' + str(num) + '"></span>', data, 1)
  124. else:
  125. break
  126. # 포함 문법 처리
  127. while 1:
  128. include = re.search('\[include\(((?:(?!\)\]).)+)\)\]', data)
  129. if include:
  130. include = include.groups()[0]
  131. include_data = re.search('^((?:(?!,).)+)', include)
  132. if include_data:
  133. include_data = include_data.groups()[0]
  134. else:
  135. include_data = 'Test'
  136. include_link = include_data
  137. backlink += [[title, include_link, 'include']]
  138. include = re.sub('^((?:(?!,).)+)', '', include)
  139. curs.execute("select data from data where title = ?", [include_data])
  140. include_data = curs.fetchall()
  141. if include_data:
  142. include_parser = include_data[0][0]
  143. while 1:
  144. include_plus = re.search(', ?((?:(?!=).)+)=((?:(?!,).)+)', include)
  145. if include_plus:
  146. include_plus = include_plus.groups()
  147. include_parser = re.sub('@' + include_plus[0] + '@', include_plus[1], include_parser)
  148. include = re.sub(', ?((?:(?!=).)+)=((?:(?!,).)+)', '', include, 1)
  149. else:
  150. break
  151. include_parser = re.sub('\[\[분류:(((?!\]\]|#include).)+)\]\]', '', include_parser)
  152. include_parser = html.escape(include_parser)
  153. data = re.sub('\[include\(((?:(?!\)\]).)+)\)\]', '\n' + include_parser + '\n', data, 1)
  154. else:
  155. data = re.sub('\[include\(((?:(?!\)\]).)+)\)\]', '<a id="not_thing" href="/w/' + tool.url_pas(include_link) + '">' + include_link + '</a>', data, 1)
  156. else:
  157. break
  158. # 개행 정리
  159. data = re.sub('\r\n', '\n', data)
  160. # 기타 처리
  161. data = re.sub('&amp;', '&', data)
  162. # HTML 허용
  163. src_list = ["www.youtube.com", "serviceapi.nmv.naver.com", "tv.kakao.com", "www.google.com", "serviceapi.rmcnmv.naver.com"]
  164. html_list = ['div', 'span', 'embed', 'iframe', 'ruby', 'rp', 'rt']
  165. html_data = re.findall('&lt;(\/)?((?:(?!&gt;| ).)+)( (?:(?:(?!&gt;).)+)?)?&gt;', data)
  166. for in_data in html_data:
  167. if in_data[0] == '':
  168. if in_data[1] in html_list:
  169. if re.search('&lt;\/' + in_data[1] + '&gt;', data):
  170. src = re.search('src=([^ ]*)', in_data[2])
  171. if src:
  172. v_src = re.search('http(?:s)?:\/\/([^/\'" ]*)', src.groups()[0])
  173. if v_src:
  174. if not v_src.groups()[0] in src_list:
  175. and_data = re.sub('&#x27;', '\'', re.sub('&quot;', '"', re.sub('src=([^ ]*)', '', in_data[2])))
  176. else:
  177. and_data = re.sub('&#x27;', '\'', re.sub('&quot;', '"', in_data[2]))
  178. else:
  179. and_data = re.sub('&#x27;', '\'', re.sub('&quot;', '"', re.sub('src=([^ ]*)', '', in_data[2])))
  180. else:
  181. and_data = re.sub('&#x27;', '\'', re.sub('&quot;', '"', in_data[2]))
  182. data = re.sub('&lt;' + in_data[1] + in_data[2] + '&gt;', '<' + in_data[1] + and_data + '>', data, 1)
  183. data = re.sub('&lt;\/' + in_data[1] + '&gt;', '</' + in_data[1] + '>', data, 1)
  184. position = re.compile('position', re.I)
  185. data = position.sub('', data)
  186. # 표 정리
  187. data = re.sub('\n( +)\|\|', '\n||', data)
  188. data = re.sub('\|\|( +)\n', '||\n', data)
  189. # 주석 처리
  190. data = re.sub('\n##(((?!\n).)+)', '', data)
  191. # 중괄호 문법 처리
  192. middle_stack = 0
  193. middle_list = []
  194. middle_number = 0
  195. while 1:
  196. middle_data = re.search('(?:{{{((?:(?! |{{{|}}}).)*) ?|(}}}))', data)
  197. if middle_data:
  198. middle_data = middle_data.groups()
  199. if middle_data[0]:
  200. if middle_stack > 0:
  201. middle_stack += 1
  202. data = re.sub('(?:{{{((?:(?! |{{{|}}}).)*) ?|(}}}))', '&#123;&#123;&#123;' + middle_data[0], data, 1)
  203. else:
  204. if re.search('^(#|@|\+|\-)', middle_data[0]):
  205. middle_search = re.search('^(#(?:[0-9a-f-A-F]{3}){1,2})', middle_data[0])
  206. if middle_search:
  207. middle_list += ['span']
  208. data = re.sub('(?:{{{((?:(?! |{{{|}}}).)*) ?|(}}}))', '<span style="color: ' + middle_search.groups()[0] + ';">', data, 1)
  209. else:
  210. middle_search = re.search('^(?:#(\w+))', middle_data[0])
  211. if middle_search:
  212. middle_list += ['span']
  213. data = re.sub('(?:{{{((?:(?! |{{{|}}}).)*) ?|(}}}))', '<span style="color: ' + middle_search.groups()[0] + ';">', data, 1)
  214. else:
  215. middle_search = re.search('^(?:@((?:[0-9a-f-A-F]{3}){1,2}))', middle_data[0])
  216. if middle_search:
  217. middle_list += ['span']
  218. data = re.sub('(?:{{{((?:(?! |{{{|}}}).)*) ?|(}}}))', '<span style="background: #' + middle_search.groups()[0] + ';">', data, 1)
  219. else:
  220. middle_search = re.search('^(?:@(\w+))', middle_data[0])
  221. if middle_search:
  222. middle_list += ['span']
  223. data = re.sub('(?:{{{((?:(?! |{{{|}}}).)*) ?|(}}}))', '<span style="background: ' + middle_search.groups()[0] + ';">', data, 1)
  224. else:
  225. middle_search = re.search('^(\+|-)([1-5])', middle_data[0])
  226. if middle_search:
  227. middle_search = middle_search.groups()
  228. if middle_search[0] == '+':
  229. font_size = str(int(middle_search[1]) * 20 + 100)
  230. else:
  231. font_size = str(100 - int(middle_search[1]) * 10)
  232. middle_list += ['span']
  233. data = re.sub('(?:{{{((?:(?! |{{{|}}}).)*) ?|(}}}))', '<span style="font-size: ' + font_size + '%;">', data, 1)
  234. else:
  235. middle_search = re.search('^#!wiki', middle_data[0])
  236. if middle_search:
  237. middle_data_2 = re.search('{{{#!wiki style=(?:&quot;|&#x27;)((?:(?!&quot;|&#x27;).)*)(?:&quot;|&#x27;)\n', data)
  238. middle_data_2 = middle_data_2.groups()
  239. middle_list += ['div']
  240. data = re.sub('{{{#!wiki style=(?:&quot;|&#x27;)((?:(?!&quot;|&#x27;).)*)(?:&quot;|&#x27;)\n', '<div style="' + middle_data_2[0] + '">', data, 1)
  241. else:
  242. middle_search = re.search('^#!syntax', middle_data[0])
  243. if middle_search:
  244. if plus_data == '':
  245. plus_data = '<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/9.12.0/styles/default.min.css"><script src="//cdnjs.cloudflare.com/ajax/libs/highlight.js/9.12.0/highlight.min.js"></script><script>hljs.initHighlightingOnLoad();</script>'
  246. middle_data_2 = re.search('{{{#!syntax ((?:(?!\n).)+)\n', data)
  247. middle_data_2 = middle_data_2.groups()
  248. middle_list += ['code', 'pre']
  249. middle_number += 1
  250. data = re.sub('{{{#!syntax ((?:(?!\n).)+)\n', '<pre id="syntax"><code class="' + middle_data_2[0] + '">', data, 1)
  251. else:
  252. middle_search = re.search('^#!html', middle_data[0])
  253. if middle_search:
  254. middle_list += ['span']
  255. data = re.sub('(?:{{{((?:(?! |{{{|}}}).)*) ?|(}}}))', '<span>', data, 1)
  256. else:
  257. middle_search = re.search('^#!folding', middle_data[0])
  258. if middle_search:
  259. middle_list += ['span']
  260. data = re.sub('(?:{{{((?:(?! |{{{|}}}).)*) ?|(}}}))', '<span>', data, 1)
  261. else:
  262. middle_list += ['span']
  263. data = re.sub('(?:{{{((?:(?! |{{{|}}}).)*) ?|(}}}))', '<span>', data, 1)
  264. else:
  265. middle_list += ['code']
  266. middle_stack += 1
  267. data = re.sub('(?:{{{((?:(?! |{{{|}}}).)*)|(}}}))', '<code>' + middle_data[0], data, 1)
  268. middle_number += 1
  269. else:
  270. if middle_list == []:
  271. break
  272. if middle_stack > 0:
  273. middle_stack -= 1
  274. if middle_stack > 0:
  275. data = re.sub('(?:{{{((?:(?! |{{{|}}}).)*) ?|(}}}))', '&#125;&#125;&#125;', data, 1)
  276. else:
  277. if middle_number > 0:
  278. middle_number -= 1
  279. if middle_list[middle_number] == 'pre':
  280. data = re.sub('(?:{{{((?:(?! |{{{|}}}).)*) ?|(}}}))', '</code></pre>', data, 1)
  281. del(middle_list[middle_number])
  282. middle_number -= 1
  283. else:
  284. data = re.sub('(?:{{{((?:(?! |{{{|}}}).)*) ?|(}}}))', '</' + middle_list[middle_number] + '>', data, 1)
  285. del(middle_list[middle_number])
  286. else:
  287. break
  288. # NoWiki 처리
  289. num = 0
  290. while 1:
  291. nowiki_data = re.search('<code>((?:(?:(?!<\/code>).)+\n*)+)<\/code>', data)
  292. if nowiki_data:
  293. nowiki_data = nowiki_data.groups()
  294. num += 1
  295. end_data += [['nowiki_' + str(num), nowiki_data[0]]]
  296. data = re.sub('<code>((?:(?:(?!<\/code>).)+\n*)+)<\/code>', '<span id="nowiki_' + str(num) + '"></span>', data, 1)
  297. else:
  298. break
  299. # Syntax 처리
  300. num = 0
  301. while 1:
  302. syntax_data = re.search('<code class="((?:(?!").)+)">((?:(?:(?:(?!<\/code>|<span id="syntax_)).)+\n*)+)<\/code>', data)
  303. if syntax_data:
  304. syntax_data = syntax_data.groups()
  305. num += 1
  306. end_data += [['syntax_' + str(num), syntax_data[1]]]
  307. data = re.sub('<code class="((?:(?!").)+)">((?:(?:(?:(?!<\/code>|<span id="syntax_)).)+\n*)+)<\/code>', '<code class="' + syntax_data[0] + '"><span id="syntax_' + str(num) + '"></span></code>', data, 1)
  308. else:
  309. break
  310. # 수식 처리
  311. first = 0
  312. while 1:
  313. math = re.search('&lt;math&gt;((?:(?!&lt;\/math&gt;).)+)&lt;\/math&gt;', data)
  314. if math:
  315. if first == 0:
  316. plus_data += '<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.9.0/katex.min.css" integrity="sha384-TEMocfGvRuD1rIAacqrknm5BQZ7W7uWitoih+jMNFXQIbNl16bO8OZmylH/Vi/Ei" crossorigin="anonymous"><script src="https://cdnjs.cloudflare.com/ajax/libs/KaTeX/0.9.0/katex.min.js" integrity="sha384-jmxIlussZWB7qCuB+PgKG1uLjjxbVVIayPJwi6cG6Zb4YKq0JIw+OMnkkEC7kYCq" crossorigin="anonymous"></script>'
  317. math = math.groups()[0]
  318. first += 1
  319. data = re.sub('&lt;math&gt;((?:(?!&lt;\/math&gt;).)+)&lt;\/math&gt;', '<span id="math_' + str(first) + '"></span>', data, 1)
  320. plus_data += '<script>katex.render("' + math.replace('\\', '\\\\') +'", document.getElementById("math_' + str(first) + '"));</script>'
  321. else:
  322. break
  323. # 추가 이스케이프
  324. data = data.replace('\\', '&#92;')
  325. # 텍스트 꾸미기 문법
  326. data = re.sub('&#x27;&#x27;&#x27;(?P<in>((?!&#x27;&#x27;&#x27;).)+)&#x27;&#x27;&#x27;', '<b>\g<in></b>', data)
  327. data = re.sub('&#x27;&#x27;(?P<in>((?!&#x27;&#x27;).)+)&#x27;&#x27;', '<i>\g<in></i>', data)
  328. data = re.sub('~~(?P<in>(?:(?!~~).)+)~~', '<s>\g<in></s>', data)
  329. data = re.sub('--(?P<in>(?:(?!~~).)+)--', '<s>\g<in></s>', data)
  330. data = re.sub('__(?P<in>(?:(?!__).)+)__', '<u>\g<in></u>', data)
  331. data = re.sub('\^\^(?P<in>(?:(?!\^\^).)+)\^\^', '<sup>\g<in></sup>', data)
  332. data = re.sub(',,(?P<in>(?:(?!,,).)+),,', '<sub>\g<in></sub>', data)
  333. # 넘겨주기 변환
  334. redirect = re.search('\n#(?:redirect|넘겨주기) ((?:(?!\n).)+)\n', data)
  335. if redirect:
  336. redirect = redirect.groups()[0]
  337. return_link = link_fix(redirect)
  338. main_link = return_link[0]
  339. other_link = return_link[1]
  340. backlink += [[title, main_link, 'redirect']]
  341. data = re.sub('\n#(?:redirect|넘겨주기) (?P<in>(?:(?!\n).)+)\n', '<meta http-equiv="refresh" content="0; url=/w/' + tool.url_pas(main_link) + '?froms=' + tool.url_pas(title) + other_link + '">', data, 1)
  342. # [목차(없음)] 처리
  343. if not re.search('\[목차\(없음\)\]\n', data):
  344. if not re.search('\[목차\]', data):
  345. data = re.sub('\n(?P<in>={1,6}) ?(?P<out>(?:(?!=).)+) ?={1,6}\n', '\n[목차]\n\g<in> \g<out> \g<in>\n', data, 1)
  346. else:
  347. data = re.sub('\[목차\(없음\)\]\n', '', data)
  348. # 문단 문법
  349. toc_full = 0
  350. toc_top_stack = 6
  351. toc_stack = [0, 0, 0, 0, 0, 0]
  352. edit_number = 0
  353. toc_data = '<div id="toc"><span style="font-size: 18px;">목차</span>\n\n'
  354. while 1:
  355. toc = re.search('\n(={1,6}) ?((?:(?!=).)+) ?={1,6}\n', data)
  356. if toc:
  357. toc = toc.groups()
  358. toc_number = len(toc[0])
  359. edit_number += 1
  360. # 더 크면 그 전 스택은 초기화
  361. if toc_full > toc_number:
  362. for i in range(toc_number, 6):
  363. toc_stack[i] = 0
  364. if toc_top_stack > toc_number:
  365. toc_top_stack = toc_number
  366. toc_full = toc_number
  367. toc_stack[toc_number - 1] += 1
  368. toc_number = str(toc_number)
  369. all_stack = ''
  370. # 스택 합치기
  371. for i in range(0, 6):
  372. all_stack += str(toc_stack[i]) + '.'
  373. all_stack = re.sub('0.', '', all_stack)
  374. data = re.sub('\n(={1,6}) ?((?:(?!=).)+) ?={1,6}\n', '\n<h' + toc_number + ' id="s-' + re.sub('\.$', '', all_stack) + '"><a href="#toc">' + all_stack + '</a> ' + toc[1] + ' <span style="font-size: 12px"><a href="/edit/' + tool.url_pas(title) + '?section=' + str(edit_number) + '">(편집)</a></span></h' + toc_number + '>\n', data, 1)
  375. toc_data += '<span style="margin-left: ' + str((toc_full - toc_top_stack) * 10) + 'px;"><a href="#s-' + re.sub('\.$', '', all_stack) + '">' + all_stack + '</a> ' + re.sub('\[\*((?:(?! |\]).)*)(?: ((?:(?!\]).)+))?\]', '', toc[1]) + '</span>\n'
  376. else:
  377. break
  378. toc_data += '</div>'
  379. data = re.sub('\[목차\]', toc_data, data)
  380. while 1:
  381. hr = re.search('\n-{4,9}\n', data)
  382. if hr:
  383. data = re.sub('\n-{4,9}\n', '\n<hr>\n', data, 1)
  384. else:
  385. break
  386. data += '\n'
  387. # 일부 매크로 처리
  388. data = tool.savemark(data)
  389. data = re.sub("\[anchor\((?P<in>(?:(?!\)\]).)+)\)\]", '<span id="\g<in>"></span>', data)
  390. data = re.sub("\[nicovideo\((?P<in>(?:(?!,|\)\]).)+)(?:(?:(?!\)\]).)*)\)\]", "[[http://embed.nicovideo.jp/watch/\g<in>|\g<in>]]", data)
  391. data = re.sub('\[ruby\((?P<in>(?:(?!,).)+)\, ?(?P<out>(?:(?!\)\]).)+)\)\]', '<ruby>\g<in><rp>(</rp><rt>\g<out></rt><rp>)</rp></ruby>', data)
  392. # 원래 코드 재탕
  393. now_time = tool.get_time()
  394. data = re.sub('\[date\]', now_time, data)
  395. time_data = re.search('^([0-9]{4}-[0-9]{2}-[0-9]{2})', now_time)
  396. time = time_data.groups()
  397. age_data = re.findall('\[age\(([0-9]{4}-[0-9]{2}-[0-9]{2})\)\]', data)
  398. for age in age_data:
  399. old = datetime.datetime.strptime(time[0], '%Y-%m-%d')
  400. will = datetime.datetime.strptime(age, '%Y-%m-%d')
  401. e_data = old - will
  402. data = re.sub('\[age\(([0-9]{4})-([0-9]{2})-([0-9]{2})\)\]', str(int(int(e_data.days) / 365)), data, 1)
  403. dday_data = re.findall('\[dday\(([0-9]{4}-[0-9]{2}-[0-9]{2})\)\]', data)
  404. for dday in dday_data:
  405. old = datetime.datetime.strptime(time[0], '%Y-%m-%d')
  406. will = datetime.datetime.strptime(dday, '%Y-%m-%d')
  407. e_data = old - will
  408. if re.search('^-', str(e_data.days)):
  409. e_day = str(e_data.days)
  410. else:
  411. e_day = '+' + str(e_data.days)
  412. data = re.sub('\[dday\(([0-9]{4}-[0-9]{2}-[0-9]{2})\)\]', e_day, data, 1)
  413. # 유튜브, 카카오 티비 처리
  414. while 1:
  415. video = re.search('\[(youtube|kakaotv)\(((?:(?!\)\]).)+)\)\]', data)
  416. if video:
  417. video = video.groups()
  418. width = re.search(', ?width=((?:(?!,).)+)', video[1])
  419. if width:
  420. video_width = width.groups()[0]
  421. else:
  422. video_width = '560'
  423. height = re.search(', ?height=((?:(?!,).)+)', video[1])
  424. if height:
  425. video_height = height.groups()[0]
  426. else:
  427. video_height = '315'
  428. code = re.search('^(((?!,).)+)', video[1])
  429. if code:
  430. video_code = code.groups()[0]
  431. else:
  432. if video[0] == 'youtube':
  433. video_code = 'BQ5PcIUcdUE'
  434. else:
  435. video_code = '66861302'
  436. if video[0] == 'youtube':
  437. video_code = re.sub('^https:\/\/www\.youtube\.com\/watch\?v=', '', video_code)
  438. video_code = re.sub('^https:\/\/youtu\.be\/', '', video_code)
  439. video_src = 'https://www.youtube.com/embed/' + video_code
  440. else:
  441. video_code = re.sub('^https:\/\/tv\.kakao\.com\/channel\/9262\/cliplink\/', '', video_code)
  442. video_code = re.sub('^http:\/\/tv\.kakao\.com\/v\/', '', video_code)
  443. video_src = 'https://tv.kakao.com/embed/player/cliplink/' + video_code +'?service=kakao_tv'
  444. data = re.sub('\[(youtube|kakaotv)\(((?:(?!\)\]).)+)\)\]', '<iframe width="' + video_width + '" height="' + video_height + '" src="' + video_src + '" allowfullscreen frameborder="0"></iframe>', data, 1)
  445. else:
  446. break
  447. # 인용문 구현
  448. while 1:
  449. block = re.search('(\n(?:&gt; ?(?:(?:(?!\n).)+)?\n)+)', data)
  450. if block:
  451. block = block.groups()[0]
  452. block = re.sub('^\n&gt; ?', '', block)
  453. block = re.sub('\n&gt; ?', '\n', block)
  454. block = re.sub('\n$', '', block)
  455. data = re.sub('(\n(?:&gt; ?(?:(?:(?!\n).)+)?\n)+)', '\n<blockquote>' + block + '</blockquote>\n', data, 1)
  456. else:
  457. break
  458. # 리스트 구현
  459. while 1:
  460. li = re.search('(\n(?:(?: *)\* ?(?:(?:(?!\n).)+)\n)+)', data)
  461. if li:
  462. li = li.groups()[0]
  463. while 1:
  464. sub_li = re.search('\n(?:( *)\* ?((?:(?!\n).)+))', li)
  465. if sub_li:
  466. sub_li = sub_li.groups()
  467. # 앞의 공백 만큼 margin 먹임
  468. if len(sub_li[0]) == 0:
  469. margin = 20
  470. else:
  471. margin = len(sub_li[0]) * 20
  472. li = re.sub('\n(?:( *)\* ?((?:(?!\n).)+))', '<li style="margin-left: ' + str(margin) + 'px;">' + sub_li[1] + '</li>', li, 1)
  473. else:
  474. break
  475. data = re.sub('(\n(?:(?: *)\* ?(?:(?:(?!\n).)+)\n)+)', '\n\n<ul>' + li + '</ul>\n', data, 1)
  476. else:
  477. break
  478. # 들여쓰기 구현
  479. while 1:
  480. indent = re.search('\n( +)', data)
  481. if indent:
  482. indent = len(indent.groups()[0])
  483. # 앞에 공백 만큼 margin 먹임
  484. margin = '<span style="margin-left: 20px;"></span>' * indent
  485. data = re.sub('\n( +)', '\n' + margin, data, 1)
  486. else:
  487. break
  488. # 표 처리
  489. while 1:
  490. table = re.search('\n((?:(?:(?:(?:\|\|)+(?:(?:(?!\|\|).(?:\n)*)*))+)\|\|(?:\n)?)+)', data)
  491. if table:
  492. table = table.groups()[0]
  493. # return [all_table, row_style, cel_style, row, cel, table_class, num]
  494. while 1:
  495. all_table = re.search('^((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*((?:(?!\|\||<\/td>).)*\n*)', table)
  496. if all_table:
  497. all_table = all_table.groups()
  498. return_table = table_parser(all_table[1], all_table[2], all_table[0])
  499. number = return_table[6]
  500. table = re.sub('^((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*', '\n<table ' + return_table[5] + ' ' + return_table[0] + '><tbody><tr ' + return_table[1] + '><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>\n', table, 1)
  501. else:
  502. break
  503. table = re.sub('\|\|\n$', '</td></tr></tbody></table>', table)
  504. while 1:
  505. row_table = re.search('\|\|\n((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*((?:(?!\|\||<\/td>).)*\n*)', table)
  506. if row_table:
  507. row_table = row_table.groups()
  508. return_table = table_parser(row_table[1], row_table[2], row_table[0], number)
  509. table = re.sub('\|\|\n((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*', '</td></tr><tr ' + return_table[1] + '><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  510. else:
  511. break
  512. while 1:
  513. cel_table = re.search('((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*((?:(?:(?!\|\||<\/td>).)|\n)*\n*)', table)
  514. if cel_table:
  515. cel_table = cel_table.groups()
  516. return_table = table_parser(cel_table[1], re.sub('\n', ' ', cel_table[2]), cel_table[0], number)
  517. table = re.sub('((?:\|\|)+)((?:&lt;(?:(?:(?!&gt;).)+)&gt;)*)\n*', '</td><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  518. else:
  519. break
  520. data = re.sub('\n((?:(?:(?:(?:\|\|)+(?:(?:(?!\|\|).(?:\n)*)*))+)\|\|(?:\n)?)+)', table, data, 1)
  521. else:
  522. break
  523. # 하위 문서
  524. while 1:
  525. under_link = re.search('\[\[\.\.\/(?:\|((?:(?!]]).)+))?]]', data)
  526. if under_link:
  527. under_link = under_link.groups()
  528. title_data = re.search('^(.+)\/(?:(?:(?!\/).)+)$', title)
  529. if title_data:
  530. title_data = title_data.groups()[0]
  531. if under_link[0]:
  532. data = re.sub('\[\[\.\.\/(?:\|((?:(?!]]).)+))?]]', '[[' + title_data + '|' + under_link[0] + ']]', data, 1)
  533. else:
  534. data = re.sub('\[\[\.\.\/(?:\|((?:(?!]]).)+))?]]', '[[' + title_data + ']]', data, 1)
  535. else:
  536. if under_link[0]:
  537. data = re.sub('\[\[\.\.\/(?:\|((?:(?!]]).)+))?]]', '[[' + title + '|' + under_link[0] + ']]', data, 1)
  538. else:
  539. data = re.sub('\[\[\.\.\/(?:\|((?:(?!]]).)+))?]]', '[[' + title + ']]', data, 1)
  540. else:
  541. break
  542. # 링크 관련 문법 구현
  543. category = '\n<hr><div id="cate">분류: '
  544. while 1:
  545. link = re.search('\[\[((?:(?!\[\[|\]\]).)+)\]\]', data)
  546. if link:
  547. link = link.groups()[0]
  548. link_split = re.search('((?:(?!\|).)+)(?:\|((?:(?!\|).)+))', link)
  549. if link_split:
  550. link_split = link_split.groups()
  551. main_link = link_split[0]
  552. see_link = link_split[1]
  553. else:
  554. main_link = link
  555. see_link = link
  556. if re.search('^(파일|외부):', main_link):
  557. file_style = ''
  558. width = re.search('width=((?:(?!&).)+)', see_link)
  559. if width:
  560. file_width = width.groups()[0]
  561. if re.search('px$', file_width):
  562. file_style += 'width: ' + file_width + ';'
  563. else:
  564. file_style += 'width: ' + file_width + 'px;'
  565. height = re.search('height=((?:(?!&).)+)', see_link)
  566. if height:
  567. file_height = height.groups()[0]
  568. if re.search('px$', file_height):
  569. file_style += 'height: ' + file_height + ';'
  570. else:
  571. file_style += 'height: ' + file_height + 'px;'
  572. align = re.search('align=((?:(?!&).)+)', see_link)
  573. if align:
  574. file_align = align.groups()[0]
  575. if file_align == 'center':
  576. file_align = 'display: block; text-align: center;'
  577. else:
  578. file_align = 'float: ' + file_align + ';'
  579. else:
  580. file_align = ''
  581. if re.search('^외부:', main_link):
  582. file_src = re.sub('^외부:', '', main_link)
  583. file_alt = main_link
  584. exist = 'Yes'
  585. else:
  586. file_data = re.search('^파일:((?:(?!\.).)+)\.(.+)$', main_link)
  587. if file_data:
  588. file_data = file_data.groups()
  589. file_name = file_data[0]
  590. file_end = file_data[1]
  591. backlink += [[title, main_link, 'file']]
  592. else:
  593. file_name = 'TEST'
  594. file_end = 'jpg'
  595. file_src = '/image/' + tool.sha224(file_name) + '.' + file_end
  596. file_alt = '파일:' + file_name + '.' + file_end
  597. curs.execute("select title from data where title = ?", [file_alt])
  598. exist = curs.fetchall()
  599. if exist:
  600. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<span style="' + file_align + '"><img style="' + file_style + '" alt="' + file_alt + '" src="' + file_src + '"></span>', data, 1)
  601. else:
  602. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="not_thing" href="/w/' + tool.url_pas(file_alt) + '">' + file_alt + '</a>', data, 1)
  603. elif re.search('^분류:', main_link):
  604. see_link = re.sub('#include', '', see_link)
  605. main_link = re.sub('#include', '', main_link)
  606. if re.search('#blur', main_link):
  607. see_link = '스포일러'
  608. link_id = 'id="inside"'
  609. main_link = re.sub('#blur', '', main_link)
  610. else:
  611. link_id = ''
  612. backlink += [[title, main_link, 'cat']]
  613. category += '<a ' + link_id + ' href="' + tool.url_pas(main_link) + '">' + re.sub('^분류:', '', see_link) + '</a> / '
  614. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '', data, 1)
  615. elif re.search('^wiki:', main_link):
  616. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="inside" href="/' + tool.url_pas(re.sub('^wiki:', '', main_link)) + '">' + see_link + '</a>', data, 1)
  617. elif re.search('^inter:((?:(?!:).)+):', main_link):
  618. inter_data = re.search('^inter:((?:(?!:).)+):((?:(?!\]\]|\|).)+)', main_link)
  619. inter_data = inter_data.groups()
  620. curs.execute('select link from inter where title = ?', [inter_data[0]])
  621. inter = curs.fetchall()
  622. if inter:
  623. if see_link != main_link:
  624. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="inside" href="' + inter[0][0] + inter_data[1] + '">' + inter_data[0] + ':' + see_link + '</a>', data, 1)
  625. else:
  626. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="inside" href="' + inter[0][0] + inter_data[1] + '">' + inter_data[0] + ':' + inter_data[1] + '</a>', data, 1)
  627. else:
  628. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '인터위키 정보 없음', data, 1)
  629. elif re.search('^\/', main_link):
  630. under_title = re.search('^(\/(?:.+))$', main_link)
  631. under_title = under_title.groups()[0]
  632. if see_link != main_link:
  633. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '[[' + title + under_title + '|' + see_link + ']]', data, 1)
  634. else:
  635. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '[[' + title + under_title + ']]', data, 1)
  636. elif re.search('^http(s)?:\/\/', main_link):
  637. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a id="out_link" rel="nofollow" href="' + main_link + '">' + see_link + '</a>', data, 1)
  638. else:
  639. return_link = link_fix(main_link)
  640. main_link = return_link[0]
  641. other_link = return_link[1]
  642. if main_link != title:
  643. if main_link != '':
  644. curs.execute("select title from data where title = ?", [main_link])
  645. if not curs.fetchall():
  646. link_id = 'id="not_thing"'
  647. backlink += [[title, main_link, 'no']]
  648. else:
  649. link_id = ''
  650. backlink += [[title, main_link, '']]
  651. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a ' + link_id + ' href="/w/' + tool.url_pas(main_link) + other_link + '">' + see_link + '</a>', data, 1)
  652. else:
  653. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<a href="' + other_link + '">' + see_link + '</a>', data, 1)
  654. else:
  655. data = re.sub('\[\[((?:(?!\[\[|\]\]).)+)\]\]', '<b>' + see_link + '</b>', data, 1)
  656. else:
  657. break
  658. # 각주 처리
  659. footnote_number = 0
  660. footnote_all = '\n<hr><ul id="footnote_data">'
  661. footnote_dict = {}
  662. while 1:
  663. footnote = re.search('(?:\[\*((?:(?! |\]).)*)(?: ((?:(?!\]).)+))?\]|(\[각주\]))', data)
  664. if footnote:
  665. footnote_data = footnote.groups()
  666. if footnote_data[2]:
  667. footnote_all += '</ul>'
  668. data = re.sub('(?:\[\*((?:(?! ).)*) ((?:(?!\]).)+)\]|(\[각주\]))', footnote_all, data, 1)
  669. footnote_all = '\n<hr><ul id="footnote_data">'
  670. else:
  671. footnote = footnote_data[1]
  672. footnote_name = footnote_data[0]
  673. if footnote_name and not footnote:
  674. data = re.sub('(?:\[\*((?:(?! |\]).)*)(?: ((?:(?!\]).)+))?\]|(\[각주\]))', '<sup><a href="#fn-' + footnote_dict[footnote_name] + '" id="rfn-' + footnote_dict[footnote_name] + '">(' + footnote_name + ')</a></sup>', data, 1)
  675. else:
  676. footnote_number += 1
  677. if not footnote_name:
  678. footnote_name = str(footnote_number)
  679. else:
  680. footnote_dict.update({ footnote_name : str(footnote_number) })
  681. footnote_all += '<li><a href="#rfn-' + str(footnote_number) + '" id="fn-' + str(footnote_number) + '">(' + footnote_name + ')</a> ' + footnote + '</li>'
  682. data = re.sub('(?:\[\*((?:(?! |\]).)*)(?: ((?:(?!\]).)+))?\]|(\[각주\]))', '<sup><a href="#fn-' + str(footnote_number) + '" id="rfn-' + str(footnote_number) + '">(' + footnote_name + ')</a></sup>', data, 1)
  683. else:
  684. break
  685. data = re.sub('\n+$', '', data)
  686. footnote_all += '</ul>'
  687. if footnote_all == '\n<hr><ul id="footnote_data"></ul>':
  688. footnote_all = ''
  689. data = re.sub('\n$', footnote_all, data + '\n', 1)
  690. # 분류 마지막 처리
  691. category += '</div>'
  692. category = re.sub(' / <\/div>$', '</div>', category)
  693. if category == '\n<hr><div id="cate">분류: </div>':
  694. category = ''
  695. data += category
  696. # NoWiki 마지막 처리
  697. for re_data in end_data:
  698. data = data.replace('<span id="' + re_data[0] + '"></span>', re_data[1])
  699. data = data.replace(tool.url_pas('<span id="' + re_data[0] + '"></span>'), tool.url_pas(re_data[1]))
  700. # 마지막 처리
  701. data = re.sub('(?P<in><\/h[0-9]>)(\n)+', '\g<in>', data)
  702. data = re.sub('\n\n<ul>', '\n<ul>', data)
  703. data = re.sub('<\/ul>\n\n', '</ul>\n', data)
  704. data = re.sub('^(\n)+', '', data)
  705. data = re.sub('(\n)+<hr><ul id="footnote_data">', '<hr><ul id="footnote_data">', data)
  706. data = re.sub('(?P<in><td(((?!>).)*)>)\n', '\g<in>', data)
  707. data = re.sub('(\n)?<hr>(\n)?', '<hr>', data)
  708. data = re.sub('<\/ul>\n\n<ul>', '</ul>\n<ul>', data)
  709. data = re.sub("\[br\]", '\n', data)
  710. data = re.sub('\n', '<br>', data)
  711. return [data, plus_data, backlink]