start.py 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319
  1. from . import tool
  2. import re
  3. def table_parser(data, cel_data, start_data, num = 0):
  4. table_class = 'class="'
  5. all_table = 'style="'
  6. cel_style = 'style="'
  7. row_style = 'style="'
  8. row = ''
  9. cel = ''
  10. table_width = re.search("<table ?width=((?:(?!>).)*)>", data)
  11. if table_width:
  12. all_table += 'width: ' + table_width.groups()[0] + ';'
  13. table_height = re.search("<table ?height=((?:(?!>).)*)>", data)
  14. if table_height:
  15. all_table += 'height: ' + table_height.groups()[0] + ';'
  16. table_align = re.search("<table ?align=((?:(?!>).)*)>", data)
  17. if table_align:
  18. if table_align.groups()[0] == 'right':
  19. all_table += 'float: right;'
  20. elif table_align.groups()[0] == 'center':
  21. all_table += 'margin: auto;'
  22. table_text_align = re.search("<table ?textalign=((?:(?!>).)*)>", data)
  23. if table_text_align:
  24. num = 1
  25. if table_text_align.groups()[0] == 'right':
  26. all_table += 'text-align: right;'
  27. elif table_text_align.groups()[0] == 'center':
  28. all_table += 'text-align: center;'
  29. row_t_a = re.search("<row ?textalign=((?:(?!>).)*)>", data)
  30. if row_t_a:
  31. if row_t_a.groups()[0] == 'right':
  32. row_style += 'text-align: right;'
  33. elif row_t_a.groups()[0] == 'center':
  34. row_style += 'text-align: center;'
  35. else:
  36. row_style += 'text-align: left;'
  37. table_cel = re.search("<-((?:(?!>).)*)>", data)
  38. if table_cel:
  39. cel = 'colspan="' + table_cel.groups()[0] + '"'
  40. else:
  41. cel = 'colspan="' + str(round(len(start_data) / 2)) + '"'
  42. table_row = re.search("<\|((?:(?!>).)*)>", data)
  43. if table_row:
  44. row = 'rowspan="' + table_row.groups()[0] + '"'
  45. row_bgcolor = re.search("<rowbgcolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  46. if row_bgcolor:
  47. row_style += 'background: ' + row_bgcolor.groups()[0] + ';'
  48. table_border = re.search("<table ?bordercolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  49. if table_border:
  50. all_table += 'border: ' + table_border.groups()[0] + ' 2px solid;'
  51. table_bgcolor = re.search("<table ?bgcolor=(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  52. if table_bgcolor:
  53. all_table += 'background: ' + table_bgcolor.groups()[0] + ';'
  54. bgcolor = re.search("<(?:bgcolor=)?(#(?:[0-9a-f-A-F]{3}){1,2}|\w+)>", data)
  55. if bgcolor:
  56. cel_style += 'background: ' + bgcolor.groups()[0] + ';'
  57. cel_width = re.search("<width=((?:(?!>).)*)>", data)
  58. if cel_width:
  59. cel_style += 'width: ' + cel_width.groups()[0] + ';'
  60. cel_height = re.search("<height=((?:(?!>).)*)>", data)
  61. if cel_height:
  62. cel_style += 'height: ' + cel_height.groups()[0] + ';'
  63. text_right = re.search("<\)>", data)
  64. text_center = re.search("<:>", data)
  65. text_left = re.search("<\(>", data)
  66. if text_right:
  67. cel_style += 'text-align: right;'
  68. elif text_center:
  69. cel_style += 'text-align: center;'
  70. elif text_left:
  71. cel_style += 'text-align: left;'
  72. elif num == 0:
  73. if re.search('^ (.*) $', cel_data):
  74. cel_style += 'text-align: center;'
  75. elif re.search('^ (.*)$', cel_data):
  76. cel_style += 'text-align: right;'
  77. elif re.search('^(.*) $', cel_data):
  78. cel_style += 'text-align: left;'
  79. text_class = re.search("<table ?class=((?:(?!>).)+)>", data)
  80. if text_class:
  81. table_class += text_class.groups()[0]
  82. all_table += '"'
  83. cel_style += '"'
  84. row_style += '"'
  85. table_class += '"'
  86. return [all_table, row_style, cel_style, row, cel, table_class, num]
  87. def start(conn, data, title):
  88. # DB 지정
  89. curs = conn.cursor()
  90. # 맨 앞과 끝에 개행 문자 추가
  91. data = '\r\n' + data + '\r\n'
  92. while 1:
  93. include = re.search('\[include\(((?:(?!\)\]).)+)\)\]', data)
  94. if include:
  95. include = include.groups()[0]
  96. curs.execute("select data from data where title = ?", [include])
  97. include_data = curs.fetchall()
  98. if include_data:
  99. data = re.sub('\[include\(((?:(?!\)\]).)+)\)\]', '\r\n' + include_data[0][0] + '\r\n', data, 1)
  100. else:
  101. data = re.sub('\[include\(((?:(?!\)\]).)+)\)\]', '[[' + include + ']]', data, 1)
  102. else:
  103. break
  104. # 텍스트 꾸미기 문법
  105. data = re.sub('\'\'\'(?P<in>(?:(?!\'\'\').)+)\'\'\'', '<b>\g<in></b>', data)
  106. data = re.sub('\'\'(?P<in>(?:(?!\'\').)+)\'\'', '<i>\g<in></i>', data)
  107. data = re.sub('~~(?P<in>(?:(?!~~).)+)~~', '<s>\g<in></s>', data)
  108. data = re.sub('--(?P<in>(?:(?!~~).)+)--', '<s>\g<in></s>', data)
  109. data = re.sub('__(?P<in>(?:(?!__).)+)__', '<u>\g<in></u>', data)
  110. data = re.sub('^^(?P<in>(?:(?!^^).)+)^^', '<sup>\g<in></sup>', data)
  111. data = re.sub(',,(?P<in>(?:(?!,,).)+),,', '<sub>\g<in></sub>', data)
  112. # 넘겨주기 변환
  113. data = re.sub('\r\n#(?:redirect|넘겨주기) (?P<in>(?:(?!\r\n).)+)\r\n', '<meta http-equiv="refresh" content="0; url=/w/\g<in>?froms=' + tool.url_pas(title) + '">', data)
  114. # [목차(없음)] 처리
  115. if not re.search('\[목차\(없음\)\]\r\n', data):
  116. if not re.search('\[목차\]', data):
  117. data = re.sub('\r\n(?P<in>={1,6}) ?(?P<out>(?:(?!=).)+) ?={1,6}\r\n', '\r\n[목차]\r\n\g<in> \g<out> \g<in>\r\n', data, 1)
  118. else:
  119. data = re.sub('\[목차\(없음\)\]\r\n', '', data)
  120. # 문단 문법
  121. toc_full = 0
  122. toc_top_stack = 6
  123. toc_stack = [0, 0, 0, 0, 0, 0]
  124. toc_data = '<div id="toc"><span style="font-size: 18px;">목차</span>\r\n\r\n'
  125. while 1:
  126. toc = re.search('\r\n(={1,6}) ?((?:(?!=).)+) ?={1,6}\r\n', data)
  127. if toc:
  128. toc = toc.groups()
  129. toc_number = len(toc[0])
  130. # 더 크면 그 전 스택은 초기화
  131. if toc_full > toc_number:
  132. for i in range(toc_number, 6):
  133. toc_stack[i] = 0
  134. if toc_top_stack > toc_number:
  135. toc_top_stack = toc_number
  136. toc_full = toc_number
  137. toc_stack[toc_number - 1] += 1
  138. toc_number = str(toc_number)
  139. all_stack = ''
  140. # 스택 합치기
  141. for i in range(0, 6):
  142. all_stack += str(toc_stack[i]) + '.'
  143. all_stack = re.sub('0.', '', all_stack)
  144. data = re.sub('\r\n(={1,6}) ?((?:(?!=).)+) ?={1,6}\r\n', '\r\n<h' + toc_number + '><a href="">' + all_stack + '</a> ' + toc[1] + '</h' + toc_number + '><hr id="under_bar" style="margin-top: -5px; margin-bottom: 10px;">\r\n', data, 1)
  145. toc_data += '<span style="margin-left: ' + str((toc_full - toc_top_stack) * 10) + 'px"><a href="">' + all_stack + '</a> ' + toc[1] + '</span>\r\n'
  146. else:
  147. break
  148. toc_data += '</div>'
  149. data = re.sub('\[목차\]', toc_data, data)
  150. while 1:
  151. hr = re.search('\r\n-{4,9}\r\n', data)
  152. if hr:
  153. data = re.sub('\r\n-{4,9}\r\n', '<hr>', data, 1)
  154. else:
  155. break
  156. # 리스트 구현
  157. while 1:
  158. li = re.search('(\r\n(?:(?: *)\* ?(?:(?:(?!\r\n).)+)\r\n)+)', data)
  159. if li:
  160. li = li.groups()[0]
  161. while 1:
  162. sub_li = re.search('\r\n(?:( *)\* ?((?:(?!\r\n).)+))', li)
  163. if sub_li:
  164. sub_li = sub_li.groups()
  165. # 앞의 공백 만큼 margin 먹임
  166. if len(sub_li[0]) == 0:
  167. margin = 20
  168. else:
  169. margin = len(sub_li[0]) * 20
  170. li = re.sub('\r\n(?:( *)\* ?((?:(?!\r\n).)+))', '<li style="margin-left: ' + str(margin) + 'px">' + sub_li[1] + '</li>', li, 1)
  171. else:
  172. break
  173. data = re.sub('(\r\n(?:(?: *)\* ?(?:(?:(?!\r\n).)+)\r\n)+)', '<ul>' + li + '</ul>\r\n', data, 1)
  174. else:
  175. break
  176. # 들여쓰기 구현
  177. while 1:
  178. indent = re.search('\r\n( +)', data)
  179. if indent:
  180. indent = len(indent.groups()[0])
  181. # 앞에 공백 만큼 margin 먹임
  182. margin = '<span style="margin-left: 20px;"></span>' * indent
  183. data = re.sub('\r\n( +)', '\r\n' + margin, data, 1)
  184. else:
  185. break
  186. # 표 처리
  187. while 1:
  188. table = re.search('((?:(?:(?:(?:\|\|)+(?:(?:(?!\|\|).(?:\r\n)*)+))+)\|\|(?:\r\n)?)+)', data)
  189. if table:
  190. table = table.groups()[0]
  191. # return [all_table, row_style, cel_style, row, cel, table_class, num]
  192. while 1:
  193. all_table = re.search('^((?:\|\|)+)((?:<(?:(?:(?!>).)+)>)*)((?:(?!\|\||<\/td>).)+)', table)
  194. if all_table:
  195. all_table = all_table.groups()
  196. return_table = table_parser(all_table[1], all_table[2], all_table[0])
  197. number = return_table[6]
  198. table = re.sub('^\|\|((?:<(?:(?:(?!>).)+)>)*)', '<table ' + return_table[5] + ' ' + return_table[0] + '><tbody><tr ' + return_table[1] + '><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  199. else:
  200. break
  201. table = re.sub('\|\|\r\n$', '</td></tr></tbody></table>', table)
  202. while 1:
  203. row_table = re.search('\|\|\r\n((?:\|\|)+)((?:<(?:(?:(?!>).)+)>)*)((?:(?!\|\||<\/td>).)+)', table)
  204. if row_table:
  205. row_table = row_table.groups()
  206. return_table = table_parser(row_table[1], row_table[2], row_table[0], number)
  207. table = re.sub('\|\|\r\n((?:\|\|)+)((?:<(?:(?:(?!>).)+)>)*)', '</td></tr><tr ' + return_table[1] + '><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  208. else:
  209. break
  210. while 1:
  211. cel_table = re.search('((?:\|\|)+)((?:<(?:(?:(?!>).)+)>)*)((?:(?!\|\||<\/td>).)+)', table)
  212. if cel_table:
  213. cel_table = cel_table.groups()
  214. return_table = table_parser(cel_table[1], cel_table[2], cel_table[0], number)
  215. table = re.sub('((?:\|\|)+)((?:<(?:(?:(?!>).)+)>)*)', '</td><td ' + return_table[2] + ' ' + return_table[3] + ' ' + return_table[4] + '>', table, 1)
  216. else:
  217. break
  218. data = re.sub('((?:(?:(?:(?:\|\|)+(?:(?:(?!\|\|).(?:\r\n)*)+))+)\|\|(?:\r\n)?)+)', table, data, 1)
  219. else:
  220. break
  221. while 1:
  222. link = re.search('\[\[((?:(?!\]\]).)+)\]\]', data)
  223. if link:
  224. link = link.groups()[0]
  225. link_split = re.search('((?:(?!\|).)+)(?:\|((?:(?!\|).)+))', link)
  226. if link_split:
  227. link_split = link_split.groups()
  228. main_link = link_split[0]
  229. see_link = link_split[1]
  230. else:
  231. main_link = link
  232. see_link = link
  233. if re.search('^wiki:', main_link):
  234. data = re.sub('\[\[((?:(?!\]\]).)+)\]\]', '<a id="inside" href="/' + tool.url_pas(main_link) + '">' + see_link + '</a>', data, 1)
  235. if re.search('^http(s)?:\/\/', main_link):
  236. data = re.sub('\[\[((?:(?!\]\]).)+)\]\]', '<a class="out_link" rel="nofollow" href="' + tool.url_pas(main_link) + '">' + see_link + '</a>', data, 1)
  237. else:
  238. if re.search('^:', main_link):
  239. main_link = re.sub('^:', '', main_link)
  240. curs.execute("select title from data where title = ?", [main_link])
  241. if not curs.fetchall():
  242. link_class = 'class="not_thing"'
  243. else:
  244. link_class = ''
  245. data = re.sub('\[\[((?:(?!\]\]).)+)\]\]', '<a ' + link_class + ' href="/w/' + tool.url_pas(main_link) + '">' + see_link + '</a>', data, 1)
  246. else:
  247. break
  248. # 마지막 처리
  249. data = re.sub('(?P<in><hr id="under_bar" style="margin-top: -5px; margin-bottom: 10px;">)\r\n', '\g<in>', data)
  250. data = re.sub('<\/ul>\r\n\r\n', '</ul>\r\n', data)
  251. data = re.sub('\r\n', '<br>', data)
  252. return data