render.py 9.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233
  1. #!/usr/bin/env python3
  2. # -*- coding: UTF-8 -*-
  3. import os
  4. import base64
  5. import glob
  6. from pyquery import PyQuery
  7. import logging
  8. logger = logging.getLogger(__name__)
  9. LIB_PATH = os.path.dirname(os.path.abspath(__file__))
  10. STATIC_PATH = os.path.join(LIB_PATH, 'static')
  11. HTML_FILE = os.path.join(STATIC_PATH, 'TP_INDEX.html')
  12. TIME_HTML_FILE = os.path.join(STATIC_PATH, 'TP_TIME.html')
  13. FRIEND_AVATAR_CSS_FILE = os.path.join(STATIC_PATH, 'avatar.css.tpl')
  14. try:
  15. from csscompressor import compress as css_compress
  16. except ImportError:
  17. css_compress = lambda x: x
  18. from .msg import *
  19. from .common.textutil import ensure_unicode, get_file_b64
  20. from .common.progress import ProgressReporter
  21. from .common.timer import timing
  22. from .smiley import SmileyProvider
  23. from .msgslice import MessageSlicerByTime, MessageSlicerBySize
  24. TEMPLATES_FILES = {TYPE_MSG: "TP_MSG",
  25. TYPE_IMG: "TP_IMG",
  26. TYPE_SPEAK: "TP_SPEAK",
  27. TYPE_EMOJI: "TP_EMOJI",
  28. TYPE_CUSTOM_EMOJI: "TP_EMOJI",
  29. TYPE_LINK: "TP_MSG",
  30. TYPE_VIDEO_FILE: "TP_VIDEO_FILE"
  31. }
  32. TEMPLATES = {
  33. k: open(os.path.join(STATIC_PATH, '{}.html'.format(v))).read()
  34. for k, v in TEMPLATES_FILES.items()
  35. }
  36. class HTMLRender(object):
  37. def __init__(self, parser, res=None):
  38. self.html = ensure_unicode(open(HTML_FILE).read())
  39. self.time_html = open(TIME_HTML_FILE).read()
  40. self.parser = parser
  41. self.res = res
  42. assert self.res is not None, \
  43. "Resource Directory not given. Cannot render HTML."
  44. self.smiley = SmileyProvider()
  45. css_files = glob.glob(os.path.join(LIB_PATH, 'static/*.css'))
  46. self.css_string = [] # css to add
  47. for css in css_files:
  48. logger.info("Loading {}".format(os.path.basename(css)))
  49. css = ensure_unicode((open(css).read()))
  50. self.css_string.append(css)
  51. js_files = glob.glob(os.path.join(LIB_PATH, 'static/*.js'))
  52. # to load jquery before other js
  53. js_files = sorted(js_files, key=lambda f: 'jquery-latest' in f, reverse=True)
  54. self.js_string = []
  55. for js in js_files:
  56. logger.info("Loading {}".format(os.path.basename(js)))
  57. js = ensure_unicode(open(js).read())
  58. self.js_string.append(js)
  59. @property
  60. def all_css(self):
  61. # call after processing all messages,
  62. # because smiley css need to be included only when necessary
  63. def process(css):
  64. css = css_compress(css)
  65. return u'<style type="text/css">{}</style>'.format(css)
  66. if hasattr(self, 'final_css'):
  67. return self.final_css + process(self.smiley.gen_used_smiley_css())
  68. self.final_css = u"\n".join(map(process, self.css_string))
  69. return self.final_css + process(self.smiley.gen_used_smiley_css())
  70. @property
  71. def all_js(self):
  72. if hasattr(self, 'final_js'):
  73. return self.final_js
  74. def process(js):
  75. # TODO: add js compress
  76. return u'<script type="text/javascript">{}</script>'.format(js)
  77. self.final_js = u"\n".join(map(process, self.js_string))
  78. return self.final_js
  79. #@timing(total=True)
  80. def render_msg(self, msg):
  81. """ render a message, return the html block"""
  82. # TODO for chatroom, add nickname on avatar
  83. sender = u'you ' + msg.talker if not msg.isSend else 'me'
  84. format_dict = {'sender_label': sender,
  85. 'time': msg.createTime }
  86. if(not msg.isSend and msg.is_chatroom()):
  87. format_dict['nickname'] = '>\n <pre align=\'left\'>'+msg.talker_nickname+'</pre'
  88. else:
  89. format_dict['nickname'] = ' '
  90. def fallback():
  91. template = TEMPLATES[TYPE_MSG]
  92. content = msg.msg_str()
  93. format_dict['content'] = self.smiley.replace_smileycode(content)
  94. return template.format(**format_dict)
  95. template = TEMPLATES.get(msg.type)
  96. if msg.type == TYPE_SPEAK:
  97. audio_str, duration = self.res.get_voice_mp3(msg.imgPath)
  98. format_dict['voice_duration'] = duration
  99. format_dict['voice_str'] = audio_str
  100. return template.format(**format_dict)
  101. elif msg.type == TYPE_IMG:
  102. # imgPath was original THUMBNAIL_DIRPATH://th_xxxxxxxxx
  103. imgpath = msg.imgPath.split('_')[-1]
  104. if not imgpath:
  105. logger.warn('No imgpath in an image message. Perhaps a bug in wechat.')
  106. return fallback()
  107. bigimgpath = self.parser.imginfo.get(msg.msgSvrId)
  108. fnames = [k for k in [imgpath, bigimgpath] if k]
  109. img = self.res.get_img(fnames)
  110. if not img:
  111. logger.warn("No image thumbnail found for {}".format(imgpath))
  112. return fallback()
  113. # TODO do not show fancybox when no bigimg found
  114. format_dict['img'] = (img, 'jpeg')
  115. return template.format(**format_dict)
  116. elif msg.type == TYPE_EMOJI or msg.type == TYPE_CUSTOM_EMOJI:
  117. if 'emoticonmd5' in msg.content:
  118. pq = PyQuery(msg.content)
  119. md5 = pq('emoticonmd5').text()
  120. else:
  121. md5 = msg.imgPath
  122. # TODO md5 could exist in both.
  123. # first is emoji md5, second is image2/ md5
  124. # can use fallback here.
  125. if md5:
  126. emoji_img, format = self.res.get_emoji_by_md5(md5)
  127. format_dict['emoji_format'] = format
  128. format_dict['emoji_img'] = emoji_img
  129. else:
  130. import IPython as IP; IP.embed()
  131. return template.format(**format_dict)
  132. elif msg.type == TYPE_LINK:
  133. content = msg.msg_str()
  134. # TODO show a short link with long href, if link too long
  135. if content.startswith(u'URL:'):
  136. url = content[4:]
  137. content = u'URL:<a target="_blank" href="{0}">{0}</a>'.format(url)
  138. format_dict['content'] = content
  139. return template.format(**format_dict)
  140. elif msg.type == TYPE_VIDEO_FILE:
  141. video = self.res.get_video(msg.imgPath)
  142. if video.endswith(".mp4"):
  143. video_str = get_file_b64(video)
  144. format_dict["video_str"] = video_str
  145. return template.format(**format_dict)
  146. elif video.endswith(".jpg"):
  147. # only has thumbnail
  148. image_str = get_file_b64(video)
  149. format_dict["img"] = (image_str, 'jpeg')
  150. return TEMPLATES[TYPE_IMG].format(**format_dict)
  151. # fallback
  152. format_dict['content'] = f"VIDEO FILE {msg.imgPath}"
  153. return TEMPLATES_FILES[TYPE_MSG].format(**format_dict)
  154. elif msg.type == TYPE_WX_VIDEO:
  155. # TODO: fetch video from resource
  156. return fallback()
  157. return fallback()
  158. def _render_partial_msgs(self, msgs):
  159. """ return single html"""
  160. self.smiley.reset()
  161. slicer = MessageSlicerByTime()
  162. slices = slicer.slice(msgs)
  163. blocks = []
  164. for idx, slice in enumerate(slices):
  165. nowtime = slice[0].createTime
  166. if idx == 0 or \
  167. slices[idx - 1][0].createTime.date() != nowtime.date():
  168. timestr = nowtime.strftime("%m/%d %H:%M:%S")
  169. else:
  170. timestr = nowtime.strftime("%H:%M:%S")
  171. blocks.append(self.time_html.format(time=timestr))
  172. blocks.extend([self.render_msg(m) for m in slice])
  173. self.prgs.trigger(len(slice))
  174. # string operation is extremely slow
  175. return self.html.format(extra_css=self.all_css,
  176. extra_js=self.all_js,
  177. chat=msgs[0].chat_nickname,
  178. messages=u''.join(blocks)
  179. )
  180. def prepare_avatar_css(self, talkers):
  181. avatar_tpl= ensure_unicode(open(FRIEND_AVATAR_CSS_FILE).read())
  182. my_avatar = self.res.get_avatar(self.parser.username)
  183. css = avatar_tpl.format(name='me', avatar=my_avatar)
  184. for talker in talkers:
  185. avatar = self.res.get_avatar(talker)
  186. css += avatar_tpl.format(name=talker, avatar=avatar)
  187. self.css_string.append(css)
  188. def render_msgs(self, msgs):
  189. """ render msgs of one chat, return a list of html"""
  190. if msgs[0].is_chatroom():
  191. talkers = set([m.talker for m in msgs])
  192. else:
  193. talkers = set([msgs[0].talker])
  194. self.prepare_avatar_css(talkers)
  195. self.res.cache_voice_mp3(msgs)
  196. chat = msgs[0].chat_nickname
  197. logger.info(u"Rendering {} messages of {}".format(
  198. len(msgs), chat))
  199. self.prgs = ProgressReporter("Render", total=len(msgs))
  200. slice_by_size = MessageSlicerBySize().slice(msgs)
  201. ret = [self._render_partial_msgs(s) for s in slice_by_size]
  202. self.prgs.finish()
  203. return ret
  204. if __name__ == '__main__':
  205. r = HTMLRender()
  206. with open('/tmp/a.html', 'w') as f:
  207. print >> f, r.html.format(style=r.css, talker='talker',
  208. messages='haha')