import html import os import re import time from pathlib import Path import markdown from PIL import Image, ImageOps from modules.utils import get_available_chat_styles # This is to store the paths to the thumbnails of the profile pictures image_cache = {} with open(Path(__file__).resolve().parent / '../css/html_readable_style.css', 'r') as f: readable_css = f.read() with open(Path(__file__).resolve().parent / '../css/html_4chan_style.css', 'r') as css_f: _4chan_css = css_f.read() with open(Path(__file__).resolve().parent / '../css/html_instruct_style.css', 'r') as f: instruct_css = f.read() # Custom chat styles chat_styles = {} for k in get_available_chat_styles(): chat_styles[k] = open(Path(f'css/chat_style-{k}.css'), 'r').read() # Handle styles that derive from other styles for k in chat_styles: lines = chat_styles[k].split('\n') input_string = lines[0] match = re.search(r'chat_style-([a-z\-]*)\.css', input_string) if match: style = match.group(1) chat_styles[k] = chat_styles.get(style, '') + '\n\n' + '\n'.join(lines[1:]) def fix_newlines(string): string = string.replace('\n', '\n\n') string = re.sub(r"\n{3,}", "\n\n", string) string = string.strip() return string def replace_blockquote(m): return m.group().replace('\n', '\n> ').replace('\\begin{blockquote}', '').replace('\\end{blockquote}', '') def convert_to_markdown(string): # Blockquote string = re.sub(r'(^|[\n])>', r'\1>', string) pattern = re.compile(r'\\begin{blockquote}(.*?)\\end{blockquote}', re.DOTALL) string = pattern.sub(replace_blockquote, string) # Code string = string.replace('\\begin{code}', '```') string = string.replace('\\end{code}', '```') string = re.sub(r"(.)```", r"\1\n```", string) result = '' is_code = False for line in string.split('\n'): if line.lstrip(' ').startswith('```'): is_code = not is_code result += line if is_code or line.startswith('|'): # Don't add an extra \n for tables or code result += '\n' else: result += '\n\n' result = result.strip() if is_code: result += '\n```' # Unfinished code block # Unfinished list, like "\n1.". A |delete| string is added and then # removed to force a <ol> or <ul> to be generated instead of a <p>. if re.search(r'(\n\d+\.?|\n\*\s*)$', result): delete_str = '|delete|' if re.search(r'(\d+\.?)$', result) and not result.endswith('.'): result += '.' result = re.sub(r'(\n\d+\.?|\n\*\s*)$', r'\g<1> ' + delete_str, result) html_output = markdown.markdown(result, extensions=['fenced_code', 'tables']) pos = html_output.rfind(delete_str) if pos > -1: html_output = html_output[:pos] + html_output[pos + len(delete_str):] else: html_output = markdown.markdown(result, extensions=['fenced_code', 'tables']) # Unescape code blocks pattern = re.compile(r'<code[^>]*>(.*?)</code>', re.DOTALL) html_output = pattern.sub(lambda x: html.unescape(x.group()), html_output) return html_output def generate_basic_html(string): string = convert_to_markdown(string) string = f'<style>{readable_css}</style><div class="readable-container">{string}</div>' return string def process_post(post, c): t = post.split('\n') number = t[0].split(' ')[1] if len(t) > 1: src = '\n'.join(t[1:]) else: src = '' src = re.sub('>', '>', src) src = re.sub('(>>[0-9]*)', '<span class="quote">\\1</span>', src) src = re.sub('\n', '<br>\n', src) src = f'<blockquote class="message_4chan">{src}\n' src = f'<span class="name">Anonymous </span> <span class="number">No.{number}</span>\n{src}' return src def generate_4chan_html(f): posts = [] post = '' c = -2 for line in f.splitlines(): line += "\n" if line == '-----\n': continue elif line.startswith('--- '): c += 1 if post != '': src = process_post(post, c) posts.append(src) post = line else: post += line if post != '': src = process_post(post, c) posts.append(src) for i in range(len(posts)): if i == 0: posts[i] = f'<div class="op">{posts[i]}</div>\n' else: posts[i] = f'<div class="reply">{posts[i]}</div>\n' output = '' output += f'<style>{_4chan_css}</style><div id="parent"><div id="container">' for post in posts: output += post output += '</div></div>' output = output.split('\n') for i in range(len(output)): output[i] = re.sub(r'^(>(.*?)(<br>|</div>))', r'<span class="greentext">\1</span>', output[i]) output[i] = re.sub(r'^<blockquote class="message_4chan">(>(.*?)(<br>|</div>))', r'<blockquote class="message_4chan"><span class="greentext">\1</span>', output[i]) output = '\n'.join(output) return output def make_thumbnail(image): image = image.resize((350, round(image.size[1] / image.size[0] * 350)), Image.Resampling.LANCZOS) if image.size[1] > 470: image = ImageOps.fit(image, (350, 470), Image.LANCZOS) return image def get_image_cache(path): cache_folder = Path("cache") if not cache_folder.exists(): cache_folder.mkdir() mtime = os.stat(path).st_mtime if (path in image_cache and mtime != image_cache[path][0]) or (path not in image_cache): img = make_thumbnail(Image.open(path)) old_p = Path(f'cache/{path.name}_cache.png') p = Path(f'cache/cache_{path.name}.png') if old_p.exists(): old_p.rename(p) output_file = p img.convert('RGB').save(output_file, format='PNG') image_cache[path] = [mtime, output_file.as_posix()] return image_cache[path][1] def generate_instruct_html(history): output = f'<style>{instruct_css}</style><div class="chat" id="chat"><div class="messages">' for i, _row in enumerate(history): row = [convert_to_markdown(entry) for entry in _row] if row[0]: # don't display empty user messages output += f""" <div class="user-message"> <div class="text"> <div class="message-body"> {row[0]} </div> </div> </div> """ output += f""" <div class="assistant-message"> <div class="text"> <div class="message-body"> {row[1]} </div> </div> </div> """ output += "</div></div>" return output def generate_cai_chat_html(history, name1, name2, style, reset_cache=False): output = f'<style>{chat_styles[style]}</style><div class="chat" id="chat"><div class="messages">' # We use ?name2 and ?time.time() to force the browser to reset caches img_bot = f'<img src="file/cache/pfp_character.png?{name2}">' if Path("cache/pfp_character.png").exists() else '' img_me = f'<img src="file/cache/pfp_me.png?{time.time() if reset_cache else ""}">' if Path("cache/pfp_me.png").exists() else '' for i, _row in enumerate(history): row = [convert_to_markdown(entry) for entry in _row] if row[0]: # don't display empty user messages output += f""" <div class="message"> <div class="circle-you"> {img_me} </div> <div class="text"> <div class="username"> {name1} </div> <div class="message-body"> {row[0]} </div> </div> </div> """ output += f""" <div class="message"> <div class="circle-bot"> {img_bot} </div> <div class="text"> <div class="username"> {name2} </div> <div class="message-body"> {row[1]} </div> </div> </div> """ output += "</div></div>" return output def generate_chat_html(history, name1, name2, reset_cache=False): output = f'<style>{chat_styles["wpp"]}</style><div class="chat" id="chat"><div class="messages">' for i, _row in enumerate(history): row = [convert_to_markdown(entry) for entry in _row] if row[0]: # don't display empty user messages output += f""" <div class="message"> <div class="text-you"> <div class="message-body"> {row[0]} </div> </div> </div> """ output += f""" <div class="message"> <div class="text-bot"> <div class="message-body"> {row[1]} </div> </div> </div> """ output += "</div></div>" return output def chat_html_wrapper(history, name1, name2, mode, style, reset_cache=False): if mode == 'instruct': return generate_instruct_html(history['visible']) elif style == 'wpp': return generate_chat_html(history['visible'], name1, name2) else: return generate_cai_chat_html(history['visible'], name1, name2, style, reset_cache)