text-generation-webui/modules/html_generator.py

166 lines
5.1 KiB
Python
Raw Normal View History

2023-01-07 02:14:08 +00:00
'''
This is a library for formatting text outputs as nice HTML.
'''
2023-02-23 17:41:42 +00:00
import html
import os
import re
from pathlib import Path

import markdown
from PIL import Image
# Maps the path of a profile picture to [mtime, thumbnail path] so that a
# thumbnail is only regenerated when the source image changes.
image_cache = {}

# The stylesheets are read once at import time and inlined into the generated
# HTML. The encoding is explicit so decoding does not depend on the platform's
# locale (the default for open() without an encoding argument).
_css_dir = Path(__file__).resolve().parent / '../css'
readable_css = (_css_dir / 'html_readable_style.css').read_text(encoding='utf-8')
_4chan_css = (_css_dir / 'html_4chan_style.css').read_text(encoding='utf-8')
cai_css = (_css_dir / 'html_cai_style.css').read_text(encoding='utf-8')
2023-03-15 15:33:26 +00:00
2023-03-17 19:06:11 +00:00
def fix_newlines(string):
    """Normalize line breaks so that every break becomes one blank line.

    Each newline is doubled, runs of three or more newlines are collapsed
    back to exactly two, and surrounding whitespace is stripped.
    """
    doubled = string.replace('\n', '\n\n')
    collapsed = re.sub(r"\n{3,}", "\n\n", doubled)
    return collapsed.strip()
# This could probably be generalized and improved
def convert_to_markdown(string):
    """Convert text containing a few LaTeX-style tags into rendered HTML.

    The code/blockquote tags are rewritten to their Markdown equivalents,
    every code fence is pushed onto its own line, newlines are normalized
    with fix_newlines, and the result is rendered by the markdown package
    with the fenced_code extension.
    """
    # Applied in this order; each pair is (LaTeX-style tag, Markdown token).
    tag_replacements = (
        ('\\begin{code}', '```'),
        ('\\end{code}', '```'),
        ('\\begin{blockquote}', '> '),
        ('\\end{blockquote}', ''),
    )
    for latex_tag, markdown_token in tag_replacements:
        string = string.replace(latex_tag, markdown_token)

    # Insert a line break before any fence that directly follows a character.
    string = re.sub(r"(.)```", r"\1\n```", string)
    normalized = fix_newlines(string)
    return markdown.markdown(normalized, extensions=['fenced_code'])
def generate_basic_html(string):
    """Render *string* as Markdown and wrap it in the "readable" page style.

    Returns a single HTML string: an inline <style> element holding
    readable_css followed by a ``container`` div with the rendered text.
    """
    rendered = convert_to_markdown(string)
    return f'<style>{readable_css}</style><div class="container">{rendered}</div>'
2023-01-15 19:43:31 +00:00
2023-01-07 02:14:08 +00:00
def process_post(post, c):
    """Render one raw 4chan-style post as an HTML fragment.

    Args:
        post: Raw text of the post. The first line is treated as the header;
            the post number is its second space-separated field (for
            example ``--- 1234``). The remaining lines are the message body.
        c: Unused; kept so that existing callers keep working.

    Returns:
        An HTML string with the poster name, the post number and an opening
        ``<blockquote class="message">`` holding the escaped body. The
        blockquote is left unclosed, exactly as before.
    """
    header, *body_lines = post.split('\n')

    # A header without a second field used to raise IndexError (e.g. text
    # appearing before the first "--- " line); fall back to an empty number.
    header_fields = header.split(' ')
    number = header_fields[1] if len(header_fields) > 1 else ''

    # Escape &, < and > so generated text cannot inject markup. The quote and
    # greentext handling keys on the resulting "&gt;" entities.
    src = html.escape('\n'.join(body_lines), quote=False)
    src = re.sub('(&gt;&gt;[0-9]*)', '<span class="quote">\\1</span>', src)
    src = src.replace('\n', '<br>\n')

    return (
        f'<span class="name">Anonymous </span> <span class="number">No.{html.escape(number)}</span>\n'
        f'<blockquote class="message">{src}\n'
    )
2023-01-11 04:10:11 +00:00
def generate_4chan_html(f):
    """Render a raw 4chan-style thread dump as styled HTML.

    Lines equal to ``-----`` are skipped, a line starting with ``--- ``
    begins a new post, and every other line is appended to the current
    post. The first post is wrapped as the "op" and the rest as replies.
    Finally, output lines that start with an escaped ``>`` are wrapped in a
    "greentext" span.
    """
    posts = []
    current_post = ''
    c = -2
    for raw_line in f.splitlines():
        line = raw_line + "\n"
        if line == '-----\n':
            continue
        if line.startswith('--- '):
            c += 1
            # A new header closes the post collected so far.
            if current_post != '':
                posts.append(process_post(current_post, c))
            current_post = line
        else:
            current_post += line
    if current_post != '':
        posts.append(process_post(current_post, c))

    wrapped_posts = []
    for index, post_html in enumerate(posts):
        css_class = 'op' if index == 0 else 'reply'
        wrapped_posts.append(f'<div class="{css_class}">{post_html}</div>\n')

    output = (
        f'<style>{_4chan_css}</style><div id="parent"><div id="container">'
        + ''.join(wrapped_posts)
        + '</div></div>'
    )

    # Greentext either starts the line or directly follows the opening
    # blockquote of a post; both patterns are applied to every line in turn.
    line_start = re.compile(r'^(&gt;(.*?)(<br>|</div>))')
    after_blockquote = re.compile(r'^<blockquote class="message">(&gt;(.*?)(<br>|</div>))')
    highlighted = []
    for html_line in output.split('\n'):
        html_line = line_start.sub(r'<span class="greentext">\1</span>', html_line)
        html_line = after_blockquote.sub(
            r'<blockquote class="message"><span class="greentext">\1</span>', html_line
        )
        highlighted.append(html_line)
    return '\n'.join(highlighted)
def get_image_cache(path):
    """Return the path of a cached thumbnail for the image at *path*.

    The thumbnail is (re)generated when *path* has no cache entry yet or
    when its modification time differs from the one recorded in
    image_cache.

    Args:
        path: pathlib.Path of the source image.

    Returns:
        The POSIX-style path of the PNG thumbnail inside the ``cache``
        folder, relative to the current working directory.
    """
    cache_folder = Path("cache")
    # exist_ok avoids the race between checking for the folder and creating it.
    cache_folder.mkdir(exist_ok=True)

    mtime = os.stat(path).st_mtime
    cached = image_cache.get(path)
    if cached is None or cached[0] != mtime:
        output_file = cache_folder / f'{path.name}_cache.png'
        # The context manager closes the source file handle once the
        # thumbnail has been written.
        with Image.open(path) as img:
            img.thumbnail((200, 200))
            img.convert('RGB').save(output_file, format='PNG')
        image_cache[path] = [mtime, output_file.as_posix()]

    return image_cache[path][1]
def load_html_image(paths):
    """Return an <img> tag for the first path in *paths* that exists.

    The tag points at the cached thumbnail produced by get_image_cache.
    An empty string is returned when none of the paths exists.
    """
    existing = (candidate for candidate in map(Path, paths) if candidate.exists())
    first_found = next(existing, None)
    if first_found is None:
        return ''
    return f'<img src="file/{get_image_cache(first_found)}">'
def generate_chat_html(history, name1, name2, character):
    """Render a chat history as HTML, newest exchange first.

    Args:
        history: Sequence of rows; index 0 of a row is the user's message
            and index 1 is the bot's reply.
        name1: Display name shown above the user's messages.
        name2: Display name shown above the bot's messages.
        character: Character name used to look up
            ``characters/<character>.png|jpg|jpeg`` as the bot picture
            before falling back to ``img_bot.*``.

    Returns:
        One HTML string: an inline <style> element with cai_css followed
        by a ``chat`` div holding one message block per reply/message.
    """
    def render_message(circle_class, image_html, username, body_html):
        # One message block; the bot and user blocks differ only in these
        # four values.
        return (
            '\n'
            '<div class="message">\n'
            f'<div class="{circle_class}">\n'
            f'{image_html}\n'
            '</div>\n'
            '<div class="text">\n'
            '<div class="username">\n'
            f'{username}\n'
            '</div>\n'
            '<div class="message-body">\n'
            f'{body_html}\n'
            '</div>\n'
            '</div>\n'
            '</div>\n'
        )

    bot_candidates = [f"characters/{character}.{ext}" for ext in ['png', 'jpg', 'jpeg']]
    bot_candidates += ["img_bot.png", "img_bot.jpg", "img_bot.jpeg"]
    img_bot = load_html_image(bot_candidates)
    img_me = load_html_image(["img_me.png", "img_me.jpg", "img_me.jpeg"])

    chunks = [f'<style>{cai_css}</style><div class="chat" id="chat">']
    for _row in history[::-1]:
        row = [convert_to_markdown(entry) for entry in _row]
        # The bot's reply is emitted before the user's message of the same row.
        chunks.append(render_message('circle-bot', img_bot, name2, row[1]))
        if len(row[0]) != 0:  # don't display empty user messages
            chunks.append(render_message('circle-you', img_me, name1, row[0]))

    chunks.append("</div>")
    return ''.join(chunks)