2024-08-28 15:16:50 +08:00
|
|
|
|
import re
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class Header:
|
|
|
|
|
@staticmethod
|
|
|
|
|
def header(text: str) -> str:
|
|
|
|
|
"""
|
|
|
|
|
渲染标题
|
|
|
|
|
:param text: 原始文本
|
|
|
|
|
:return: 处理后的文本
|
|
|
|
|
"""
|
|
|
|
|
h6 = re.sub(r'###### (.*?)\n', r'<h6>\1</h6>\n', text) # H6
|
|
|
|
|
h5 = re.sub(r'##### (.*?)\n', r'<h5>\1</h5>\n', h6) # H5
|
|
|
|
|
h4 = re.sub(r'#### (.*?)\n', r'<h4>\1</h4>\n', h5) # H4
|
|
|
|
|
h3 = re.sub(r'### (.*?)\n', r'<h3>\1</h3>\n', h4) # H3
|
|
|
|
|
h2 = re.sub(r'## (.*?)\n', r'<h2>\1</h2>\n', h3) # H2
|
|
|
|
|
h1 = re.sub(r'# (.*?)\n', r'<h1>\1</h1>\n', h2) # H1
|
|
|
|
|
return h1
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class Style:
|
|
|
|
|
"""
|
|
|
|
|
渲染字体样式
|
|
|
|
|
"""
|
2024-08-29 12:36:57 +08:00
|
|
|
|
|
2024-08-28 15:16:50 +08:00
|
|
|
|
def __init__(self, text: str):
|
|
|
|
|
"""
|
|
|
|
|
初始化
|
|
|
|
|
:param text: cd文本
|
|
|
|
|
"""
|
|
|
|
|
self.text = text
|
|
|
|
|
|
|
|
|
|
def italic(self):
|
|
|
|
|
"""
|
|
|
|
|
斜体
|
|
|
|
|
:return:
|
|
|
|
|
"""
|
2024-08-29 12:36:57 +08:00
|
|
|
|
self.text = re.sub(r'\*([^*\n]+)\*', r'<i>\1</i>', self.text)
|
2024-08-28 15:16:50 +08:00
|
|
|
|
|
|
|
|
|
def bold(self):
|
|
|
|
|
"""
|
|
|
|
|
粗体
|
|
|
|
|
:return:
|
|
|
|
|
"""
|
2024-08-29 12:36:57 +08:00
|
|
|
|
self.text = re.sub(r'\*\*([^*\n]+)\*\*', r'<b>\1</b>', self.text)
|
2024-08-28 15:16:50 +08:00
|
|
|
|
|
|
|
|
|
def underline(self):
|
|
|
|
|
"""
|
|
|
|
|
下划线
|
|
|
|
|
:return:
|
|
|
|
|
"""
|
2024-08-29 12:36:57 +08:00
|
|
|
|
self.text = re.sub(r'~([^~\n]+)~', r'<u>\1</u>', self.text)
|
2024-08-28 15:16:50 +08:00
|
|
|
|
|
|
|
|
|
def strikethrough(self):
|
|
|
|
|
"""
|
|
|
|
|
删除线
|
|
|
|
|
:return:
|
|
|
|
|
"""
|
2024-08-29 12:36:57 +08:00
|
|
|
|
self.text = re.sub(r'~~([^~\n]+)~~', r'<s>\1</s>', self.text)
|
2024-08-28 15:16:50 +08:00
|
|
|
|
|
|
|
|
|
def highlight(self):
|
|
|
|
|
"""
|
|
|
|
|
高亮
|
|
|
|
|
:return:
|
|
|
|
|
"""
|
2024-08-29 12:36:57 +08:00
|
|
|
|
self.text = re.sub(r'==([^=\n]+)==', r'<mark>\1</mark>', self.text)
|
2024-08-28 15:16:50 +08:00
|
|
|
|
|
|
|
|
|
def __call__(self, *args, **kwargs):
|
|
|
|
|
"""
|
|
|
|
|
一键运行
|
|
|
|
|
:param args:
|
|
|
|
|
:param kwargs:
|
|
|
|
|
:return:
|
|
|
|
|
"""
|
|
|
|
|
self.bold()
|
|
|
|
|
self.italic()
|
|
|
|
|
self.strikethrough()
|
|
|
|
|
self.underline()
|
|
|
|
|
self.highlight()
|
|
|
|
|
return self.text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class Function:
|
|
|
|
|
"""
|
|
|
|
|
添加特殊功能
|
|
|
|
|
"""
|
|
|
|
|
|
|
|
|
|
def __init__(self, text: str):
|
|
|
|
|
"""
|
|
|
|
|
初始化
|
|
|
|
|
:param text: cd文本
|
|
|
|
|
"""
|
|
|
|
|
self.text = text
|
|
|
|
|
|
|
|
|
|
def link(self):
|
2024-08-29 12:36:57 +08:00
|
|
|
|
self.text = re.sub(r'\[([^\[\]\n]+)]\(([^()\n]+)\)', r'<a href="\2">\1</a>', self.text)
|
2024-08-28 15:16:50 +08:00
|
|
|
|
|
|
|
|
|
def __call__(self, *args, **kwargs):
|
|
|
|
|
"""
|
|
|
|
|
一键运行
|
|
|
|
|
:param args:
|
|
|
|
|
:param kwargs:
|
|
|
|
|
:return:
|
|
|
|
|
"""
|
|
|
|
|
self.link()
|
|
|
|
|
return self.text
|
|
|
|
|
|
|
|
|
|
|
2024-08-29 12:36:57 +08:00
|
|
|
|
class Value:
|
|
|
|
|
def __init__(self, text: str):
|
|
|
|
|
self.text = text
|
|
|
|
|
self.values = {
|
|
|
|
|
key: value for key, value in re.findall(r'\[([^]]+)]: (.+?)(?=\n|$)', text)
|
|
|
|
|
} # 从text中提取所有变量并转换成字典
|
|
|
|
|
|
|
|
|
|
def __call__(self, *args, **kwargs):
|
|
|
|
|
"""
|
|
|
|
|
将所有变量赋值并移除变量定义
|
|
|
|
|
:param args:
|
|
|
|
|
:param kwargs:
|
|
|
|
|
:return: 赋值后的正文
|
|
|
|
|
"""
|
|
|
|
|
text = self.text
|
|
|
|
|
for k, v in self.values.items():
|
|
|
|
|
text = re.sub(fr'\[([^]]+)]\({k}\)', fr'[\1]({v})', text)
|
|
|
|
|
text = re.sub(fr'\[{k}]: (.+?)(?=\n|$)', '', text)
|
|
|
|
|
return text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class CodeBlock:
|
|
|
|
|
def __init__(self, text: str):
|
2024-08-29 16:36:37 +08:00
|
|
|
|
"""
|
|
|
|
|
找出代码块并移除代码标识
|
|
|
|
|
:param text: 输入的文本
|
|
|
|
|
"""
|
|
|
|
|
self.codes = [i for i in re.findall(r'`([^`]*)`', text) if i != ''] # 找出代码快
|
|
|
|
|
self.text = re.sub(r'``', '', text) # 移除代码标识`
|
2024-08-29 12:36:57 +08:00
|
|
|
|
|
|
|
|
|
def __call__(self, *args, **kwargs):
|
2024-08-29 16:36:37 +08:00
|
|
|
|
"""
|
|
|
|
|
临时移除代码块
|
|
|
|
|
:param args:
|
|
|
|
|
:param kwargs:
|
|
|
|
|
:return: 不含代码的文本
|
|
|
|
|
"""
|
|
|
|
|
for index, item in enumerate(self.codes): # 替换代码块为-@@-(ID)-@@-
|
|
|
|
|
self.text = re.sub(fr'`{re.escape(item)}`', f'-@@-{index}-@@-', self.text) # 同时转译特殊字符
|
|
|
|
|
return self.text
|
2024-08-29 12:36:57 +08:00
|
|
|
|
|
2024-08-29 16:36:37 +08:00
|
|
|
|
def rendering(self):
|
|
|
|
|
"""
|
|
|
|
|
渲染代码
|
|
|
|
|
:return:
|
|
|
|
|
"""
|
|
|
|
|
for index, code in enumerate(self.codes):
|
|
|
|
|
if re.search(r'\n', code): # 是多行代码
|
|
|
|
|
head = re.findall(r'(.*?)\n', code)[0]
|
|
|
|
|
if head == 'python':
|
|
|
|
|
pass
|
|
|
|
|
elif head == 'shell':
|
|
|
|
|
pass
|
|
|
|
|
else: # 是单行代码
|
|
|
|
|
self.codes[index] = f'\({code}\)'
|
|
|
|
|
|
|
|
|
|
def restore(self, new_text: str):
|
|
|
|
|
"""
|
|
|
|
|
将渲染好的代码重新放回处理好的正文
|
|
|
|
|
:param new_text: 处理好的正文
|
|
|
|
|
:return: 加上代码的文章
|
|
|
|
|
"""
|
|
|
|
|
for index, item in enumerate(self.codes):
|
|
|
|
|
new_text = re.sub(fr'-@@-{index}-@@-', f'{item}', new_text, flags=re.DOTALL)
|
|
|
|
|
return new_text
|
2024-08-29 12:39:59 +08:00
|
|
|
|
|
2024-08-29 12:36:57 +08:00
|
|
|
|
|
2024-08-28 15:16:50 +08:00
|
|
|
|
class Basic:
|
2024-08-29 12:36:57 +08:00
|
|
|
|
@staticmethod
|
|
|
|
|
def paragraph(text: str):
|
2024-08-29 17:36:08 +08:00
|
|
|
|
text = '\n'.join(['-' + line + '-' for line in original_string.splitlines()])
|
2024-08-29 16:36:37 +08:00
|
|
|
|
return re.sub(r'(<.+?>.*?<.+?>)\n', r'<p>\1</p>\n', text)
|
2024-08-28 15:16:50 +08:00
|
|
|
|
|
|
|
|
|
|
2024-08-29 12:36:57 +08:00
|
|
|
|
def add_indent_to_string(input_string: str, indent_spaces: int = 4):
|
|
|
|
|
"""
|
|
|
|
|
给字符串中的每一行前面加上缩进。
|
|
|
|
|
:param input_string: 原始字符串,可以包含多行。
|
|
|
|
|
:param indent_spaces: 每行前面要添加的空格数,默认为4。
|
|
|
|
|
|
|
|
|
|
:return: 带缩进的新字符串。
|
|
|
|
|
"""
|
|
|
|
|
# 使用字符串的splitlines()方法分割原始字符串为行列表
|
|
|
|
|
lines = input_string.splitlines()
|
|
|
|
|
|
|
|
|
|
# 遍历行列表,给每行前面加上相应的缩进,并重新组合成字符串
|
|
|
|
|
indented_string = "\n".join(f"{' ' * indent_spaces}{line}" for line in lines)
|
|
|
|
|
|
|
|
|
|
return indented_string
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def body(text: str) -> str:
|
|
|
|
|
"""
|
|
|
|
|
渲染正文部分
|
|
|
|
|
:param text: 输入正文
|
|
|
|
|
:return: 输出渲染后的正文
|
|
|
|
|
"""
|
|
|
|
|
text = Value(text)() # 提取变量并赋值到文本中
|
2024-08-28 15:16:50 +08:00
|
|
|
|
text = Header.header(text) # 渲染标题
|
2024-08-29 12:36:57 +08:00
|
|
|
|
text = Style(text)() # 渲染字体样式
|
|
|
|
|
text = Function(text)() # 渲染特殊功能
|
2024-08-29 16:36:37 +08:00
|
|
|
|
text = Basic.paragraph(text)
|
2024-08-28 15:16:50 +08:00
|
|
|
|
|
|
|
|
|
# text = Basic.paragraph(text) # 渲染段落
|
|
|
|
|
return text
|
|
|
|
|
|
|
|
|
|
|
2024-08-29 12:36:57 +08:00
|
|
|
|
def main(origen: str):
|
|
|
|
|
# 预处理
|
2024-08-29 16:36:37 +08:00
|
|
|
|
code_block = CodeBlock(origen) # 获取代码内容
|
|
|
|
|
text = code_block() # 暂时移除代码
|
|
|
|
|
code_block.rendering() # 渲染代码
|
|
|
|
|
# 处理正文
|
|
|
|
|
return code_block.restore(body(text)) # 放回代码
|
2024-08-29 12:36:57 +08:00
|
|
|
|
#
|
|
|
|
|
|
|
|
|
|
|
2024-08-28 15:16:50 +08:00
|
|
|
|
if __name__ == '__main__':
|
|
|
|
|
with open('test.md', encoding='utf-8') as test:
|
2024-08-29 12:39:59 +08:00
|
|
|
|
cd = main(test.read())
|
2024-08-28 15:16:50 +08:00
|
|
|
|
with open('test.html', 'w', encoding='utf-8') as html:
|
2024-08-29 12:36:57 +08:00
|
|
|
|
html.write(f"""<!DOCTYPE html>
|
|
|
|
|
<html lang="zh-CN">
|
|
|
|
|
<head>
|
|
|
|
|
<meta charset="UTF-8">
|
|
|
|
|
<meta name="viewport" content="width=device-width, initial-scale=1.0">
|
|
|
|
|
<title>UTF-8编码示例</title>
|
2024-08-29 16:36:37 +08:00
|
|
|
|
<script type="text/javascript" async
|
|
|
|
|
src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.7/MathJax.js?config=TeX-MML-AM_CHTML">
|
|
|
|
|
</script>
|
2024-08-29 12:36:57 +08:00
|
|
|
|
<!-- 可以在这里添加其他元数据和CSS链接 -->
|
|
|
|
|
</head>
|
|
|
|
|
<body>
|
|
|
|
|
{add_indent_to_string(cd, 4)}
|
|
|
|
|
</body>
|
|
|
|
|
</html>
|
2024-08-29 12:39:59 +08:00
|
|
|
|
""")
|