mirror of
https://github.com/kuhyx/WUT_Computer_Science.git
synced 2026-07-04 17:03:12 +02:00
333 lines
11 KiB
Python
333 lines
11 KiB
Python
"""
|
|
Program for converting Latex files into html files
|
|
"""
|
|
|
|
|
|
def command_name_check(latex_string, command_name):
|
|
if latex_string[1: (len(command_name) + 1)] != command_name:
|
|
print(latex_string + "Error! command misspeled!")
|
|
return "Error!"
|
|
return
|
|
|
|
|
|
def generic_checks(latex_string):
|
|
if latex_string == "":
|
|
print(latex_string + "Error! No input given to function")
|
|
return "Error!"
|
|
if "}" not in latex_string:
|
|
print(latex_string + "Error! curly bracket not closed!")
|
|
return "Error!"
|
|
return
|
|
|
|
|
|
def generic_checks_command(latex_string):
|
|
if generic_checks(latex_string) == "Error!":
|
|
return "Error!"
|
|
if latex_string[0] != "\\":
|
|
print(latex_string + "Error! has no slash at begining")
|
|
return "Error!"
|
|
return
|
|
|
|
|
|
def document_class(latex_string):
|
|
r"""
|
|
Converts LaTeX documentclass method to html
|
|
\documentclass{article}
|
|
"""
|
|
if generic_checks_command(latex_string) == "Error!":
|
|
return "Error!"
|
|
if latex_string[len("\\documentclass{") - 1] != "{":
|
|
print(latex_string + "Error! curly bracket not opened!")
|
|
return "Error!"
|
|
if command_name_check(latex_string, "documentclass") == "Error!":
|
|
return "Error!"
|
|
document_type = latex_string[len(
|
|
"\\documentclass{"): (len(latex_string) - 1)]
|
|
return "<!DOCTYPE html>"
|
|
|
|
|
|
def begin_document(latex_string):
|
|
r"""
|
|
Converts LaTeX begin document method to html
|
|
\begin{document}
|
|
"""
|
|
if generic_checks_command(latex_string) == "Error!":
|
|
return "Error!"
|
|
if command_name_check(latex_string, "begin") == "Error!":
|
|
return "Error!"
|
|
return "<html>"
|
|
|
|
|
|
def begin_tabular(latex_string):
|
|
r"""
|
|
Checks if LaTeX begin tabular method is correct
|
|
"""
|
|
if generic_checks_command(latex_string) == "Error!":
|
|
return "Error!"
|
|
if command_name_check(latex_string, "begin") == "Error!":
|
|
return "Error!"
|
|
return "<table>"
|
|
|
|
|
|
def tabular_parameters(latex_string):
|
|
r"""
|
|
Checks if LaTeX tabular environment has any parameters
|
|
"""
|
|
if latex_string == "":
|
|
return ""
|
|
if latex_string == "[]":
|
|
return ""
|
|
return "Error!"
|
|
|
|
|
|
def only_pipes_and_space(latex_string):
|
|
"""Checks if latex string only contains | or " ", if yes returns True, if no returns false"""
|
|
return all(char == '|' or char == ' ' or char == '{' or char == '}' for char in latex_string)
|
|
|
|
|
|
def main_tabular_parameters_loop(latex_string, simple_parameters_dictionary):
|
|
return_array = []
|
|
i = 0
|
|
latex_string_length = len(latex_string)
|
|
while i < latex_string_length:
|
|
character = latex_string[i]
|
|
if character in ['l', 'c', 'r', '|']:
|
|
return_array.append(
|
|
simple_parameters_dictionary.get(latex_string[i]))
|
|
i += 1
|
|
continue
|
|
if character in ['p', 'm', 'b']:
|
|
closing_bracket = latex_string.find('}', i + 1)
|
|
columns_string = latex_string[i:closing_bracket + 1]
|
|
result = tabular_columns_parameters(columns_string)
|
|
if result == "Error!":
|
|
return result
|
|
return_array.append(result)
|
|
i = closing_bracket
|
|
continue
|
|
i += 1
|
|
return return_array
|
|
|
|
|
|
def tabular_required_parameters(latex_string):
|
|
if generic_checks(latex_string) == "Error!":
|
|
return "Error!"
|
|
if latex_string == "{}":
|
|
print("tabular_required_parameters, required table parameters are empty!:", latex_string)
|
|
return "Error!"
|
|
simple_parameters_dictionary = {
|
|
"l": "align='left'",
|
|
"c": "align='center'",
|
|
"r": "align='right'",
|
|
"|": "style='border-left: 1px solid black'"
|
|
}
|
|
if only_pipes_and_space(latex_string):
|
|
print("tabular_required_parameters, required table parameters are only pipes and spaces!:", latex_string)
|
|
return "Error!"
|
|
return main_tabular_parameters_loop(latex_string, simple_parameters_dictionary)
|
|
|
|
|
|
def length_conversions(latex_length):
|
|
length_dictionary = {
|
|
"pt": [1.3, "px"],
|
|
|
|
"mm": [1, "mm"],
|
|
|
|
"cm": [1, "cm"],
|
|
|
|
"in": [1, "in"],
|
|
|
|
"ex": [1, "ex"],
|
|
|
|
"em": [1, "em"],
|
|
}
|
|
return length_dictionary.get(latex_length, "Error!")
|
|
|
|
|
|
def tabular_columns_parameters(latex_string):
|
|
if generic_checks(latex_string) == "Error!":
|
|
return "Error!"
|
|
parameter_dictionary = {
|
|
"p": "vertical-align: top;",
|
|
"m": "vertical-align: middle;",
|
|
"b": "vertical-align: bottom;"
|
|
}
|
|
vertical_align_type = parameter_dictionary.get(latex_string[0], "Error!")
|
|
if vertical_align_type == "Error!":
|
|
print("tabular_columns_parameters, unknown parameter: ",
|
|
latex_string[0])
|
|
return "Error!"
|
|
if latex_string[1] != '{':
|
|
print(
|
|
"tabular_columns_parameters, parameter length does not start with {", latex_string)
|
|
return "Error!"
|
|
length_parameter_with_bracket = latex_string.partition("{")[2]
|
|
length_parameter = length_parameter_with_bracket.partition("}")[0]
|
|
length_value = ""
|
|
i = 0
|
|
for character in length_parameter:
|
|
if character.isalpha():
|
|
break
|
|
length_value += character
|
|
i += 1
|
|
length_unit = length_parameter[i:]
|
|
conversed_unit = length_conversions(length_unit)
|
|
if conversed_unit == "Error!":
|
|
print("tabular_columns_parameters, Unit could not be conversed!", latex_string)
|
|
return "Error!"
|
|
final_length = round(float(length_value) * conversed_unit[0], 2)
|
|
return_string = "style='" + vertical_align_type + \
|
|
" width: " + str(final_length) + conversed_unit[1] + ";'"
|
|
return return_string
|
|
|
|
|
|
def split_rows(latex_string):
|
|
double_backslash = "\\"
|
|
rows = latex_string.split(double_backslash)
|
|
return rows
|
|
|
|
|
|
def split_columns(table_row, column_count):
|
|
columns = table_row.split("&")
|
|
if len(columns) != column_count and columns != ['']:
|
|
|
|
return "Error!"
|
|
return columns
|
|
|
|
|
|
def translate_column(latex_column):
|
|
hline_string_literal = "\hline"
|
|
replaced_hline = latex_column.replace(hline_string_literal, "<hr>")
|
|
replaced_newline = replaced_hline.replace('\newline', "<br>")
|
|
return replaced_newline
|
|
|
|
|
|
def translate_inside_to_html(latex_table_inside, column_style):
|
|
return_string = "<html> <table>"
|
|
column_amount = 0
|
|
line_string = "style='border-left: 1px solid black'"
|
|
for style in column_style:
|
|
if style != line_string:
|
|
column_amount += 1
|
|
rows = split_rows(latex_table_inside)
|
|
for row in rows:
|
|
return_string += "<tr>"
|
|
|
|
columns = split_columns(row, column_amount)
|
|
column_number = 0
|
|
for column in columns:
|
|
return_string += "<td "
|
|
current_style = column_style[column_number]
|
|
while current_style == line_string:
|
|
return_string += line_string
|
|
column_number += 1
|
|
current_style = column_style[column_number]
|
|
|
|
return_string += column_style[column_number] + ">"
|
|
return_string += translate_column(column)
|
|
column_number += 1
|
|
return_string += "</td>"
|
|
|
|
return_string += "</tr>"
|
|
return_string += " </table> </html>"
|
|
return return_string
|
|
|
|
|
|
def read_file(tex_filename):
|
|
tex_file = open(tex_filename, "r")
|
|
data = tex_file.read().replace('\n', '')
|
|
tex_file.close()
|
|
return data
|
|
|
|
|
|
def read_document_class(latex_full_string):
|
|
document_class_index = latex_full_string.find("\documentclass")
|
|
if document_class_index == -1:
|
|
print("Main function error! documentclass not found")
|
|
return "Error!"
|
|
document_class_close_bracket = latex_full_string.find(
|
|
"}", document_class_index)
|
|
document_class_string = latex_full_string[document_class_index:document_class_close_bracket + 1]
|
|
latex_full_string = latex_full_string[document_class_close_bracket + 1:len(
|
|
latex_full_string) - 1]
|
|
return document_class(document_class_string), latex_full_string
|
|
|
|
|
|
def read_begin_document(latex_full_string):
|
|
begin_document_index = latex_full_string.find(r"\begin{document}")
|
|
if begin_document_index == -1:
|
|
print("read_begin_document error! begin{document not found")
|
|
return "Error!", latex_full_string
|
|
begin_document_close_bracket = latex_full_string.find(
|
|
"}", begin_document_index)
|
|
begin_document_string = latex_full_string[begin_document_index:begin_document_close_bracket + 1]
|
|
latex_full_string = latex_full_string[begin_document_close_bracket + 1:len(
|
|
latex_full_string) - 1]
|
|
return_string = begin_document(begin_document_string)
|
|
return return_string, latex_full_string
|
|
|
|
|
|
def read_start(html_string, data):
|
|
document_class_result, data = read_document_class(data)
|
|
if document_class_result == "Error!":
|
|
return "Error!", data
|
|
html_string += document_class_result
|
|
|
|
begin_document_results, data = read_begin_document(data)
|
|
if begin_document_results == "Error!":
|
|
return "Error!", data
|
|
html_string += begin_document_results
|
|
return html_string, data
|
|
|
|
|
|
def handle_table_whole(html_string, data, table_start, table_end):
|
|
if table_start == -1 or table_end == -1:
|
|
return html_string, data
|
|
tabular_begin_string = r"\begin{tabular}"
|
|
tabular_end_string = r"\end{tabular}"
|
|
|
|
table_part = data[table_start:table_end+len(tabular_end_string)]
|
|
parameters_start_index = data.find(
|
|
"{", table_start + len(tabular_begin_string))
|
|
|
|
parameters_end_index = data.find("}", parameters_start_index)
|
|
parameters_string = data[parameters_start_index:parameters_end_index+1]
|
|
parameters_array = tabular_required_parameters(parameters_string)
|
|
inside_table = data[parameters_end_index+1:table_end]
|
|
html_string += translate_inside_to_html(inside_table, parameters_array)
|
|
return html_string
|
|
|
|
|
|
def handle_insides(html_string, data):
|
|
tabular_index = 0
|
|
tabular_end_string = r"\end{tabular}"
|
|
while tabular_index != -1:
|
|
tabular_index_start = data.find(r"\begin{tabular}", 0)
|
|
tabular_index_end = data.find(tabular_end_string, tabular_index_start)
|
|
if tabular_index_start == -1 or tabular_index_end == -1:
|
|
return html_string, data
|
|
html_string += data[0:tabular_index_start]
|
|
|
|
html_string = handle_table_whole(html_string, data,
|
|
tabular_index_start, tabular_index_end)
|
|
data = data[tabular_index_end + len(tabular_end_string):len(data)]
|
|
tabular_index = tabular_index_end
|
|
return html_string, data
|
|
|
|
|
|
def main_function():
|
|
tex_filename = "texfile.tex"
|
|
data = read_file(tex_filename)
|
|
html_string = ""
|
|
html_string, data = read_start(html_string, data)
|
|
if html_string == "Error!":
|
|
print("main_function error! when reading documentclass or begin document")
|
|
return "Error"
|
|
html_string, data = handle_insides(html_string, data)
|
|
|
|
return html_string
|
|
|
|
|
|
if __name__ == "__main__":
|
|
print(main_function())
|