Spaces:
Runtime error
Runtime error
File size: 4,160 Bytes
2c076ca a5044c6 2c076ca a5044c6 2c076ca a5044c6 2c076ca d8fdbeb 2c076ca a5044c6 d8fdbeb a5044c6 2c076ca a5044c6 2c076ca 8ac92f5 2c076ca a5044c6 2c076ca b2ac83c f85bdb1 2c076ca a5044c6 2c076ca |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 |
import gradio as gr
import re
import os
import subprocess
import argparse
def remove_color_codes(text):
color_pattern = re.compile(r'\x1b\[\d+m')
clean_text = re.sub(color_pattern, '', text)
return clean_text
def to_html(document):
lines = document.split('\n')
formatted_lines = []
for line in lines:
if line.startswith("Error"):
formatted_line = f'<span style="color: red;">{line}</span>'
elif line.startswith("Warning"):
formatted_line = f'<span style="color: yellow;">{line}</span>'
elif line.startswith("Parsing Error:"):
formatted_line = f'<span style="color: yellow;">{line}</span>'
elif line == "All Clear!":
formatted_line = f'<span style="color: green;">{line}</span>'
else:
formatted_line = line
formatted_lines.append(formatted_line)
formatted_document = '<br>'.join(formatted_lines)
return formatted_document
def add_images(file_name):
html = '<div align="center">'
for file in os.listdir("."):
if file.startswith(f"errors-{file_name}") and file.endswith(".png"):
html += f'<img src="file/{file}">'
html += '</div>'
return html
def clear_cached_images(file_name):
for file in os.listdir("."):
if file.startswith(f"errors-{file_name}") and file.endswith(".png"):
os.remove(file)
def get_filename(file):
file_name = os.path.basename(file).split(".")[0]
if "_" in file_name:
# apparently aclpubcheck doesn't like underscores in filenames
file_name = file_name.split("_")[0]
return file_name
def upload_file(file, paper_type):
file_name_cmd = file.name.replace(" ", "\ ")
file_name = get_filename(file.name)
clear_cached_images(file_name)
command = f"python3 aclpubcheck-main/aclpubcheck/formatchecker.py --paper_type {paper_type} {file_name_cmd}"
out = subprocess.run(command, shell=True, stdout=subprocess.PIPE, text=True, stderr=subprocess.STDOUT)
return to_html(remove_color_codes(out.stdout)) + add_images(file_name)
with gr.Blocks() as demo:
header = """
<div align="center">
<img src="https://upload.wikimedia.org/wikipedia/en/thumb/7/72/Association_for_Computational_Linguistics_logo.svg/2880px-Association_for_Computational_Linguistics_logo.svg.png" alt="acl-logo" width=100px/>
<h1>ACL Pubcheck Tool</h1>
</div>
"""
gr.HTML(header)
gr.Markdown("Drop or upload your paper here to have it checked for [*ACL conferences](https://www.aclweb.org/) guidelines.")
dropdown = gr.Dropdown(
["long", "short", "demo", "other"], label="Paper type", value="long"
)
file_output = gr.File(file_types=[".pdf"])
button = gr.Button("Check your PDF!", variant="primary")
out = gr.HTML()
gr.Markdown(
"This graphical interface is using the official [aclpubcheck tool](https://github.com/acl-org/aclpubcheck). Check the [Github repo for more information.](https://github.com/teelinsan/aclpubcheck-gui)")
gr.Markdown(
"No data is collected. If you prefer you can also duplicate this Space to run it privately. [![Duplicate Space](https://img.shields.io/badge/-Duplicate%20Space-blue?labelColor=white&style=flat&logo=&logoWidth=14)](https://huggingface.co/spaces/teelinsan/aclpubcheck?duplicate=true)")
button.click(upload_file, [file_output, dropdown], out)
if __name__ == '__main__':
parser = argparse.ArgumentParser()
parser.add_argument('--host', default="0.0.0.0", type=str)
parser.add_argument('--port', default=7860, type=int)
args = parser.parse_args()
demo.launch(server_name=args.host, server_port=args.port)
|