File size: 4,160 Bytes
2c076ca
 
a5044c6
2c076ca
 
 
a5044c6
2c076ca
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
a5044c6
 
 
 
 
 
 
 
 
 
 
 
2c076ca
d8fdbeb
 
 
 
 
 
 
2c076ca
a5044c6
d8fdbeb
a5044c6
 
2c076ca
a5044c6
2c076ca
 
 
 
 
 
 
 
 
 
8ac92f5
2c076ca
a5044c6
 
2c076ca
 
 
 
b2ac83c
 
f85bdb1
2c076ca
a5044c6
2c076ca
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
import gradio as gr
import re
import os
import subprocess
import argparse


def remove_color_codes(text):
    color_pattern = re.compile(r'\x1b\[\d+m')
    clean_text = re.sub(color_pattern, '', text)
    return clean_text


def to_html(document):
    lines = document.split('\n')
    formatted_lines = []

    for line in lines:
        if line.startswith("Error"):
            formatted_line = f'<span style="color: red;">{line}</span>'
        elif line.startswith("Warning"):
            formatted_line = f'<span style="color: yellow;">{line}</span>'
        elif line.startswith("Parsing Error:"):
            formatted_line = f'<span style="color: yellow;">{line}</span>'
        elif line == "All Clear!":
            formatted_line = f'<span style="color: green;">{line}</span>'
        else:
            formatted_line = line

        formatted_lines.append(formatted_line)

    formatted_document = '<br>'.join(formatted_lines)
    return formatted_document

def add_images(file_name):
    html = '<div align="center">'
    for file in os.listdir("."):
        if file.startswith(f"errors-{file_name}") and file.endswith(".png"):
            html += f'<img src="file/{file}">'
    html += '</div>'
    return html

def clear_cached_images(file_name):
    for file in os.listdir("."):
        if file.startswith(f"errors-{file_name}") and file.endswith(".png"):
            os.remove(file)

def get_filename(file):
    file_name = os.path.basename(file).split(".")[0]
    if "_" in file_name:
        # apparently aclpubcheck doesn't like underscores in filenames
        file_name = file_name.split("_")[0]
    return file_name

def upload_file(file, paper_type):
    file_name_cmd = file.name.replace(" ", "\ ")
    file_name = get_filename(file.name)
    clear_cached_images(file_name)
    command = f"python3 aclpubcheck-main/aclpubcheck/formatchecker.py --paper_type {paper_type} {file_name_cmd}"
    out = subprocess.run(command, shell=True, stdout=subprocess.PIPE, text=True, stderr=subprocess.STDOUT)
    return to_html(remove_color_codes(out.stdout)) + add_images(file_name)


with gr.Blocks() as demo:
    header = """
        <div align="center">
        <img src="https://upload.wikimedia.org/wikipedia/en/thumb/7/72/Association_for_Computational_Linguistics_logo.svg/2880px-Association_for_Computational_Linguistics_logo.svg.png" alt="acl-logo" width=100px/>
        <h1>ACL Pubcheck Tool</h1>
        </div>
    """
    gr.HTML(header)
    gr.Markdown("Drop or upload your paper here to have it checked for [*ACL conferences](https://www.aclweb.org/) guidelines.")
    dropdown = gr.Dropdown(
        ["long", "short", "demo", "other"], label="Paper type", value="long"
    )
    file_output = gr.File(file_types=[".pdf"])
    button = gr.Button("Check your PDF!", variant="primary")
    out = gr.HTML()
    gr.Markdown(
        "This graphical interface is using the official [aclpubcheck tool](https://github.com/acl-org/aclpubcheck). Check the [Github repo for more information.](https://github.com/teelinsan/aclpubcheck-gui)")
    gr.Markdown(
        "No data is collected. If you prefer you can also duplicate this Space to run it privately. [![Duplicate Space](https://img.shields.io/badge/-Duplicate%20Space-blue?labelColor=white&style=flat&logo=&logoWidth=14)](https://huggingface.co/spaces/teelinsan/aclpubcheck?duplicate=true)")

    button.click(upload_file, [file_output, dropdown], out)

if __name__ == '__main__':
    parser = argparse.ArgumentParser()
    parser.add_argument('--host', default="0.0.0.0", type=str)
    parser.add_argument('--port', default=7860, type=int)
    args = parser.parse_args()

    demo.launch(server_name=args.host, server_port=args.port)