Spaces:

NAACL2022
/

NAACL2022-papers

Sleeping

App Files Community

hysts HF staff committed on Jun 11, 2024

Commit

3f5d923

1 Parent(s): 6923bc1

Update

Browse files

Files changed (6) hide show

.pre-commit-config.yaml +59 -35
.style.yapf +0 -5
README.md +1 -1
app.py +26 -26
paper_list.py +37 -38
style.css +1 -4

.pre-commit-config.yaml CHANGED Viewed

@@ -1,36 +1,60 @@
 repos:
-- repo: https://github.com/pre-commit/pre-commit-hooks
-  rev: v4.2.0
-  hooks:
-  - id: check-executables-have-shebangs
-  - id: check-json
-  - id: check-merge-conflict
-  - id: check-shebang-scripts-are-executable
-  - id: check-toml
-  - id: check-yaml
-  - id: double-quote-string-fixer
-  - id: end-of-file-fixer
-  - id: mixed-line-ending
-    args: ['--fix=lf']
-  - id: requirements-txt-fixer
-  - id: trailing-whitespace
-- repo: https://github.com/myint/docformatter
-  rev: v1.4
-  hooks:
-  - id: docformatter
-    args: ['--in-place']
-- repo: https://github.com/pycqa/isort
-  rev: 5.12.0
-  hooks:
-    - id: isort
-- repo: https://github.com/pre-commit/mirrors-mypy
-  rev: v0.991
-  hooks:
-    - id: mypy
-      args: ['--ignore-missing-imports']
-      additional_dependencies: ['types-requests']
-- repo: https://github.com/google/yapf
-  rev: v0.32.0
-  hooks:
-  - id: yapf
-    args: ['--parallel', '--in-place']

 repos:
+  - repo: https://github.com/pre-commit/pre-commit-hooks
+    rev: v4.6.0
+    hooks:
+      - id: check-executables-have-shebangs
+      - id: check-json
+      - id: check-merge-conflict
+      - id: check-shebang-scripts-are-executable
+      - id: check-toml
+      - id: check-yaml
+      - id: end-of-file-fixer
+      - id: mixed-line-ending
+        args: ["--fix=lf"]
+      - id: requirements-txt-fixer
+      - id: trailing-whitespace
+  - repo: https://github.com/myint/docformatter
+    rev: v1.7.5
+    hooks:
+      - id: docformatter
+        args: ["--in-place"]
+  - repo: https://github.com/pycqa/isort
+    rev: 5.13.2
+    hooks:
+      - id: isort
+        args: ["--profile", "black"]
+  - repo: https://github.com/pre-commit/mirrors-mypy
+    rev: v1.10.0
+    hooks:
+      - id: mypy
+        args: ["--ignore-missing-imports"]
+        additional_dependencies:
+          [
+            "types-python-slugify",
+            "types-requests",
+            "types-PyYAML",
+            "types-pytz",
+          ]
+  - repo: https://github.com/psf/black
+    rev: 24.4.2
+    hooks:
+      - id: black
+        language_version: python3.10
+        args: ["--line-length", "119"]
+  - repo: https://github.com/kynan/nbstripout
+    rev: 0.7.1
+    hooks:
+      - id: nbstripout
+        args:
+          [
+            "--extra-keys",
+            "metadata.interpreter metadata.kernelspec cell.metadata.pycharm",
+          ]
+  - repo: https://github.com/nbQA-dev/nbQA
+    rev: 1.8.5
+    hooks:
+      - id: nbqa-black
+      - id: nbqa-pyupgrade
+        args: ["--py37-plus"]
+      - id: nbqa-isort
+        args: ["--float-to-top"]

.style.yapf DELETED Viewed

@@ -1,5 +0,0 @@
-[style]
-based_on_style = pep8
-blank_line_before_nested_class_or_def = false
-spaces_before_comment = 2
-split_before_logical_operator = true

README.md CHANGED Viewed

@@ -4,7 +4,7 @@ emoji: 🏢
 colorFrom: yellow
 colorTo: red
 sdk: gradio
-sdk_version: 3.36.1
 app_file: app.py
 pinned: false
 ---

 colorFrom: yellow
 colorTo: red
 sdk: gradio
+sdk_version: 4.36.1
 app_file: app.py
 pinned: false
 ---

app.py CHANGED Viewed

@@ -6,44 +6,44 @@ import gradio as gr
 from paper_list import PaperList
-DESCRIPTION = '# NAACL 2022 Papers'
-NOTES = '''
 - [NAACL 2022](https://2022.naacl.org/)
 - [NAACL'22 Reproducibility Track](https://naacl2022-reproducibility-track.github.io/results/)
-'''
 paper_list = PaperList()
-with gr.Blocks(css='style.css') as demo:
     gr.Markdown(DESCRIPTION)
     search_box = gr.Textbox(
-        label='Search Title',
-        placeholder=
-        'You can search for titles with regular expressions. e.g. (?<!sur)face'
     )
-    case_sensitive = gr.Checkbox(label='Case Sensitive')
-    filter_names = gr.CheckboxGroup(label='Filter',
-                                    choices=[
-                                        'arXiv',
-                                        'GitHub',
-                                        'HF Space',
-                                        'HF Model',
-                                        'HF Dataset',
-                                    ])
     paper_category_names = [
-        'Long Paper',
-        'Short Paper',
-        'Special Theme Paper',
-        'Findings',
-        'Industry Track',
     ]
-    paper_categories = gr.CheckboxGroup(label='Paper Categories',
-                                        choices=paper_category_names,
-                                        value=paper_category_names)
-    search_button = gr.Button('Search')
-    number_of_papers = gr.Textbox(label='Number of Papers Found')
     table = gr.HTML(show_label=False)
     gr.Markdown(NOTES)

 from paper_list import PaperList
+DESCRIPTION = "# NAACL 2022 Papers"
+NOTES = """
 - [NAACL 2022](https://2022.naacl.org/)
 - [NAACL'22 Reproducibility Track](https://naacl2022-reproducibility-track.github.io/results/)
+"""
 paper_list = PaperList()
+with gr.Blocks(css="style.css") as demo:
     gr.Markdown(DESCRIPTION)
     search_box = gr.Textbox(
+        label="Search Title", placeholder="You can search for titles with regular expressions. e.g. (?<!sur)face"
+    )
+    case_sensitive = gr.Checkbox(label="Case Sensitive")
+    filter_names = gr.CheckboxGroup(
+        label="Filter",
+        choices=[
+            "arXiv",
+            "GitHub",
+            "HF Space",
+            "HF Model",
+            "HF Dataset",
+        ],
     )
     paper_category_names = [
+        "Long Paper",
+        "Short Paper",
+        "Special Theme Paper",
+        "Findings",
+        "Industry Track",
     ]
+    paper_categories = gr.CheckboxGroup(
+        label="Paper Categories", choices=paper_category_names, value=paper_category_names
+    )
+    search_button = gr.Button("Search")
+    number_of_papers = gr.Textbox(label="Number of Papers Found")
     table = gr.HTML(show_label=False)
     gr.Markdown(NOTES)

paper_list.py CHANGED Viewed

@@ -5,10 +5,10 @@ import pandas as pd
 class PaperList:
     def __init__(self):
-        self.table = pd.read_csv('papers.csv')
         self._preprcess_table()
-        self.table_header = '''
             <tr>
                 <td width="50%">Paper</td>
                 <td width="22%">Authors</td>
@@ -19,28 +19,23 @@ class PaperList:
                 <td width="4%">HF Spaces</td>
                 <td width="4%">HF Models</td>
                 <td width="4%">HF Datasets</td>
-            </tr>'''
     def _preprcess_table(self) -> None:
-        self.table['title_lowercase'] = self.table.title.str.lower()
         rows = []
         for row in self.table.itertuples():
-            paper = f'<a href="{row.url}" target="_blank">{row.title}</a>' if isinstance(
-                row.url, str) else row.title
-            pdf = f'<a href="{row.pdf}" target="_blank">pdf</a>' if isinstance(
-                row.pdf, str) else ''
-            arxiv = f'<a href="{row.arxiv}" target="_blank">arXiv</a>' if isinstance(
-                row.arxiv, str) else ''
-            github = f'<a href="{row.github}" target="_blank">GitHub</a>' if isinstance(
-                row.github, str) else ''
-            hf_space = f'<a href="{row.hf_space}" target="_blank">Space</a>' if isinstance(
-                row.hf_space, str) else ''
-            hf_model = f'<a href="{row.hf_model}" target="_blank">Model</a>' if isinstance(
-                row.hf_model, str) else ''
-            hf_dataset = f'<a href="{row.hf_dataset}" target="_blank">Dataset</a>' if isinstance(
-                row.hf_dataset, str) else ''
-            row = f'''
                 <tr>
                     <td>{paper}</td>
                     <td>{row.authors}</td>
@@ -51,33 +46,37 @@ class PaperList:
                     <td>{hf_space}</td>
                     <td>{hf_model}</td>
                     <td>{hf_dataset}</td>
-                </tr>'''
             rows.append(row)
-        self.table['html_table_content'] = rows
-    def render(self, search_query: str, case_sensitive: bool,
-               filter_names: list[str],
-               paper_categories: list[str]) -> tuple[int, str]:
         df = self.table
         if search_query:
             if case_sensitive:
                 df = df[df.title.str.contains(search_query)]
             else:
                 df = df[df.title_lowercase.str.contains(search_query.lower())]
-        has_arxiv = 'arXiv' in filter_names
-        has_github = 'GitHub' in filter_names
-        has_hf_space = 'HF Space' in filter_names
-        has_hf_model = 'HF Model' in filter_names
-        has_hf_dataset = 'HF Dataset' in filter_names
-        df = self.filter_table(df, has_arxiv, has_github, has_hf_space,
-                               has_hf_model, has_hf_dataset, paper_categories)
         return len(df), self.to_html(df, self.table_header)
     @staticmethod
-    def filter_table(df: pd.DataFrame, has_arxiv: bool, has_github: bool,
-                     has_hf_space: bool, has_hf_model: bool,
-                     has_hf_dataset: bool,
-                     paper_categories: list[str]) -> pd.DataFrame:
         if has_arxiv:
             df = df[~df.arxiv.isna()]
         if has_github:
@@ -93,10 +92,10 @@ class PaperList:
     @staticmethod
     def to_html(df: pd.DataFrame, table_header: str) -> str:
-        table_data = ''.join(df.html_table_content)
-        html = f'''
         <table>
             {table_header}
             {table_data}
-        </table>'''
         return html

 class PaperList:
     def __init__(self):
+        self.table = pd.read_csv("papers.csv")
         self._preprcess_table()
+        self.table_header = """
             <tr>
                 <td width="50%">Paper</td>
                 <td width="22%">Authors</td>
                 <td width="4%">HF Spaces</td>
                 <td width="4%">HF Models</td>
                 <td width="4%">HF Datasets</td>
+            </tr>"""
     def _preprcess_table(self) -> None:
+        self.table["title_lowercase"] = self.table.title.str.lower()
         rows = []
         for row in self.table.itertuples():
+            paper = f'<a href="{row.url}" target="_blank">{row.title}</a>' if isinstance(row.url, str) else row.title
+            pdf = f'<a href="{row.pdf}" target="_blank">pdf</a>' if isinstance(row.pdf, str) else ""
+            arxiv = f'<a href="{row.arxiv}" target="_blank">arXiv</a>' if isinstance(row.arxiv, str) else ""
+            github = f'<a href="{row.github}" target="_blank">GitHub</a>' if isinstance(row.github, str) else ""
+            hf_space = f'<a href="{row.hf_space}" target="_blank">Space</a>' if isinstance(row.hf_space, str) else ""
+            hf_model = f'<a href="{row.hf_model}" target="_blank">Model</a>' if isinstance(row.hf_model, str) else ""
+            hf_dataset = (
+                f'<a href="{row.hf_dataset}" target="_blank">Dataset</a>' if isinstance(row.hf_dataset, str) else ""
+            )
+            row = f"""
                 <tr>
                     <td>{paper}</td>
                     <td>{row.authors}</td>
                     <td>{hf_space}</td>
                     <td>{hf_model}</td>
                     <td>{hf_dataset}</td>
+                </tr>"""
             rows.append(row)
+        self.table["html_table_content"] = rows
+    def render(
+        self, search_query: str, case_sensitive: bool, filter_names: list[str], paper_categories: list[str]
+    ) -> tuple[int, str]:
         df = self.table
         if search_query:
             if case_sensitive:
                 df = df[df.title.str.contains(search_query)]
             else:
                 df = df[df.title_lowercase.str.contains(search_query.lower())]
+        has_arxiv = "arXiv" in filter_names
+        has_github = "GitHub" in filter_names
+        has_hf_space = "HF Space" in filter_names
+        has_hf_model = "HF Model" in filter_names
+        has_hf_dataset = "HF Dataset" in filter_names
+        df = self.filter_table(df, has_arxiv, has_github, has_hf_space, has_hf_model, has_hf_dataset, paper_categories)
         return len(df), self.to_html(df, self.table_header)
     @staticmethod
+    def filter_table(
+        df: pd.DataFrame,
+        has_arxiv: bool,
+        has_github: bool,
+        has_hf_space: bool,
+        has_hf_model: bool,
+        has_hf_dataset: bool,
+        paper_categories: list[str],
+    ) -> pd.DataFrame:
         if has_arxiv:
             df = df[~df.arxiv.isna()]
         if has_github:
     @staticmethod
     def to_html(df: pd.DataFrame, table_header: str) -> str:
+        table_data = "".join(df.html_table_content)
+        html = f"""
         <table>
             {table_header}
             {table_data}
+        </table>"""
         return html

style.css CHANGED Viewed

@@ -1,5 +1,6 @@
 h1 {
   text-align: center;
 }
 table a {
   background-color: transparent;
@@ -16,7 +17,3 @@ a:hover {
 table, th, td {
   border: 1px solid;
 }
-img#visitor-badge {
-  display: block;
-  margin: auto;
-}

 h1 {
   text-align: center;
+  display: block;
 }
 table a {
   background-color: transparent;
 table, th, td {
   border: 1px solid;
 }