Spaces:

ICML2022
/

ICML2022_papers

Sleeping

App Files Community

hysts HF staff committed on Jun 11

Commit

2e8621f

•

1 Parent(s): eb928c8

Update

Browse files

Files changed (6) hide show

.pre-commit-config.yaml +59 -35
.style.yapf +0 -5
README.md +1 -1
app.py +18 -18
paper_list.py +46 -48
style.css +1 -4

.pre-commit-config.yaml CHANGED Viewed

@@ -1,36 +1,60 @@
 repos:
-- repo: https://github.com/pre-commit/pre-commit-hooks
-  rev: v4.2.0
-  hooks:
-  - id: check-executables-have-shebangs
-  - id: check-json
-  - id: check-merge-conflict
-  - id: check-shebang-scripts-are-executable
-  - id: check-toml
-  - id: check-yaml
-  - id: double-quote-string-fixer
-  - id: end-of-file-fixer
-  - id: mixed-line-ending
-    args: ['--fix=lf']
-  - id: requirements-txt-fixer
-  - id: trailing-whitespace
-- repo: https://github.com/myint/docformatter
-  rev: v1.4
-  hooks:
-  - id: docformatter
-    args: ['--in-place']
-- repo: https://github.com/pycqa/isort
-  rev: 5.12.0
-  hooks:
-    - id: isort
-- repo: https://github.com/pre-commit/mirrors-mypy
-  rev: v0.991
-  hooks:
-    - id: mypy
-      args: ['--ignore-missing-imports']
-      additional_dependencies: ['types-requests']
-- repo: https://github.com/google/yapf
-  rev: v0.32.0
-  hooks:
-  - id: yapf
-    args: ['--parallel', '--in-place']

 repos:
+  - repo: https://github.com/pre-commit/pre-commit-hooks
+    rev: v4.6.0
+    hooks:
+      - id: check-executables-have-shebangs
+      - id: check-json
+      - id: check-merge-conflict
+      - id: check-shebang-scripts-are-executable
+      - id: check-toml
+      - id: check-yaml
+      - id: end-of-file-fixer
+      - id: mixed-line-ending
+        args: ["--fix=lf"]
+      - id: requirements-txt-fixer
+      - id: trailing-whitespace
+  - repo: https://github.com/myint/docformatter
+    rev: v1.7.5
+    hooks:
+      - id: docformatter
+        args: ["--in-place"]
+  - repo: https://github.com/pycqa/isort
+    rev: 5.13.2
+    hooks:
+      - id: isort
+        args: ["--profile", "black"]
+  - repo: https://github.com/pre-commit/mirrors-mypy
+    rev: v1.10.0
+    hooks:
+      - id: mypy
+        args: ["--ignore-missing-imports"]
+        additional_dependencies:
+          [
+            "types-python-slugify",
+            "types-requests",
+            "types-PyYAML",
+            "types-pytz",
+          ]
+  - repo: https://github.com/psf/black
+    rev: 24.4.2
+    hooks:
+      - id: black
+        language_version: python3.10
+        args: ["--line-length", "119"]
+  - repo: https://github.com/kynan/nbstripout
+    rev: 0.7.1
+    hooks:
+      - id: nbstripout
+        args:
+          [
+            "--extra-keys",
+            "metadata.interpreter metadata.kernelspec cell.metadata.pycharm",
+          ]
+  - repo: https://github.com/nbQA-dev/nbQA
+    rev: 1.8.5
+    hooks:
+      - id: nbqa-black
+      - id: nbqa-pyupgrade
+        args: ["--py37-plus"]
+      - id: nbqa-isort
+        args: ["--float-to-top"]

.style.yapf DELETED Viewed

@@ -1,5 +0,0 @@
-[style]
-based_on_style = pep8
-blank_line_before_nested_class_or_def = false
-spaces_before_comment = 2
-split_before_logical_operator = true

README.md CHANGED Viewed

@@ -4,7 +4,7 @@ emoji: 🦀
 colorFrom: green
 colorTo: gray
 sdk: gradio
-sdk_version: 3.36.1
 app_file: app.py
 pinned: true
 ---

 colorFrom: green
 colorTo: gray
 sdk: gradio
+sdk_version: 4.36.1
 app_file: app.py
 pinned: true
 ---

app.py CHANGED Viewed

@@ -6,34 +6,34 @@ import gradio as gr
 from paper_list import PaperList
-DESCRIPTION = '# ICML 2022 Papers'
-NOTES = '''
 - [ICML 2022](https://icml.cc/Conferences/2022/)
 - [Proceedings](https://proceedings.mlr.press/v162/)
-'''
 paper_list = PaperList()
-with gr.Blocks(css='style.css') as demo:
     gr.Markdown(DESCRIPTION)
     search_box = gr.Textbox(
-        label='Search Title',
-        placeholder=
-        'You can search for titles with regular expressions. e.g. (?<!sur)face'
     )
-    case_sensitive = gr.Checkbox(label='Case Sensitive')
-    filter_names = gr.CheckboxGroup(label='Filter',
-                                    choices=[
-                                        'arXiv',
-                                        'GitHub',
-                                        'HF Space',
-                                        'HF Model',
-                                        'HF Dataset',
-                                    ])
-    search_button = gr.Button('Search')
-    number_of_papers = gr.Textbox(label='Number of Papers Found')
     table = gr.HTML(show_label=False)
     gr.Markdown(NOTES)

 from paper_list import PaperList
+DESCRIPTION = "# ICML 2022 Papers"
+NOTES = """
 - [ICML 2022](https://icml.cc/Conferences/2022/)
 - [Proceedings](https://proceedings.mlr.press/v162/)
+"""
 paper_list = PaperList()
+with gr.Blocks(css="style.css") as demo:
     gr.Markdown(DESCRIPTION)
     search_box = gr.Textbox(
+        label="Search Title", placeholder="You can search for titles with regular expressions. e.g. (?<!sur)face"
     )
+    case_sensitive = gr.Checkbox(label="Case Sensitive")
+    filter_names = gr.CheckboxGroup(
+        label="Filter",
+        choices=[
+            "arXiv",
+            "GitHub",
+            "HF Space",
+            "HF Model",
+            "HF Dataset",
+        ],
+    )
+    search_button = gr.Button("Search")
+    number_of_papers = gr.Textbox(label="Number of Papers Found")
     table = gr.HTML(show_label=False)
     gr.Markdown(NOTES)

paper_list.py CHANGED Viewed

@@ -8,11 +8,11 @@ from huggingface_hub.hf_api import SpaceInfo
 class PaperList:
     def __init__(self):
-        self.organization_name = 'ICML2022'
-        self.table = pd.read_csv('papers.csv')
         self._preprcess_table()
-        self.table_header = '''
             <tr>
                 <td width="50%">Paper</td>
                 <td width="26%">Authors</td>
@@ -22,49 +22,44 @@ class PaperList:
                 <td width="4%">HF Spaces</td>
                 <td width="4%">HF Models</td>
                 <td width="4%">HF Datasets</td>
-            </tr>'''
     @staticmethod
     def load_space_info(author: str) -> list[SpaceInfo]:
-        path = 'https://huggingface.co/api/spaces'
-        r = requests.get(path, params={'author': author})
         d = r.json()
         return [SpaceInfo(**x) for x in d]
-    def add_spaces_to_table(self, organization_name: str,
-                            df: pd.DataFrame) -> pd.DataFrame:
         spaces = self.load_space_info(organization_name)
-        name2space = {
-            s.id.split('/')[1].lower(): f'https://huggingface.co/spaces/{s.id}'
-            for s in spaces
-        }
-        df['hf_space'] = df.loc[:, ['hf_space', 'github']].apply(
-            lambda x: x[0] if isinstance(x[0], str) else name2space.get(
-                x[1].split('/')[-1].lower()
-                if isinstance(x[1], str) else '', np.nan),
-            axis=1)
         return df
     def _preprcess_table(self) -> None:
-        self.table = self.add_spaces_to_table(self.organization_name,
-                                              self.table)
-        self.table['title_lowercase'] = self.table.title.str.lower()
         rows = []
         for row in self.table.itertuples():
             paper = f'<a href="{row.url}" target="_blank">{row.title}</a>'
             pdf = f'<a href="{row.pdf}" target="_blank">pdf</a>'
-            arxiv = f'<a href="{row.arxiv}" target="_blank">arXiv</a>' if isinstance(
-                row.arxiv, str) else ''
-            github = f'<a href="{row.github}" target="_blank">GitHub</a>' if isinstance(
-                row.github, str) else ''
-            hf_space = f'<a href="{row.hf_space}" target="_blank">Space</a>' if isinstance(
-                row.hf_space, str) else ''
-            hf_model = f'<a href="{row.hf_model}" target="_blank">Model</a>' if isinstance(
-                row.hf_model, str) else ''
-            hf_dataset = f'<a href="{row.hf_dataset}" target="_blank">Dataset</a>' if isinstance(
-                row.hf_dataset, str) else ''
-            row = f'''
                 <tr>
                     <td>{paper}</td>
                     <td>{row.authors}</td>
@@ -74,31 +69,34 @@ class PaperList:
                     <td>{hf_space}</td>
                     <td>{hf_model}</td>
                     <td>{hf_dataset}</td>
-                </tr>'''
             rows.append(row)
-        self.table['html_table_content'] = rows
-    def render(self, search_query: str, case_sensitive: bool,
-               filter_names: list[str]) -> tuple[int, str]:
         df = self.add_spaces_to_table(self.organization_name, self.table)
         if search_query:
             if case_sensitive:
                 df = df[df.title.str.contains(search_query)]
             else:
                 df = df[df.title_lowercase.str.contains(search_query.lower())]
-        has_arxiv = 'arXiv' in filter_names
-        has_github = 'GitHub' in filter_names
-        has_hf_space = 'HF Space' in filter_names
-        has_hf_model = 'HF Model' in filter_names
-        has_hf_dataset = 'HF Dataset' in filter_names
-        df = self.filter_table(df, has_arxiv, has_github, has_hf_space,
-                               has_hf_model, has_hf_dataset)
         return len(df), self.to_html(df, self.table_header)
     @staticmethod
-    def filter_table(df: pd.DataFrame, has_arxiv: bool, has_github: bool,
-                     has_hf_space: bool, has_hf_model: bool,
-                     has_hf_dataset: bool) -> pd.DataFrame:
         if has_arxiv:
             df = df[~df.arxiv.isna()]
         if has_github:
@@ -113,10 +111,10 @@ class PaperList:
     @staticmethod
     def to_html(df: pd.DataFrame, table_header: str) -> str:
-        table_data = ''.join(df.html_table_content)
-        html = f'''
         <table>
             {table_header}
             {table_data}
-        </table>'''
         return html

 class PaperList:
     def __init__(self):
+        self.organization_name = "ICML2022"
+        self.table = pd.read_csv("papers.csv")
         self._preprcess_table()
+        self.table_header = """
             <tr>
                 <td width="50%">Paper</td>
                 <td width="26%">Authors</td>
                 <td width="4%">HF Spaces</td>
                 <td width="4%">HF Models</td>
                 <td width="4%">HF Datasets</td>
+            </tr>"""
     @staticmethod
     def load_space_info(author: str) -> list[SpaceInfo]:
+        path = "https://huggingface.co/api/spaces"
+        r = requests.get(path, params={"author": author})
         d = r.json()
         return [SpaceInfo(**x) for x in d]
+    def add_spaces_to_table(self, organization_name: str, df: pd.DataFrame) -> pd.DataFrame:
         spaces = self.load_space_info(organization_name)
+        name2space = {s.id.split("/")[1].lower(): f"https://huggingface.co/spaces/{s.id}" for s in spaces}
+        df["hf_space"] = df.loc[:, ["hf_space", "github"]].apply(
+            lambda x: (
+                x[0]
+                if isinstance(x[0], str)
+                else name2space.get(x[1].split("/")[-1].lower() if isinstance(x[1], str) else "", np.nan)
+            ),
+            axis=1,
+        )
         return df
     def _preprcess_table(self) -> None:
+        self.table = self.add_spaces_to_table(self.organization_name, self.table)
+        self.table["title_lowercase"] = self.table.title.str.lower()
         rows = []
         for row in self.table.itertuples():
             paper = f'<a href="{row.url}" target="_blank">{row.title}</a>'
             pdf = f'<a href="{row.pdf}" target="_blank">pdf</a>'
+            arxiv = f'<a href="{row.arxiv}" target="_blank">arXiv</a>' if isinstance(row.arxiv, str) else ""
+            github = f'<a href="{row.github}" target="_blank">GitHub</a>' if isinstance(row.github, str) else ""
+            hf_space = f'<a href="{row.hf_space}" target="_blank">Space</a>' if isinstance(row.hf_space, str) else ""
+            hf_model = f'<a href="{row.hf_model}" target="_blank">Model</a>' if isinstance(row.hf_model, str) else ""
+            hf_dataset = (
+                f'<a href="{row.hf_dataset}" target="_blank">Dataset</a>' if isinstance(row.hf_dataset, str) else ""
+            )
+            row = f"""
                 <tr>
                     <td>{paper}</td>
                     <td>{row.authors}</td>
                     <td>{hf_space}</td>
                     <td>{hf_model}</td>
                     <td>{hf_dataset}</td>
+                </tr>"""
             rows.append(row)
+        self.table["html_table_content"] = rows
+    def render(self, search_query: str, case_sensitive: bool, filter_names: list[str]) -> tuple[int, str]:
         df = self.add_spaces_to_table(self.organization_name, self.table)
         if search_query:
             if case_sensitive:
                 df = df[df.title.str.contains(search_query)]
             else:
                 df = df[df.title_lowercase.str.contains(search_query.lower())]
+        has_arxiv = "arXiv" in filter_names
+        has_github = "GitHub" in filter_names
+        has_hf_space = "HF Space" in filter_names
+        has_hf_model = "HF Model" in filter_names
+        has_hf_dataset = "HF Dataset" in filter_names
+        df = self.filter_table(df, has_arxiv, has_github, has_hf_space, has_hf_model, has_hf_dataset)
         return len(df), self.to_html(df, self.table_header)
     @staticmethod
+    def filter_table(
+        df: pd.DataFrame,
+        has_arxiv: bool,
+        has_github: bool,
+        has_hf_space: bool,
+        has_hf_model: bool,
+        has_hf_dataset: bool,
+    ) -> pd.DataFrame:
         if has_arxiv:
             df = df[~df.arxiv.isna()]
         if has_github:
     @staticmethod
     def to_html(df: pd.DataFrame, table_header: str) -> str:
+        table_data = "".join(df.html_table_content)
+        html = f"""
         <table>
             {table_header}
             {table_data}
+        </table>"""
         return html

style.css CHANGED Viewed

@@ -1,5 +1,6 @@
 h1 {
   text-align: center;
 }
 table a {
   background-color: transparent;
@@ -16,7 +17,3 @@ a:hover {
 table, th, td {
   border: 1px solid;
 }
-img#visitor-badge {
-  display: block;
-  margin: auto;
-}

 h1 {
   text-align: center;
+  display: block;
 }
 table a {
   background-color: transparent;
 table, th, td {
   border: 1px solid;
 }