Spaces:
Build error
Build error
spaces init
Browse files
README.md
CHANGED
@@ -1,3 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
# Auto-Research
|
2 |
![Auto-Research][logo]
|
3 |
|
@@ -22,32 +34,23 @@ Kaggle Re-usable Demo : https://www.kaggle.com/sidharthpal/auto-research-generat
|
|
22 |
(`[TIP]` click 'edit and run' to run the demo for your custom queries on a free GPU)
|
23 |
|
24 |
|
25 |
-
####
|
|
|
|
|
|
|
26 |
```
|
27 |
-
apt install -y poppler-utils libpoppler-cpp-dev
|
28 |
-
git clone https://github.com/sidphbot/Auto-Research.git
|
29 |
|
30 |
-
|
31 |
-
|
32 |
python survey.py [options] <your_research_query>
|
33 |
```
|
34 |
|
35 |
-
####
|
36 |
-
- Detailed survey draft paper as txt file
|
37 |
-
- A curated list of top 25+ papers as pdfs and txts
|
38 |
-
- Images extracted from above papers as jpegs, bmps, etc.
|
39 |
-
- Heading/Section wise highlights extracted from above papers as a re-usable pure python joblib dump
|
40 |
-
- Tables extracted from papers (optional)
|
41 |
-
- Corpus of metadata highlights/text of top 100 papers as a re-usable pure python joblib dump
|
42 |
-
|
43 |
-
## Example run #1 - python utility
|
44 |
-
|
45 |
```
|
46 |
-
|
47 |
```
|
48 |
|
49 |
-
|
50 |
-
|
51 |
```
|
52 |
from survey import Surveyor
|
53 |
mysurveyor = Surveyor()
|
@@ -264,4 +267,17 @@ optional arguments:
|
|
264 |
> during survey generation with `surveyor_obj.survey(query="my_research_query")`
|
265 |
- `max_search`: int maximum number of papers to gaze at - defaults to `100`
|
266 |
- `num_papers`: int maximum number of papers to download and analyse - defaults to `25`
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
267 |
|
|
|
1 |
+
----
|
2 |
+
-title: Surveyor
|
3 |
+
-emoji: 📊
|
4 |
+
-colorFrom: gray
|
5 |
+
-colorTo: pink
|
6 |
+
-sdk: streamlit
|
7 |
+
-sdk_version: 1.9.0
|
8 |
+
-app_file: app.py
|
9 |
+
-pinned: false
|
10 |
+
-license: apache-2.0
|
11 |
+
----
|
12 |
+
|
13 |
# Auto-Research
|
14 |
![Auto-Research][logo]
|
15 |
|
|
|
34 |
(`[TIP]` click 'edit and run' to run the demo for your custom queries on a free GPU)
|
35 |
|
36 |
|
37 |
+
#### Installation:
|
38 |
+
```
|
39 |
+
sudo apt-get install build-essential poppler-utils libpoppler-cpp-dev pkg-config python-dev
|
40 |
+
pip install git+https://github.com/sidphbot/Auto-Research.git
|
41 |
```
|
|
|
|
|
42 |
|
43 |
+
#### Run Survey (cli):
|
44 |
+
```
|
45 |
python survey.py [options] <your_research_query>
|
46 |
```
|
47 |
|
48 |
+
#### Run Survey (Streamlit web-interface - new):
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
49 |
```
|
50 |
+
streamlit run app.py
|
51 |
```
|
52 |
|
53 |
+
#### Run Survey (Python API):
|
|
|
54 |
```
|
55 |
from survey import Surveyor
|
56 |
mysurveyor = Surveyor()
|
|
|
267 |
> during survey generation with `surveyor_obj.survey(query="my_research_query")`
|
268 |
- `max_search`: int maximum number of papers to gaze at - defaults to `100`
|
269 |
- `num_papers`: int maximum number of papers to download and analyse - defaults to `25`
|
270 |
+
|
271 |
+
|
272 |
+
|
273 |
+
#### Artifacts generated (zipped):
|
274 |
+
- Detailed survey draft paper as txt file
|
275 |
+
- A curated list of top 25+ papers as pdfs and txts
|
276 |
+
- Images extracted from above papers as jpegs, bmps, etc.
|
277 |
+
- Heading/Section wise highlights extracted from above papers as a re-usable pure python joblib dump
|
278 |
+
- Tables extracted from papers (optional)
|
279 |
+
- Corpus of metadata highlights/text of top 100 papers as a re-usable pure python joblib dump
|
280 |
+
|
281 |
+
|
282 |
+
Please cite this repo if it helped you :)
|
283 |
|
app.py
CHANGED
@@ -2,7 +2,7 @@ import streamlit as st
|
|
2 |
import pandas as pd
|
3 |
import numpy as np
|
4 |
|
5 |
-
|
6 |
|
7 |
def run_survey(surveyor, research_keywords, max_search, num_papers):
|
8 |
zip_file_name, survey_file_name = surveyor.survey(research_keywords,
|
@@ -21,16 +21,10 @@ def run_survey(surveyor, research_keywords, max_search, num_papers):
|
|
21 |
btn = st.download_button(
|
22 |
label="Download detailed generated survey file",
|
23 |
data=file,
|
24 |
-
file_name=str(
|
25 |
-
)
|
26 |
-
|
27 |
-
with open(str(survey_file_name), "rb") as file:
|
28 |
-
btn = st.download_button(
|
29 |
-
label="Download detailed generated survey file",
|
30 |
-
data=file,
|
31 |
-
file_name=str(zip_file_name)
|
32 |
)
|
33 |
-
|
|
|
34 |
|
35 |
|
36 |
def survey_space():
|
@@ -47,9 +41,9 @@ def survey_space():
|
|
47 |
|
48 |
if submit:
|
49 |
st.write("hello")
|
50 |
-
|
51 |
-
|
52 |
-
|
53 |
|
54 |
|
55 |
if __name__ == '__main__':
|
|
|
2 |
import pandas as pd
|
3 |
import numpy as np
|
4 |
|
5 |
+
from src.Surveyor import Surveyor
|
6 |
|
7 |
def run_survey(surveyor, research_keywords, max_search, num_papers):
|
8 |
zip_file_name, survey_file_name = surveyor.survey(research_keywords,
|
|
|
21 |
btn = st.download_button(
|
22 |
label="Download detailed generated survey file",
|
23 |
data=file,
|
24 |
+
file_name=str(survey_file_name)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
25 |
)
|
26 |
+
for line in file.readlines():
|
27 |
+
st.write(line)
|
28 |
|
29 |
|
30 |
def survey_space():
|
|
|
41 |
|
42 |
if submit:
|
43 |
st.write("hello")
|
44 |
+
if surveyor_obj is None:
|
45 |
+
surveyor_obj = Surveyor()
|
46 |
+
run_survey(surveyor_obj, research_keywords, max_search, num_papers)
|
47 |
|
48 |
|
49 |
if __name__ == '__main__':
|