Update arvix.py
Browse files
arvix.py
CHANGED
@@ -50,7 +50,7 @@ def extract_data(category):
|
|
50 |
if not utils.check_data_in_file(paper_id, 'arxiv.txt'):
|
51 |
utils.write_data_to_file(paper_id, 'arxiv.txt')
|
52 |
all_ids.add(paper_id)
|
53 |
-
if len(all_ids) >=
|
54 |
break
|
55 |
return list(all_ids)
|
56 |
|
@@ -86,11 +86,11 @@ def extract_arxiv_data():
|
|
86 |
if paper_id not in used_ids:
|
87 |
category_ids.add(paper_id)
|
88 |
used_ids.add(paper_id)
|
89 |
-
if len(category_ids) ==
|
90 |
break
|
91 |
-
if len(category_ids) ==
|
92 |
break
|
93 |
-
while len(category_ids) <
|
94 |
category_ids.add(random.choice(list(used_ids)))
|
95 |
data[category] = {"ids": list(category_ids), "count": len(category_ids)}
|
96 |
if not utils.upload_datafile('arxiv.txt'):
|
|
|
50 |
if not utils.check_data_in_file(paper_id, 'arxiv.txt'):
|
51 |
utils.write_data_to_file(paper_id, 'arxiv.txt')
|
52 |
all_ids.add(paper_id)
|
53 |
+
if len(all_ids) >= 2:
|
54 |
break
|
55 |
return list(all_ids)
|
56 |
|
|
|
86 |
if paper_id not in used_ids:
|
87 |
category_ids.add(paper_id)
|
88 |
used_ids.add(paper_id)
|
89 |
+
if len(category_ids) == 2:
|
90 |
break
|
91 |
+
if len(category_ids) == 2:
|
92 |
break
|
93 |
+
while len(category_ids) < 2:
|
94 |
category_ids.add(random.choice(list(used_ids)))
|
95 |
data[category] = {"ids": list(category_ids), "count": len(category_ids)}
|
96 |
if not utils.upload_datafile('arxiv.txt'):
|