Update arvix.py
Browse files
arvix.py
CHANGED
|
@@ -50,7 +50,7 @@ def extract_data(category):
|
|
| 50 |
if not utils.check_data_in_file(paper_id, 'arxiv.txt'):
|
| 51 |
utils.write_data_to_file(paper_id, 'arxiv.txt')
|
| 52 |
all_ids.add(paper_id)
|
| 53 |
-
if len(all_ids) >=
|
| 54 |
break
|
| 55 |
return list(all_ids)
|
| 56 |
|
|
@@ -86,11 +86,11 @@ def extract_arxiv_data():
|
|
| 86 |
if paper_id not in used_ids:
|
| 87 |
category_ids.add(paper_id)
|
| 88 |
used_ids.add(paper_id)
|
| 89 |
-
if len(category_ids) ==
|
| 90 |
break
|
| 91 |
-
if len(category_ids) ==
|
| 92 |
break
|
| 93 |
-
while len(category_ids) <
|
| 94 |
category_ids.add(random.choice(list(used_ids)))
|
| 95 |
data[category] = {"ids": list(category_ids), "count": len(category_ids)}
|
| 96 |
if not utils.upload_datafile('arxiv.txt'):
|
|
|
|
| 50 |
if not utils.check_data_in_file(paper_id, 'arxiv.txt'):
|
| 51 |
utils.write_data_to_file(paper_id, 'arxiv.txt')
|
| 52 |
all_ids.add(paper_id)
|
| 53 |
+
if len(all_ids) >= 2:
|
| 54 |
break
|
| 55 |
return list(all_ids)
|
| 56 |
|
|
|
|
| 86 |
if paper_id not in used_ids:
|
| 87 |
category_ids.add(paper_id)
|
| 88 |
used_ids.add(paper_id)
|
| 89 |
+
if len(category_ids) == 2:
|
| 90 |
break
|
| 91 |
+
if len(category_ids) == 2:
|
| 92 |
break
|
| 93 |
+
while len(category_ids) < 2:
|
| 94 |
category_ids.add(random.choice(list(used_ids)))
|
| 95 |
data[category] = {"ids": list(category_ids), "count": len(category_ids)}
|
| 96 |
if not utils.upload_datafile('arxiv.txt'):
|