DeekshithN05 commited on
Commit
05f62b4
·
verified ·
1 Parent(s): b62487c

Delete exploration.ipynb

Browse files
Files changed (1) hide show
  1. exploration.ipynb +0 -190
exploration.ipynb DELETED
@@ -1,190 +0,0 @@
1
- {
2
- "cells": [
3
- {
4
- "cell_type": "markdown",
5
- "id": "94bd79f6",
6
- "metadata": {},
7
- "source": [
8
- "# Overview of the GAIA dataset"
9
- ]
10
- },
11
- {
12
- "cell_type": "code",
13
- "execution_count": 1,
14
- "id": "773d3352",
15
- "metadata": {},
16
- "outputs": [
17
- {
18
- "data": {
19
- "text/plain": [
20
- "{'task_id': 'c61d22de-5f6c-4958-a7f6-5e9707bd3466',\n",
21
- " 'Question': 'A paper about AI regulation that was originally submitted to arXiv.org in June 2022 shows a figure with three axes, where each axis has a label word at both ends. Which of these words is used to describe a type of society in a Physics and Society article submitted to arXiv.org on August 11, 2016?',\n",
22
- " 'Level': 2,\n",
23
- " 'Final answer': 'egalitarian',\n",
24
- " 'file_name': '',\n",
25
- " 'Annotator Metadata': {'Steps': '1. Go to arxiv.org and navigate to the Advanced Search page.\\n2. Enter \"AI regulation\" in the search box and select \"All fields\" from the dropdown.\\n3. Enter 2022-06-01 and 2022-07-01 into the date inputs, select \"Submission date (original)\", and submit the search.\\n4. Go through the search results to find the article that has a figure with three axes and labels on each end of the axes, titled \"Fairness in Agreement With European Values: An Interdisciplinary Perspective on AI Regulation\".\\n5. Note the six words used as labels: deontological, egalitarian, localized, standardized, utilitarian, and consequential.\\n6. Go back to arxiv.org\\n7. Find \"Physics and Society\" and go to the page for the \"Physics and Society\" category.\\n8. Note that the tag for this category is \"physics.soc-ph\".\\n9. Go to the Advanced Search page.\\n10. Enter \"physics.soc-ph\" in the search box and select \"All fields\" from the dropdown.\\n11. Enter 2016-08-11 and 2016-08-12 into the date inputs, select \"Submission date (original)\", and submit the search.\\n12. Search for instances of the six words in the results to find the paper titled \"Phase transition from egalitarian to hierarchical societies driven by competition between cognitive and social constraints\", indicating that \"egalitarian\" is the correct answer.',\n",
26
- " 'Number of steps': '12',\n",
27
- " 'How long did this take?': '8 minutes',\n",
28
- " 'Tools': '1. Web browser\\n2. Image recognition tools (to identify and parse a figure with three axes)',\n",
29
- " 'Number of tools': '2'}}"
30
- ]
31
- },
32
- "execution_count": 1,
33
- "metadata": {},
34
- "output_type": "execute_result"
35
- }
36
- ],
37
- "source": [
38
- "\n",
39
- "import json\n",
40
- "# Load the metadata.jsonl file\n",
41
- "with open('metadata.jsonl', 'r') as jsonl_file:\n",
42
- " json_list = list(jsonl_file)\n",
43
- "\n",
44
- "json_QA = []\n",
45
- "for json_str in json_list:\n",
46
- " json_data = json.loads(json_str)\n",
47
- " json_QA.append(json_data)\n",
48
- " \n",
49
- "\n",
50
- "json_QA[0]\n",
51
- " "
52
- ]
53
- },
54
- {
55
- "cell_type": "code",
56
- "execution_count": 2,
57
- "id": "be320045",
58
- "metadata": {},
59
- "outputs": [
60
- {
61
- "name": "stdout",
62
- "output_type": "stream",
63
- "text": [
64
- "==================================================\n",
65
- "Task ID: 0ff53813-3367-4f43-bcbd-3fd725c1bf4b\n",
66
- "Question: What two-word type of model did Manash Pratim Kashyap's and PS Fader's studies in customer retention studies published during 2018-2019 have in common (no punctuation)?\n",
67
- "Level: 2\n",
68
- "Final Answer: beta geometric\n",
69
- "Annotator Metadata: \n",
70
- " ├── Steps: \n",
71
- " │ ├── 1. Searched \"Manash Pratim Kashyap customer retention\" on Google.\n",
72
- " │ ├── 2. Opened https://www.journalijar.com/article/26843/a-simple-model-for-analyzing-the-customer-retention-comparing-rural-and-urban-store/.\n",
73
- " │ ├── 3. Noted \"discrete time beta geometric model\" in the abstract.\n",
74
- " │ ├── 4. Searched \"PS Fader customer retention\" on Google.\n",
75
- " │ ├── 5. Opened https://www.sciencedirect.com/science/article/abs/pii/S1094996807700233.\n",
76
- " │ ├── 6. Noted \"basic model (known as a “shifted-beta-geometric”)\" in the abstract.\n",
77
- " │ ├── 7. Extracted the two words in common.\n",
78
- " ├── Number of steps: 6\n",
79
- " ├── How long did this take?: 10 minutes\n",
80
- " ├── Tools:\n",
81
- " │ ├── 1. Web browser\n",
82
- " │ ├── 2. Search engine\n",
83
- " └── Number of tools: 2\n",
84
- "==================================================\n"
85
- ]
86
- }
87
- ],
88
- "source": [
89
- "\n",
90
- "import random\n",
91
- "# random.seed(42)\n",
92
- "random_samples = random.sample(json_QA, 1)\n",
93
- "for sample in random_samples:\n",
94
- " print(\"=\" * 50)\n",
95
- " print(f\"Task ID: {sample['task_id']}\")\n",
96
- " print(f\"Question: {sample['Question']}\")\n",
97
- " print(f\"Level: {sample['Level']}\")\n",
98
- " print(f\"Final Answer: {sample['Final answer']}\")\n",
99
- " print(f\"Annotator Metadata: \")\n",
100
- " print(f\" ├── Steps: \")\n",
101
- " for step in sample['Annotator Metadata']['Steps'].split('\\n'):\n",
102
- " print(f\" │ ├── {step}\")\n",
103
- " print(f\" ├── Number of steps: {sample['Annotator Metadata']['Number of steps']}\")\n",
104
- " print(f\" ├── How long did this take?: {sample['Annotator Metadata']['How long did this take?']}\")\n",
105
- " print(f\" ├── Tools:\")\n",
106
- " for tool in sample['Annotator Metadata']['Tools'].split('\\n'):\n",
107
- " print(f\" │ ├── {tool}\")\n",
108
- " print(f\" └── Number of tools: {sample['Annotator Metadata']['Number of tools']}\")\n",
109
- "print(\"=\" * 50)"
110
- ]
111
- },
112
- {
113
- "cell_type": "code",
114
- "execution_count": 3,
115
- "id": "64c5ca54",
116
- "metadata": {},
117
- "outputs": [
118
- {
119
- "data": {
120
- "text/plain": [
121
- "[{'task_id': 'c61d22de-5f6c-4958-a7f6-5e9707bd3466',\n",
122
- " 'Question': 'A paper about AI regulation that was originally submitted to arXiv.org in June 2022 shows a figure with three axes, where each axis has a label word at both ends. Which of these words is used to describe a type of society in a Physics and Society article submitted to arXiv.org on August 11, 2016?',\n",
123
- " 'Level': 2,\n",
124
- " 'Final answer': 'egalitarian',\n",
125
- " 'file_name': '',\n",
126
- " 'Annotator Metadata': {'Steps': '1. Go to arxiv.org and navigate to the Advanced Search page.\\n2. Enter \"AI regulation\" in the search box and select \"All fields\" from the dropdown.\\n3. Enter 2022-06-01 and 2022-07-01 into the date inputs, select \"Submission date (original)\", and submit the search.\\n4. Go through the search results to find the article that has a figure with three axes and labels on each end of the axes, titled \"Fairness in Agreement With European Values: An Interdisciplinary Perspective on AI Regulation\".\\n5. Note the six words used as labels: deontological, egalitarian, localized, standardized, utilitarian, and consequential.\\n6. Go back to arxiv.org\\n7. Find \"Physics and Society\" and go to the page for the \"Physics and Society\" category.\\n8. Note that the tag for this category is \"physics.soc-ph\".\\n9. Go to the Advanced Search page.\\n10. Enter \"physics.soc-ph\" in the search box and select \"All fields\" from the dropdown.\\n11. Enter 2016-08-11 and 2016-08-12 into the date inputs, select \"Submission date (original)\", and submit the search.\\n12. Search for instances of the six words in the results to find the paper titled \"Phase transition from egalitarian to hierarchical societies driven by competition between cognitive and social constraints\", indicating that \"egalitarian\" is the correct answer.',\n",
127
- " 'Number of steps': '12',\n",
128
- " 'How long did this take?': '8 minutes',\n",
129
- " 'Tools': '1. Web browser\\n2. Image recognition tools (to identify and parse a figure with three axes)',\n",
130
- " 'Number of tools': '2'}},\n",
131
- " {'task_id': '17b5a6a3-bc87-42e8-b0fb-6ab0781ef2cc',\n",
132
- " 'Question': 'I’m researching species that became invasive after people who kept them as pets released them. There’s a certain species of fish that was popularized as a pet by being the main character of the movie Finding Nemo. According to the USGS, where was this fish found as a nonnative species, before the year 2020? I need the answer formatted as the five-digit zip codes of the places the species was found, separated by commas if there is more than one place.',\n",
133
- " 'Level': 2,\n",
134
- " 'Final answer': '34689',\n",
135
- " 'file_name': '',\n",
136
- " 'Annotator Metadata': {'Steps': '1. Search the web for “finding nemo main character”.\\n2. Note the results, which state that the main character is a clownfish.\\n3. Search the web for “usgs nonnative species database”.\\n4. Click result for the Nonindigenous Aquatic Species site.\\n5. Click “Marine Fishes”.\\n6. Click “Species List of Nonindigenous Marine Fish”.\\n7. Scroll through the list until I find the clown anenomefish, and click “Collection info”.\\n8. Note the place that a clown anenomefish was found, in Fred Howard Park at the Gulf of Mexico.\\n9. Search the web for “fred howard park florida zip code”.\\n10. Note the zip code, 34689. Since only one clownfish was found before the year 2020, this is the answer.',\n",
137
- " 'Number of steps': '10',\n",
138
- " 'How long did this take?': '5 minutes',\n",
139
- " 'Tools': '1. Search engine\\n2. Web browser',\n",
140
- " 'Number of tools': '2'}},\n",
141
- " {'task_id': '04a04a9b-226c-43fd-b319-d5e89743676f',\n",
142
- " 'Question': 'If we assume all articles published by Nature in 2020 (articles, only, not book reviews/columns, etc) relied on statistical significance to justify their findings and they on average came to a p-value of 0.04, how many papers would be incorrect as to their claims of statistical significance? Round the value up to the next integer.',\n",
143
- " 'Level': 2,\n",
144
- " 'Final answer': '41',\n",
145
- " 'file_name': '',\n",
146
- " 'Annotator Metadata': {'Steps': '1. Find how many articles were published in Nature in 2020 by Googling \"articles submitted to nature 2020\"\\n2. Click through to Nature\\'s archive for 2020 and filter the results to only provide articles, not other types of publications: 1002\\n3. Find 4% of 1002 and round up: 40.08 > 41',\n",
147
- " 'Number of steps': '3',\n",
148
- " 'How long did this take?': '5 minutes',\n",
149
- " 'Tools': '1. search engine\\n2. calculator',\n",
150
- " 'Number of tools': '2'}}]"
151
- ]
152
- },
153
- "execution_count": 3,
154
- "metadata": {},
155
- "output_type": "execute_result"
156
- }
157
- ],
158
- "source": [
159
- "json_QA[0:3]"
160
- ]
161
- },
162
- {
163
- "cell_type": "markdown",
164
- "id": "d4ddf21d",
165
- "metadata": {},
166
- "source": []
167
- }
168
- ],
169
- "metadata": {
170
- "kernelspec": {
171
- "display_name": "Python 3",
172
- "language": "python",
173
- "name": "python3"
174
- },
175
- "language_info": {
176
- "codemirror_mode": {
177
- "name": "ipython",
178
- "version": 3
179
- },
180
- "file_extension": ".py",
181
- "mimetype": "text/x-python",
182
- "name": "python",
183
- "nbconvert_exporter": "python",
184
- "pygments_lexer": "ipython3",
185
- "version": "3.10.12"
186
- }
187
- },
188
- "nbformat": 4,
189
- "nbformat_minor": 5
190
- }