First commit
Browse files- Code.ipynb +59 -0
- Code2.ipynb +0 -0
- local_dataset_directory/dataset_dict.json +1 -0
- local_dataset_directory/train/data-00000-of-00007.arrow +3 -0
- local_dataset_directory/train/data-00001-of-00007.arrow +3 -0
- local_dataset_directory/train/data-00002-of-00007.arrow +3 -0
- local_dataset_directory/train/data-00003-of-00007.arrow +3 -0
- local_dataset_directory/train/data-00004-of-00007.arrow +3 -0
- local_dataset_directory/train/data-00005-of-00007.arrow +3 -0
- local_dataset_directory/train/data-00006-of-00007.arrow +3 -0
- local_dataset_directory/train/dataset_info.json +50 -0
- local_dataset_directory/train/state.json +31 -0
Code.ipynb
ADDED
|
@@ -0,0 +1,59 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cells": [
|
| 3 |
+
{
|
| 4 |
+
"cell_type": "code",
|
| 5 |
+
"execution_count": null,
|
| 6 |
+
"metadata": {},
|
| 7 |
+
"outputs": [
|
| 8 |
+
{
|
| 9 |
+
"data": {
|
| 10 |
+
"application/vnd.jupyter.widget-view+json": {
|
| 11 |
+
"model_id": "1165efaad02849e4945d9b0f726a33c3",
|
| 12 |
+
"version_major": 2,
|
| 13 |
+
"version_minor": 0
|
| 14 |
+
},
|
| 15 |
+
"text/plain": [
|
| 16 |
+
"Saving the dataset (0/7 shards): 0%| | 0/82560 [00:00<?, ? examples/s]"
|
| 17 |
+
]
|
| 18 |
+
},
|
| 19 |
+
"metadata": {},
|
| 20 |
+
"output_type": "display_data"
|
| 21 |
+
}
|
| 22 |
+
],
|
| 23 |
+
"source": [
|
| 24 |
+
"# Method 1: Using datasets library\n",
|
| 25 |
+
"from datasets import load_dataset\n",
|
| 26 |
+
"\n",
|
| 27 |
+
"# Download and load the dataset\n",
|
| 28 |
+
"dataset = load_dataset(\"akinsanyaayomide/skin_cancer_dataset_balanced_labels_aug\")\n",
|
| 29 |
+
"\n",
|
| 30 |
+
"# Print basic dataset information\n",
|
| 31 |
+
"print(dataset)\n",
|
| 32 |
+
"\n",
|
| 33 |
+
"# Example: Access first few samples\n",
|
| 34 |
+
"print(dataset[\"train\"][:3])"
|
| 35 |
+
]
|
| 36 |
+
}
|
| 37 |
+
],
|
| 38 |
+
"metadata": {
|
| 39 |
+
"kernelspec": {
|
| 40 |
+
"display_name": "base",
|
| 41 |
+
"language": "python",
|
| 42 |
+
"name": "python3"
|
| 43 |
+
},
|
| 44 |
+
"language_info": {
|
| 45 |
+
"codemirror_mode": {
|
| 46 |
+
"name": "ipython",
|
| 47 |
+
"version": 3
|
| 48 |
+
},
|
| 49 |
+
"file_extension": ".py",
|
| 50 |
+
"mimetype": "text/x-python",
|
| 51 |
+
"name": "python",
|
| 52 |
+
"nbconvert_exporter": "python",
|
| 53 |
+
"pygments_lexer": "ipython3",
|
| 54 |
+
"version": "3.12.3"
|
| 55 |
+
}
|
| 56 |
+
},
|
| 57 |
+
"nbformat": 4,
|
| 58 |
+
"nbformat_minor": 2
|
| 59 |
+
}
|
Code2.ipynb
ADDED
|
File without changes
|
local_dataset_directory/dataset_dict.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"splits": ["train"]}
|
local_dataset_directory/train/data-00000-of-00007.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3f8542f1cdfdb27a13a2fb01a8d3e0c1df791e372c2274e895589df028660738
|
| 3 |
+
size 503410528
|
local_dataset_directory/train/data-00001-of-00007.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d7e3d5b80067e094f8386a0e66078d8290300bc35582b0e1f323ab3c4ccf12ef
|
| 3 |
+
size 505796984
|
local_dataset_directory/train/data-00002-of-00007.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a1f3677d4b1fd8e83f86ef33c0834e95b2301a05206debd9876bbb55dc6938c0
|
| 3 |
+
size 545738880
|
local_dataset_directory/train/data-00003-of-00007.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ce461d017aa575ff9ccfc0f688553a61c9ec31acb96832a7757dc499ef906cb3
|
| 3 |
+
size 504405232
|
local_dataset_directory/train/data-00004-of-00007.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b8097135e39e8d5f08b498560f858b141fcaa3fb66e94124346014bb8d9a6e95
|
| 3 |
+
size 222551824
|
local_dataset_directory/train/data-00005-of-00007.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cb80265c2a981f0d8b56dfdcdb0ab9ef6c69150d11b0bcc4846000b4a652fdff
|
| 3 |
+
size 421870296
|
local_dataset_directory/train/data-00006-of-00007.arrow
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f3b513ee6f3f44b77874ded157e454bd9c7603f2634c3caf400e32d9f8498179
|
| 3 |
+
size 503388728
|
local_dataset_directory/train/dataset_info.json
ADDED
|
@@ -0,0 +1,50 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"builder_name": "parquet",
|
| 3 |
+
"citation": "",
|
| 4 |
+
"config_name": "default",
|
| 5 |
+
"dataset_name": "skin_cancer_dataset_balanced_labels_aug",
|
| 6 |
+
"dataset_size": 3206879716,
|
| 7 |
+
"description": "",
|
| 8 |
+
"download_checksums": {
|
| 9 |
+
"hf://datasets/akinsanyaayomide/skin_cancer_dataset_balanced_labels_aug@539d615f74f9820c0730a1c1a92766d9064f155f/balanced_skin_cancer_dataset.parquet": {
|
| 10 |
+
"num_bytes": 3205594311,
|
| 11 |
+
"checksum": null
|
| 12 |
+
}
|
| 13 |
+
},
|
| 14 |
+
"download_size": 3205594311,
|
| 15 |
+
"features": {
|
| 16 |
+
"image": {
|
| 17 |
+
"_type": "Image"
|
| 18 |
+
},
|
| 19 |
+
"label": {
|
| 20 |
+
"dtype": "int64",
|
| 21 |
+
"_type": "Value"
|
| 22 |
+
}
|
| 23 |
+
},
|
| 24 |
+
"homepage": "",
|
| 25 |
+
"license": "",
|
| 26 |
+
"size_in_bytes": 6412474027,
|
| 27 |
+
"splits": {
|
| 28 |
+
"train": {
|
| 29 |
+
"name": "train",
|
| 30 |
+
"num_bytes": 3206879716,
|
| 31 |
+
"num_examples": 82560,
|
| 32 |
+
"shard_lengths": [
|
| 33 |
+
11800,
|
| 34 |
+
11700,
|
| 35 |
+
10800,
|
| 36 |
+
11700,
|
| 37 |
+
20600,
|
| 38 |
+
11300,
|
| 39 |
+
4660
|
| 40 |
+
],
|
| 41 |
+
"dataset_name": "skin_cancer_dataset_balanced_labels_aug"
|
| 42 |
+
}
|
| 43 |
+
},
|
| 44 |
+
"version": {
|
| 45 |
+
"version_str": "0.0.0",
|
| 46 |
+
"major": 0,
|
| 47 |
+
"minor": 0,
|
| 48 |
+
"patch": 0
|
| 49 |
+
}
|
| 50 |
+
}
|
local_dataset_directory/train/state.json
ADDED
|
@@ -0,0 +1,31 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_data_files": [
|
| 3 |
+
{
|
| 4 |
+
"filename": "data-00000-of-00007.arrow"
|
| 5 |
+
},
|
| 6 |
+
{
|
| 7 |
+
"filename": "data-00001-of-00007.arrow"
|
| 8 |
+
},
|
| 9 |
+
{
|
| 10 |
+
"filename": "data-00002-of-00007.arrow"
|
| 11 |
+
},
|
| 12 |
+
{
|
| 13 |
+
"filename": "data-00003-of-00007.arrow"
|
| 14 |
+
},
|
| 15 |
+
{
|
| 16 |
+
"filename": "data-00004-of-00007.arrow"
|
| 17 |
+
},
|
| 18 |
+
{
|
| 19 |
+
"filename": "data-00005-of-00007.arrow"
|
| 20 |
+
},
|
| 21 |
+
{
|
| 22 |
+
"filename": "data-00006-of-00007.arrow"
|
| 23 |
+
}
|
| 24 |
+
],
|
| 25 |
+
"_fingerprint": "2ed268d78b91509f",
|
| 26 |
+
"_format_columns": null,
|
| 27 |
+
"_format_kwargs": {},
|
| 28 |
+
"_format_type": null,
|
| 29 |
+
"_output_all_columns": false,
|
| 30 |
+
"_split": "train"
|
| 31 |
+
}
|