Upload combined_data_stats.json with huggingface_hub
Browse files- combined_data_stats.json +72 -0
combined_data_stats.json
ADDED
|
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"total_samples": 15271,
|
| 3 |
+
"data_sources": {
|
| 4 |
+
"1_2_m_academic_v0_1": 865,
|
| 5 |
+
"None": 8262,
|
| 6 |
+
"30_60_s_academic_v0_1": 2096,
|
| 7 |
+
"0_30_s_perceptiontest": 470,
|
| 8 |
+
"0_30_s_academic_v0_1": 1411,
|
| 9 |
+
"2_3_m_academic_v0_1": 806,
|
| 10 |
+
"0_30_s_nextqa": 131,
|
| 11 |
+
"1_2_m_nextqa": 95,
|
| 12 |
+
"30_60_s_perceptiontest": 167,
|
| 13 |
+
"30_60_s_nextqa": 139,
|
| 14 |
+
"clevrer": 829
|
| 15 |
+
},
|
| 16 |
+
"assistant_stats": {
|
| 17 |
+
"characters": {
|
| 18 |
+
"min": 37.0,
|
| 19 |
+
"max": 10918.0,
|
| 20 |
+
"avg": 1817.258201820444,
|
| 21 |
+
"count": 15271
|
| 22 |
+
},
|
| 23 |
+
"words": {
|
| 24 |
+
"min": 4.0,
|
| 25 |
+
"max": 1918.0,
|
| 26 |
+
"avg": 321.41202278829155,
|
| 27 |
+
"count": 15271
|
| 28 |
+
},
|
| 29 |
+
"tokens": {
|
| 30 |
+
"min": 9.25,
|
| 31 |
+
"max": 2729.5,
|
| 32 |
+
"avg": 454.314550455111,
|
| 33 |
+
"count": 15271,
|
| 34 |
+
"definition": "tokens = characters / 4.0"
|
| 35 |
+
}
|
| 36 |
+
},
|
| 37 |
+
"unique_videos": {
|
| 38 |
+
"total_unique_overall": 11816,
|
| 39 |
+
"per_data_source_unique_counts": {
|
| 40 |
+
"1_2_m_academic_v0_1": 635,
|
| 41 |
+
"None": 6349,
|
| 42 |
+
"30_60_s_academic_v0_1": 1563,
|
| 43 |
+
"0_30_s_perceptiontest": 402,
|
| 44 |
+
"0_30_s_academic_v0_1": 1060,
|
| 45 |
+
"2_3_m_academic_v0_1": 551,
|
| 46 |
+
"0_30_s_nextqa": 121,
|
| 47 |
+
"1_2_m_nextqa": 92,
|
| 48 |
+
"30_60_s_perceptiontest": 140,
|
| 49 |
+
"30_60_s_nextqa": 131,
|
| 50 |
+
"clevrer": 814
|
| 51 |
+
}
|
| 52 |
+
},
|
| 53 |
+
"video_metadata": {
|
| 54 |
+
"ffprobe_available": true,
|
| 55 |
+
"probed_videos_count": 11816,
|
| 56 |
+
"duration_seconds": {
|
| 57 |
+
"min": 5.0,
|
| 58 |
+
"max": 179.932,
|
| 59 |
+
"mean": 48.94285781990521,
|
| 60 |
+
"count": 11816
|
| 61 |
+
},
|
| 62 |
+
"resolution_groups": {
|
| 63 |
+
"below_480p": 5463,
|
| 64 |
+
"between_480p_720p": 2514,
|
| 65 |
+
"between_720p_1080p": 2298,
|
| 66 |
+
"above_1080p": 1541,
|
| 67 |
+
"unknown": 0
|
| 68 |
+
},
|
| 69 |
+
"errors_total": 0,
|
| 70 |
+
"errors_sample": []
|
| 71 |
+
}
|
| 72 |
+
}
|