mmaaz60 committed on
Commit
0d9b80c
·
verified ·
1 Parent(s): 85291be

Upload combined_data_stats.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. combined_data_stats.json +72 -0
combined_data_stats.json ADDED
@@ -0,0 +1,72 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "total_samples": 15271,
3
+ "data_sources": {
4
+ "1_2_m_academic_v0_1": 865,
5
+ "None": 8262,
6
+ "30_60_s_academic_v0_1": 2096,
7
+ "0_30_s_perceptiontest": 470,
8
+ "0_30_s_academic_v0_1": 1411,
9
+ "2_3_m_academic_v0_1": 806,
10
+ "0_30_s_nextqa": 131,
11
+ "1_2_m_nextqa": 95,
12
+ "30_60_s_perceptiontest": 167,
13
+ "30_60_s_nextqa": 139,
14
+ "clevrer": 829
15
+ },
16
+ "assistant_stats": {
17
+ "characters": {
18
+ "min": 37.0,
19
+ "max": 10918.0,
20
+ "avg": 1817.258201820444,
21
+ "count": 15271
22
+ },
23
+ "words": {
24
+ "min": 4.0,
25
+ "max": 1918.0,
26
+ "avg": 321.41202278829155,
27
+ "count": 15271
28
+ },
29
+ "tokens": {
30
+ "min": 9.25,
31
+ "max": 2729.5,
32
+ "avg": 454.314550455111,
33
+ "count": 15271,
34
+ "definition": "tokens = characters / 4.0"
35
+ }
36
+ },
37
+ "unique_videos": {
38
+ "total_unique_overall": 11816,
39
+ "per_data_source_unique_counts": {
40
+ "1_2_m_academic_v0_1": 635,
41
+ "None": 6349,
42
+ "30_60_s_academic_v0_1": 1563,
43
+ "0_30_s_perceptiontest": 402,
44
+ "0_30_s_academic_v0_1": 1060,
45
+ "2_3_m_academic_v0_1": 551,
46
+ "0_30_s_nextqa": 121,
47
+ "1_2_m_nextqa": 92,
48
+ "30_60_s_perceptiontest": 140,
49
+ "30_60_s_nextqa": 131,
50
+ "clevrer": 814
51
+ }
52
+ },
53
+ "video_metadata": {
54
+ "ffprobe_available": true,
55
+ "probed_videos_count": 11816,
56
+ "duration_seconds": {
57
+ "min": 5.0,
58
+ "max": 179.932,
59
+ "mean": 48.94285781990521,
60
+ "count": 11816
61
+ },
62
+ "resolution_groups": {
63
+ "below_480p": 5463,
64
+ "between_480p_720p": 2514,
65
+ "between_720p_1080p": 2298,
66
+ "above_1080p": 1541,
67
+ "unknown": 0
68
+ },
69
+ "errors_total": 0,
70
+ "errors_sample": []
71
+ }
72
+ }