File size: 1,859 Bytes
7949a3f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
{
  "builder_name": "json",
  "citation": "",
  "config_name": "default",
  "dataset_name": "json",
  "dataset_size": 22198464,
  "description": "",
  "download_checksums": {
    "/content/drive/MyDrive/Speciale/2. Data cleaning/self_instruct/self_instruct_cleaned.jsonl": {
      "num_bytes": 27572781,
      "checksum": null
    }
  },
  "download_size": 27572781,
  "features": {
    "instruction": {
      "dtype": "string",
      "_type": "Value"
    },
    "response": {
      "dtype": "string",
      "_type": "Value"
    },
    "_row_id": {
      "dtype": "int64",
      "_type": "Value"
    },
    "syntax_valid": {
      "dtype": "bool",
      "_type": "Value"
    },
    "exec_valid": {
      "dtype": "bool",
      "_type": "Value"
    },
    "exec_error": {
      "dtype": "string",
      "_type": "Value"
    },
    "prompt_norm": {
      "dtype": "string",
      "_type": "Value"
    },
    "response_norm": {
      "dtype": "string",
      "_type": "Value"
    },
    "prompt_exact_match": {
      "dtype": "bool",
      "_type": "Value"
    },
    "entry_point_exact_match": {
      "dtype": "bool",
      "_type": "Value"
    },
    "solution_exact_match": {
      "dtype": "bool",
      "_type": "Value"
    },
    "max_prompt_similarity": {
      "dtype": "float64",
      "_type": "Value"
    },
    "max_code_similarity": {
      "dtype": "float64",
      "_type": "Value"
    },
    "leakage_flag": {
      "dtype": "bool",
      "_type": "Value"
    },
    "text": {
      "dtype": "string",
      "_type": "Value"
    }
  },
  "homepage": "",
  "license": "",
  "size_in_bytes": 49771245,
  "splits": {
    "train": {
      "name": "train",
      "num_bytes": 22198464,
      "num_examples": 18015,
      "dataset_name": "json"
    }
  },
  "version": {
    "version_str": "0.0.0",
    "major": 0,
    "minor": 0,
    "patch": 0
  }
}