tbung committed on
Commit
42edf3c
·
1 Parent(s): 3fda8cb

fix: reduce number of languages, add lora

Browse files
adapter_config.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alora_invocation_tokens": null,
3
+ "alpha_pattern": {},
4
+ "arrow_config": null,
5
+ "auto_mapping": {
6
+ "base_model_class": "RobertaForSequenceClassification",
7
+ "parent_library": "transformers.models.roberta.modeling_roberta"
8
+ },
9
+ "base_model_name_or_path": "huggingface/CodeBERTa-small-v1",
10
+ "bias": "none",
11
+ "corda_config": null,
12
+ "ensure_weight_tying": false,
13
+ "eva_config": null,
14
+ "exclude_modules": null,
15
+ "fan_in_fan_out": false,
16
+ "inference_mode": true,
17
+ "init_lora_weights": true,
18
+ "layer_replication": null,
19
+ "layers_pattern": null,
20
+ "layers_to_transform": null,
21
+ "loftq_config": {},
22
+ "lora_alpha": 16,
23
+ "lora_bias": false,
24
+ "lora_dropout": 0.1,
25
+ "megatron_config": null,
26
+ "megatron_core": "megatron.core",
27
+ "modules_to_save": [
28
+ "classifier"
29
+ ],
30
+ "peft_type": "LORA",
31
+ "peft_version": "0.18.0",
32
+ "qalora_group_size": 16,
33
+ "r": 16,
34
+ "rank_pattern": {},
35
+ "revision": null,
36
+ "target_modules": [
37
+ "value",
38
+ "query"
39
+ ],
40
+ "target_parameters": null,
41
+ "task_type": null,
42
+ "trainable_token_indices": null,
43
+ "use_dora": false,
44
+ "use_qalora": false,
45
+ "use_rslora": false
46
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2402db45b928e2129ec461c2b8c3cfe2814fc4cdc2c7fc1ef90ce0c52033df25
3
+ size 3570544
config.json CHANGED
@@ -11,114 +11,26 @@
11
  "hidden_dropout_prob": 0.1,
12
  "hidden_size": 768,
13
  "id2label": {
14
- "0": "Assembly",
15
- "1": "Batchfile",
16
- "2": "C",
17
- "3": "C#",
18
- "4": "C++",
19
- "5": "CMake",
20
- "6": "COBOL",
21
- "7": "CSS",
22
- "8": "CSV",
23
- "9": "Clojure",
24
- "10": "CoffeeScript",
25
- "11": "DM",
26
- "12": "Dart",
27
- "13": "Dockerfile",
28
- "14": "Elixir",
29
- "15": "Erlang",
30
- "16": "Fortran",
31
- "17": "Go",
32
- "18": "Groovy",
33
- "19": "HTML",
34
- "20": "Haskell",
35
- "21": "INI",
36
- "22": "JSON",
37
- "23": "Java",
38
- "24": "JavaScript",
39
- "25": "Julia",
40
- "26": "Kotlin",
41
- "27": "Lisp",
42
- "28": "Lua",
43
- "29": "Makefile",
44
- "30": "Matlab",
45
- "31": "OCaml",
46
- "32": "Objective-C",
47
- "33": "PHP",
48
- "34": "Pascal",
49
- "35": "Perl",
50
- "36": "PowerShell",
51
- "37": "Prolog",
52
- "38": "Python",
53
- "39": "R",
54
- "40": "Ruby",
55
- "41": "Rust",
56
- "42": "SQL",
57
- "43": "Scala",
58
- "44": "Shell",
59
- "45": "Swift",
60
- "46": "TeX",
61
- "47": "TypeScript",
62
- "48": "Verilog",
63
- "49": "Visual Basic",
64
- "50": "XML",
65
- "51": "YAML"
66
  },
67
  "initializer_range": 0.02,
68
  "intermediate_size": 3072,
69
  "label2id": {
70
- "Assembly": 0,
71
- "Batchfile": 1,
72
- "C": 2,
73
- "C#": 3,
74
- "C++": 4,
75
- "CMake": 5,
76
- "COBOL": 6,
77
- "CSS": 7,
78
- "CSV": 8,
79
- "Clojure": 9,
80
- "CoffeeScript": 10,
81
- "DM": 11,
82
- "Dart": 12,
83
- "Dockerfile": 13,
84
- "Elixir": 14,
85
- "Erlang": 15,
86
- "Fortran": 16,
87
- "Go": 17,
88
- "Groovy": 18,
89
- "HTML": 19,
90
- "Haskell": 20,
91
- "INI": 21,
92
- "JSON": 22,
93
- "Java": 23,
94
- "JavaScript": 24,
95
- "Julia": 25,
96
- "Kotlin": 26,
97
- "Lisp": 27,
98
- "Lua": 28,
99
- "Makefile": 29,
100
- "Matlab": 30,
101
- "OCaml": 31,
102
- "Objective-C": 32,
103
- "PHP": 33,
104
- "Pascal": 34,
105
- "Perl": 35,
106
- "PowerShell": 36,
107
- "Prolog": 37,
108
- "Python": 38,
109
- "R": 39,
110
- "Ruby": 40,
111
- "Rust": 41,
112
- "SQL": 42,
113
- "Scala": 43,
114
- "Shell": 44,
115
- "Swift": 45,
116
- "TeX": 46,
117
- "TypeScript": 47,
118
- "Verilog": 48,
119
- "Visual Basic": 49,
120
- "XML": 50,
121
- "YAML": 51
122
  },
123
  "layer_norm_eps": 1e-05,
124
  "max_position_embeddings": 514,
@@ -127,7 +39,6 @@
127
  "num_hidden_layers": 6,
128
  "pad_token_id": 1,
129
  "position_embedding_type": "absolute",
130
- "problem_type": "single_label_classification",
131
  "transformers_version": "4.57.0",
132
  "type_vocab_size": 1,
133
  "use_cache": true,
 
11
  "hidden_dropout_prob": 0.1,
12
  "hidden_size": 768,
13
  "id2label": {
14
+ "0": "C#",
15
+ "1": "Go",
16
+ "2": "JSON",
17
+ "3": "Java",
18
+ "4": "TypeScript",
19
+ "5": "Python",
20
+ "6": "Rust",
21
+ "7": "Shell"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
22
  },
23
  "initializer_range": 0.02,
24
  "intermediate_size": 3072,
25
  "label2id": {
26
+ "C#": 0,
27
+ "Go": 1,
28
+ "JSON": 2,
29
+ "Java": 3,
30
+ "Python": 5,
31
+ "Rust": 6,
32
+ "Shell": 7,
33
+ "TypeScript": 4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
34
  },
35
  "layer_norm_eps": 1e-05,
36
  "max_position_embeddings": 514,
 
39
  "num_hidden_layers": 6,
40
  "pad_token_id": 1,
41
  "position_embedding_type": "absolute",
 
42
  "transformers_version": "4.57.0",
43
  "type_vocab_size": 1,
44
  "use_cache": true,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f0bb8a3f7117d4dc8dc40f73b2b7620be6cd78430b171049938670e999bb8b84
3
- size 333976000
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15f29975ded74b6bf071753e05b25401f099419d06cf9ed1845bfba94a02746c
3
+ size 333840656
tokenizer_config.json CHANGED
@@ -54,6 +54,5 @@
54
  "pad_token": "<pad>",
55
  "sep_token": "</s>",
56
  "tokenizer_class": "RobertaTokenizer",
57
- "trim_offsets": true,
58
  "unk_token": "<unk>"
59
  }
 
54
  "pad_token": "<pad>",
55
  "sep_token": "</s>",
56
  "tokenizer_class": "RobertaTokenizer",
 
57
  "unk_token": "<unk>"
58
  }
vocab.json CHANGED
The diff for this file is too large to render. See raw diff