Jingya HF Staff committed on
Commit
78983a1
·
verified ·
1 Parent(s): e966339

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +30 -15
config.json CHANGED
@@ -1,14 +1,12 @@
1
  {
2
- "_name_or_path": "dslim/bert-base-NER",
 
3
  "_num_labels": 9,
4
  "architectures": [
5
  "BertForTokenClassification"
6
  ],
7
  "attention_probs_dropout_prob": 0.1,
8
- "auto_cast": null,
9
- "auto_cast_type": null,
10
  "classifier_dropout": null,
11
- "dynamic_batch_size": true,
12
  "hidden_act": "gelu",
13
  "hidden_dropout_prob": 0.1,
14
  "hidden_size": 768,
@@ -24,11 +22,6 @@
24
  "8": "I-LOC"
25
  },
26
  "initializer_range": 0.02,
27
- "input_names": [
28
- "input_ids",
29
- "attention_mask",
30
- "token_type_ids"
31
- ],
32
  "intermediate_size": 3072,
33
  "label2id": {
34
  "B-LOC": 7,
@@ -44,18 +37,40 @@
44
  "layer_norm_eps": 1e-12,
45
  "max_position_embeddings": 512,
46
  "model_type": "bert",
47
- "neuron_batch_size": 1,
48
- "neuron_sequence_length": 128,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
49
  "num_attention_heads": 12,
50
  "num_hidden_layers": 12,
51
- "output_names": [
52
- "logits"
53
- ],
54
  "output_past": true,
55
  "pad_token_id": 0,
56
  "position_embedding_type": "absolute",
 
 
57
  "torchscript": true,
58
- "transformers_version": "4.29.2",
59
  "type_vocab_size": 2,
60
  "use_cache": true,
61
  "vocab_size": 28996
 
1
  {
2
+ "_attn_implementation_autoset": true,
3
+ "_name_or_path": "/tmp/tmp85t7b0_b",
4
  "_num_labels": 9,
5
  "architectures": [
6
  "BertForTokenClassification"
7
  ],
8
  "attention_probs_dropout_prob": 0.1,
 
 
9
  "classifier_dropout": null,
 
10
  "hidden_act": "gelu",
11
  "hidden_dropout_prob": 0.1,
12
  "hidden_size": 768,
 
22
  "8": "I-LOC"
23
  },
24
  "initializer_range": 0.02,
 
 
 
 
 
25
  "intermediate_size": 3072,
26
  "label2id": {
27
  "B-LOC": 7,
 
37
  "layer_norm_eps": 1e-12,
38
  "max_position_embeddings": 512,
39
  "model_type": "bert",
40
+ "neuron": {
41
+ "auto_cast": "matmul",
42
+ "auto_cast_type": "bf16",
43
+ "compiler_type": "neuronx-cc",
44
+ "compiler_version": "2.16.372.0+4a9b2326",
45
+ "disable_fallback": false,
46
+ "disable_fast_relayout": false,
47
+ "dynamic_batch_size": false,
48
+ "inline_weights_to_neff": true,
49
+ "input_names": [
50
+ "input_ids",
51
+ "attention_mask",
52
+ "token_type_ids"
53
+ ],
54
+ "model_type": "bert",
55
+ "optlevel": "2",
56
+ "output_attentions": false,
57
+ "output_hidden_states": false,
58
+ "output_names": [
59
+ "logits"
60
+ ],
61
+ "static_batch_size": 1,
62
+ "static_sequence_length": 128,
63
+ "tensor_parallel_size": 1
64
+ },
65
  "num_attention_heads": 12,
66
  "num_hidden_layers": 12,
 
 
 
67
  "output_past": true,
68
  "pad_token_id": 0,
69
  "position_embedding_type": "absolute",
70
+ "task": "token-classification",
71
+ "torch_dtype": "float32",
72
  "torchscript": true,
73
+ "transformers_version": "4.49.0",
74
  "type_vocab_size": 2,
75
  "use_cache": true,
76
  "vocab_size": 28996