optimum/tiny_random_bert_neuron

Optimum committed on Aug 16, 2023

Commit

77378cd

1 Parent(s): 4c47022

Upload config.json with huggingface_hub

Files changed (1) hide show

config.json CHANGED Viewed

@@ -4,37 +4,40 @@
     "BertModel"
   ],
   "attention_probs_dropout_prob": 0.1,
-  "auto_cast": null,
-  "auto_cast_type": null,
   "classifier_dropout": null,
-  "disable_fallback": true,
-  "disable_fast_relayout": false,
-  "dynamic_batch_size": true,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 32,
   "initializer_range": 0.02,
-  "input_names": [
-    "input_ids",
-    "attention_mask",
-    "token_type_ids"
-  ],
   "intermediate_size": 37,
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
   "model_type": "bert",
-  "neuron_batch_size": 1,
-  "neuron_sequence_length": 16,
   "num_attention_heads": 4,
   "num_hidden_layers": 5,
-  "output_names": [
-    "last_hidden_state",
-    "pooler_output"
-  ],
   "pad_token_id": 0,
   "position_embedding_type": "absolute",
-  "torchscript": true,
-  "transformers_version": "4.29.2",
   "type_vocab_size": 16,
   "use_cache": true,
   "vocab_size": 1124

     "BertModel"
   ],
   "attention_probs_dropout_prob": 0.1,
   "classifier_dropout": null,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 32,
   "initializer_range": 0.02,
   "intermediate_size": 37,
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
   "model_type": "bert",
+  "neuron": {
+    "auto_cast": null,
+    "auto_cast_type": null,
+    "compiler_type": "neuron-cc",
+    "compiler_version": "1.15.0.0+eec0c3604",
+    "disable_fallback": false,
+    "disable_fast_relayout": false,
+    "dynamic_batch_size": false,
+    "input_names": [
+      "input_ids",
+      "attention_mask",
+      "token_type_ids"
+    ],
+    "output_names": [
+      "logits"
+    ],
+    "static_batch_size": 1,
+    "static_sequence_length": 32
+  },
   "num_attention_heads": 4,
   "num_hidden_layers": 5,
   "pad_token_id": 0,
   "position_embedding_type": "absolute",
+  "torch_dtype": "float32",
+  "transformers_version": "4.31.0",
   "type_vocab_size": 16,
   "use_cache": true,
   "vocab_size": 1124