Update config.json
config.json (+19 -5)
@@ -1,14 +1,28 @@
 {
-  "_name_or_path": "…
+  "_name_or_path": "normalcomputing/extended-mind-mpt-30b",
   "architectures": [
     "ExtendedMptForCausalLM"
   ],
   "attn_config": {
-    "…
+    "alibi": true,
+    "alibi_bias_max": 8,
+    "attn_impl": "torch",
+    "attn_pdrop": 0,
+    "attn_type": "multihead_attention",
+    "attn_uses_sequence_id": false,
+    "clip_qkv": null,
+    "mask_by_sim": true,
+    "memory_type": "manual",
+    "prefix_lm": false,
+    "qk_ln": false,
+    "sim_threshold": 0.25,
+    "softmax_scale": null,
+    "topk": 10,
+    "use_active_externalism": true
   },
   "auto_map": {
-    "AutoConfig": "…
-    "AutoModelForCausalLM": "…
+    "AutoConfig": "configuration.ExtendedMptConfig",
+    "AutoModelForCausalLM": "modeling.ExtendedMptForCausalLM"
   },
   "d_model": 7168,
   "emb_pdrop": 0,
@@ -41,7 +55,7 @@
   "tokenizer_name": "EleutherAI/gpt-neox-20b",
   "torch_dtype": "float32",
   "transformers_version": "4.33.0",
-  "use_cache": …
+  "use_cache": true,
   "use_external_mind": true,
   "use_external_mind_by_layer": [
     true,
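
The "auto_map" entries added in this commit are what let the generic transformers Auto classes resolve the custom ExtendedMptConfig and ExtendedMptForCausalLM classes from the configuration.py and modeling.py files shipped in this repo, which requires passing trust_remote_code=True at load time. A minimal loading sketch, using only the standard transformers API and names taken from this config (exactly how the custom class exposes attn_config on the loaded config object is an assumption):

    from transformers import AutoConfig, AutoModelForCausalLM, AutoTokenizer

    repo = "normalcomputing/extended-mind-mpt-30b"

    # trust_remote_code=True lets transformers import the classes named in
    # "auto_map" (configuration.ExtendedMptConfig, modeling.ExtendedMptForCausalLM).
    config = AutoConfig.from_pretrained(repo, trust_remote_code=True)

    # The attn_config block from this commit travels with the config; printing it
    # should show the new keys (topk, sim_threshold, memory_type, ...).
    print(config.attn_config)

    model = AutoModelForCausalLM.from_pretrained(repo, config=config, trust_remote_code=True)

    # "tokenizer_name" in the config points at the GPT-NeoX-20B tokenizer.
    tokenizer = AutoTokenizer.from_pretrained("EleutherAI/gpt-neox-20b")

The new "use_cache": true only sets the default for KV caching during generation; as with any standard transformers model, callers can still override it per call (e.g. model.generate(..., use_cache=False)).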