cerebras
/

btlm-3b-8k-base

Text Generation

Model card · Files and versions

Faisal AlKhateeb committed on Jul 19, 2023

Commit

6317e26

·

1 Parent(s): 2c2d81f

add checkpoint

Files changed (2) hide show

config.json +34 -0
pytorch_model.bin +3 -0

config.json ADDED Viewed

	@@ -0,0 +1,34 @@

+{
+    "auto_map": {
+        "AutoConfig": "configuration_btlm.BTLMConfig",
+        "AutoModel": "modeling_btlm.BTLMModel",
+        "AutoModelForSequenceClassification": "modeling_btlm.BTLMForSequenceClassification",
+        "AutoModelForTokenClassification": "modeling_btlm.BTLMForTokenClassification",
+        "AutoModelForQuestionAnswering": "modeling_btlm.BTLMForQuestionAnswering",
+        "AutoModelForCausalLM": "modeling_btlm.BTLMLMHeadModel"
+    },
+    "architectures": [
+        "BTLMLMHeadModel"
+    ],
+    "attn_pdrop": 0.0,
+    "bos_token_id": 50256,
+    "eos_token_id": 50256,
+    "scale_attn_weights": true,
+    "resid_pdrop": 0.0,
+    "embeddings_scale": 14.6,
+    "n_inner": 6826,
+    "n_embd": 2560,
+    "layer_norm_epsilon": 1e-05,
+    "n_positions": 8192,
+    "activation_function": "swiglu",
+    "n_head": 32,
+    "n_layer": 32,
+    "model_type": "btlm",
+    "width_scale": 0.1,
+    "output_logits_scale": 0.22200000000000003,
+    "position_embedding_type": "alibi",
+    "scale_qk_dot_by_d": true,
+    "tie_word_embeddings": true,
+    "vocab_size": 50257,
+    "embd_pdrop": 0.0
+}

pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2c941784983f87a61c21450c65774c591a49291f565f3f15396348d5a1dd0263
+size 13247298643