stefan-it committed on
Commit
c2b9dd2
·
1 Parent(s): 6ce722e

model: add config and trained xLSTM model

Browse files
Files changed (2) hide show
  1. config.json +24 -0
  2. model.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "torch_dtype": "float32",
3
+ "architectures": [
4
+ "xLSTMForCausalLM"
5
+ ],
6
+ "transformers_version": "4.44.0",
7
+ "_xlstm_config": {
8
+ "num_blocks": 24,
9
+ "embedding_dim": 768,
10
+ "mlstm_block": {
11
+ "mlstm": {
12
+ "num_heads": 4
13
+ }
14
+ },
15
+ "slstm_block": {},
16
+ "slstm_at": [],
17
+ "context_length": 512,
18
+ "vocab_size": 32000
19
+ },
20
+ "vocab_size": 32000,
21
+ "embedding_dim": 768,
22
+ "context_length": 512,
23
+ "model_type": "xlstm"
24
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:881342c6711b37a7659080df758441a77b2c527bfc1b9251f7b631027a6b7db1
3
+ size 444504408