snezhanata committed on
Commit
d8c5280
·
verified ·
1 Parent(s): c73172d

Upload MinistralForCausalLM

Browse files
config.json CHANGED
@@ -1,9 +1,10 @@
1
  {
2
  "architectures": [
3
- "MistralForCausalLM"
4
  ],
5
  "attention_dropout": 0.0,
6
  "bos_token_id": 1,
 
7
  "eos_token_id": 2,
8
  "head_dim": 128,
9
  "hidden_act": "silu",
@@ -49,7 +50,7 @@
49
  "sliding_attention"
50
  ],
51
  "max_position_embeddings": 32768,
52
- "model_type": "mistral",
53
  "num_attention_heads": 32,
54
  "num_hidden_layers": 36,
55
  "num_key_value_heads": 8,
@@ -57,8 +58,7 @@
57
  "rope_theta": 100000000.0,
58
  "sliding_window": 32768,
59
  "tie_word_embeddings": false,
60
- "torch_dtype": "bfloat16",
61
- "transformers_version": "4.55.0",
62
  "use_cache": true,
63
  "vocab_size": 131072
64
  }
 
1
  {
2
  "architectures": [
3
+ "MinistralForCausalLM"
4
  ],
5
  "attention_dropout": 0.0,
6
  "bos_token_id": 1,
7
+ "dtype": "bfloat16",
8
  "eos_token_id": 2,
9
  "head_dim": 128,
10
  "hidden_act": "silu",
 
50
  "sliding_attention"
51
  ],
52
  "max_position_embeddings": 32768,
53
+ "model_type": "ministral",
54
  "num_attention_heads": 32,
55
  "num_hidden_layers": 36,
56
  "num_key_value_heads": 8,
 
58
  "rope_theta": 100000000.0,
59
  "sliding_window": 32768,
60
  "tie_word_embeddings": false,
61
+ "transformers_version": "4.57.0",
 
62
  "use_cache": true,
63
  "vocab_size": 131072
64
  }
generation_config.json CHANGED
@@ -2,5 +2,5 @@
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
  "eos_token_id": 2,
5
- "transformers_version": "4.55.0"
6
  }
 
2
  "_from_model_config": true,
3
  "bos_token_id": 1,
4
  "eos_token_id": 2,
5
+ "transformers_version": "4.57.0"
6
  }
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c82fb59ac8f724c2c885ed28beb9a34eaef187afd450b313a59aced38e901d7
3
  size 4983007904
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:375f7ea202d2981377fb48eab97cb151b85a8e7e58236b3f1fb37c673924d48f
3
  size 4983007904
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:57a13d9ce1d7b1b46d590aa61c4ffede6789613b7c610b9c2aba1cea0f9fcc85
3
  size 4999836776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:132faa2a11957be0e5240633597917e78f6c26512805fe608b0c36d9f33229c3
3
  size 4999836776
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1828a9c14f8675fb7db041ae2978a6d207962332a8b6619ad54fbd7aa5c37099
3
  size 4983067960
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e748256b0517c34b7349cd3fba5c524a5585f707cb5f2fa883e84bbbc5122c62
3
  size 4983067960