apepkuss79 committed on
Commit
31b96d8
1 Parent(s): efbff56

Update models

Browse files
.gitattributes CHANGED
@@ -33,3 +33,16 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ Nemotron-Mini-4B-Instruct-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
37
+ Nemotron-Mini-4B-Instruct-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
38
+ Nemotron-Mini-4B-Instruct-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
39
+ Nemotron-Mini-4B-Instruct-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
40
+ Nemotron-Mini-4B-Instruct-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
41
+ Nemotron-Mini-4B-Instruct-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
42
+ Nemotron-Mini-4B-Instruct-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
43
+ Nemotron-Mini-4B-Instruct-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
44
+ Nemotron-Mini-4B-Instruct-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
45
+ Nemotron-Mini-4B-Instruct-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
46
+ Nemotron-Mini-4B-Instruct-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
47
+ Nemotron-Mini-4B-Instruct-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
48
+ Nemotron-Mini-4B-Instruct-f16.gguf filter=lfs diff=lfs merge=lfs -text
Nemotron-Mini-4B-Instruct-Q2_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd0f58dc5f986050c218ff0d218fc996047f55ce9d208288e5ee16152f86abde
3
+ size 1902795552
Nemotron-Mini-4B-Instruct-Q3_K_L.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba95fc84849f20310d34e76acc40f637f7888e905369bfc9be053735b4242c68
3
+ size 2452953888
Nemotron-Mini-4B-Instruct-Q3_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ff88e2e1dd12d6c52b953b88f17de3660b64acbb5ef27634d49227a446e98fc
3
+ size 2297240352
Nemotron-Mini-4B-Instruct-Q3_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:598219b93190727b87e46aab5502cf0a916399156739cda2066c54fa4df5f371
3
+ size 2115574560
Nemotron-Mini-4B-Instruct-Q4_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12768e362a120d3438415c1b4c224d1acfaf85ca670ef75644a08b4f5320f6d8
3
+ size 2567625504
Nemotron-Mini-4B-Instruct-Q4_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fa712b782f0f4d11a1b78fb370310ea836e3f6f857056c6f4d5100eb7dec447
3
+ size 2697386784
Nemotron-Mini-4B-Instruct-Q4_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9720805147b628dd3d8245ed4623036d2ccd09313b53ea9dcd3df5ac28a2b334
3
+ size 2583354144
Nemotron-Mini-4B-Instruct-Q5_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02817bc750348b56e621fbba1e9c45742d302fb8150448191f1400b5a4cdddbd
3
+ size 2993085216
Nemotron-Mini-4B-Instruct-Q5_K_M.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9186e76ba9d182a880faa5eb82c8240ee4743d56c034f6b5fd2a6d82bebeeea0
3
+ size 3059931936
Nemotron-Mini-4B-Instruct-Q5_K_S.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:361c6c76cc6b246e9f8fc3877d160027a7569b1d461ba36d480a47a411c7d826
3
+ size 2993085216
Nemotron-Mini-4B-Instruct-Q6_K.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed922ea555f6d81c9e8cb953324897cb86151d801d1b8f5990916125d7a80605
3
+ size 3445136160
Nemotron-Mini-4B-Instruct-Q8_0.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e52852b266f92ab1f81957f5cb01ec5c097ff8d69ff49698408f042c05fba07
3
+ size 4459928352
Nemotron-Mini-4B-Instruct-f16.gguf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a83fbc63c044779ed75ee1f0492e9507da83d470bc9f7953b84901b24c7b341d
3
+ size 8388156192
config.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "nvidia/Minitron-4B-Instruct",
3
+ "architectures": [
4
+ "NemotronForCausalLM"
5
+ ],
6
+ "bos_token_id": 2,
7
+ "eos_token_id": 3,
8
+ "hidden_act": "relu2",
9
+ "hidden_size": 3072,
10
+ "initializer_range": 0.0134,
11
+ "intermediate_size": 9216,
12
+ "max_position_embeddings": 4096,
13
+ "model_type": "nemotron",
14
+ "num_attention_heads": 24,
15
+ "num_hidden_layers": 32,
16
+ "num_key_value_heads": 8,
17
+ "norm_eps": 1e-05,
18
+ "rope_theta": 10000,
19
+ "partial_rotary_factor": 0.5,
20
+ "tie_word_embeddings": false,
21
+ "torch_dtype": "bfloat16",
22
+ "transformers_version": "4.32.0.dev0",
23
+ "use_cache": true,
24
+ "vocab_size": 256000,
25
+ "kv_channels": 128
26
+ }