mgoin committed on
Commit
6f9f989
1 Parent(s): 41feef4

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. config.json +38 -0
  3. generation_config.json +6 -0
  4. model-00001-of-00189.safetensors +3 -0
  5. model-00002-of-00189.safetensors +3 -0
  6. model-00003-of-00189.safetensors +3 -0
  7. model-00004-of-00189.safetensors +3 -0
  8. model-00005-of-00189.safetensors +3 -0
  9. model-00006-of-00189.safetensors +3 -0
  10. model-00007-of-00189.safetensors +3 -0
  11. model-00008-of-00189.safetensors +3 -0
  12. model-00009-of-00189.safetensors +3 -0
  13. model-00010-of-00189.safetensors +3 -0
  14. model-00011-of-00189.safetensors +3 -0
  15. model-00012-of-00189.safetensors +3 -0
  16. model-00013-of-00189.safetensors +3 -0
  17. model-00014-of-00189.safetensors +3 -0
  18. model-00015-of-00189.safetensors +3 -0
  19. model-00016-of-00189.safetensors +3 -0
  20. model-00017-of-00189.safetensors +3 -0
  21. model-00018-of-00189.safetensors +3 -0
  22. model-00019-of-00189.safetensors +3 -0
  23. model-00020-of-00189.safetensors +3 -0
  24. model-00021-of-00189.safetensors +3 -0
  25. model-00022-of-00189.safetensors +3 -0
  26. model-00023-of-00189.safetensors +3 -0
  27. model-00024-of-00189.safetensors +3 -0
  28. model-00025-of-00189.safetensors +3 -0
  29. model-00026-of-00189.safetensors +3 -0
  30. model-00027-of-00189.safetensors +3 -0
  31. model-00028-of-00189.safetensors +3 -0
  32. model-00029-of-00189.safetensors +3 -0
  33. model-00030-of-00189.safetensors +3 -0
  34. model-00031-of-00189.safetensors +3 -0
  35. model-00032-of-00189.safetensors +3 -0
  36. model-00033-of-00189.safetensors +3 -0
  37. model-00034-of-00189.safetensors +3 -0
  38. model-00035-of-00189.safetensors +3 -0
  39. model-00036-of-00189.safetensors +3 -0
  40. model-00037-of-00189.safetensors +3 -0
  41. model-00038-of-00189.safetensors +3 -0
  42. model-00039-of-00189.safetensors +3 -0
  43. model-00040-of-00189.safetensors +3 -0
  44. model-00041-of-00189.safetensors +3 -0
  45. model-00042-of-00189.safetensors +3 -0
  46. model-00043-of-00189.safetensors +3 -0
  47. model-00044-of-00189.safetensors +3 -0
  48. model-00045-of-00189.safetensors +3 -0
  49. model-00046-of-00189.safetensors +3 -0
  50. model-00047-of-00189.safetensors +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "Nemotron-4-340B-Base-hf",
3
+ "architectures": [
4
+ "NemotronForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 2,
9
+ "eos_token_id": 3,
10
+ "head_dim": 192,
11
+ "hidden_act": "relu2",
12
+ "hidden_size": 18432,
13
+ "initializer_range": 0.0063,
14
+ "intermediate_size": 73728,
15
+ "max_position_embeddings": 4096,
16
+ "mlp_bias": false,
17
+ "model_type": "nemotron",
18
+ "norm_eps": 1e-05,
19
+ "num_attention_heads": 96,
20
+ "num_hidden_layers": 96,
21
+ "num_key_value_heads": 8,
22
+ "quantization_config": {
23
+ "activation_scheme": "dynamic",
24
+ "ignored_layers": [
25
+ "lm_head"
26
+ ],
27
+ "quant_method": "fp8"
28
+ },
29
+ "rope_percent": 0.5,
30
+ "rope_percentage": 0.5,
31
+ "rope_scaling": null,
32
+ "rope_theta": 10000,
33
+ "tie_word_embeddings": false,
34
+ "torch_dtype": "bfloat16",
35
+ "transformers_version": "4.43.0.dev0",
36
+ "use_cache": true,
37
+ "vocab_size": 256000
38
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 2,
4
+ "eos_token_id": 3,
5
+ "transformers_version": "4.43.0.dev0"
6
+ }
model-00001-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:492e67d00b85927fd5106a5fcc61933a93a4da2ba3dab19ad84df45908d22f2c
3
+ size 9437184112
model-00002-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:206eb1589c0ec52919a0bd5fb6bba6454cc0a5b62c987675b1b5c2e0a9551cf0
3
+ size 2095055948
model-00003-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e22dc1406f95a7cc26fb7ccb637142678fe94c45d818ee9d7c23e95b885d4a54
3
+ size 2095203836
model-00004-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cb7e046722c5d7b8453d84df84c9d2b37a6963c55d470d77ed6c193a470e494
3
+ size 1358954708
model-00005-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a6fc66b6dc8d3bc39fbd88ffd670ede2b54d32151f7a344908de89223b14a12
3
+ size 2095203836
model-00006-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa95ca271a1119e2e6ff98c86a50672a110a29ccb14bb5ed01c637813a63b20a
3
+ size 1358954708
model-00007-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3a0f5447817fda87bac0566c5a0061cd445acb79529d6f781da05c8863f2297
3
+ size 2095203836
model-00008-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f5da863a3e6ad19422f9f75d9e6f9a4b279053185201298974b9ec6ac0dcbb5
3
+ size 1358954708
model-00009-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8d53665f8e452a4cc6b670304c9f9acb2ab3fc96912768b8267d9182c08c01f
3
+ size 2095203836
model-00010-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4c94783835bfe7e3b999687b98925c05cd0d38febc74ce8129820813731fddf
3
+ size 1358954708
model-00011-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:941968406fabb8602f1145d9e0e728780f83be55c85bdb9420319b943d83a749
3
+ size 2095203836
model-00012-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b45a29bc8265bd68003ec4c6cd9d967456a61d36b22087fc290368ccb7b4ab1c
3
+ size 1358954708
model-00013-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5f3c588f6c289165d22def9abdde4af230b78cd5697ce962593d3ffb38486c4
3
+ size 2095203836
model-00014-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:197befcef18e6f1ee2634db13ae3f114aff3fd6d32979cd15f7db3ce1361cd9e
3
+ size 1358954708
model-00015-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96540f02c449ad300d9764a9bc98698fef35d8b374e6b35d2709ed7fa04a0364
3
+ size 2095203836
model-00016-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6b33f3c82e2462a3852fc80459c27b5eda495cbf7efdb5fd384dd6ffec8aa7c
3
+ size 1358954708
model-00017-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcee331e8c683d4d5bcec6568d96360221496d3588cd5d255e4401e847938bb5
3
+ size 2095203836
model-00018-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2dedde9514dcd9b03a33f1b6f4bf54c14e16ee6d14a6a01bcfdb7b4864b239b5
3
+ size 1358954708
model-00019-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:132daf633959e27797a12924f82c5079f76018a1ecf1f26a10a0f0eabf8d3442
3
+ size 2095203836
model-00020-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78fbe48f9aadff8af34d7d9761ddb5d84ea00d640b788dfa9f82af36cbd45ba0
3
+ size 1358954708
model-00021-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5af142a24bedec15cbfaf0ace484cbdf9ff01a2b4b99f72a85c98e5dddea145
3
+ size 2095203836
model-00022-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:679060a348a979ff966fbf89fccceec278b0176b58199395b659ef6001324a0d
3
+ size 1358954716
model-00023-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c02f136ad71ba9947022ffee91b71a7bdf60d1a72111a0fe681e6a6ad9364ec7
3
+ size 2095203852
model-00024-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac2e54c71d5a7fb7e214c1121c7737fd495ee1cdd7cbbfe22a1013b3ad3fbfdd
3
+ size 1358954716
model-00025-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cc4137de93bf43bd726f822d5ecc0fb3462cf887ba0de4d327c075aa31703c0
3
+ size 2095203852
model-00026-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2990fdbcd669429ae8cb740013755ffb02b6be9600e2eff431621bd005a9164
3
+ size 1358954716
model-00027-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94c7e42d62da64c135874372113cdcfc67398867222883b8a22c5ae72dc83606
3
+ size 2095203852
model-00028-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b5eee630e2f6f7a16a610d6811cb640c1ff61442a1ccbfc0fd48644ccdf3c5e
3
+ size 1358954716
model-00029-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d93081ad2411540e79148032d85f521c5fa1c22b63b19d36ba373811fd549ad1
3
+ size 2095203852
model-00030-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:749ac01f582ca0c981e8b3afa20c5fae32b3022e426054d179ff002a97928a6c
3
+ size 1358954716
model-00031-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f96672bb43116626c47df7d139dbc5fb9cfe7a56bfaf5d90c9ae7a60c845b1b
3
+ size 2095203852
model-00032-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c5cfaa532708b5befa6145eeb37a0ad761cb8d103fd316ccc5b7404731b77ef
3
+ size 1358954716
model-00033-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b742f787298466e033701ab75be0616836ba85fad05a341482cd801297416593
3
+ size 2095203852
model-00034-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75f57a0c96f25c1f6c58a1a7739226bdf12ef6a17a713900a7e6dfa81aa748fd
3
+ size 1358954716
model-00035-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8cbd533f9e874956f922a85535b37303009dd6254f6c014f376f4c7470ab17c4
3
+ size 2095203852
model-00036-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4be0f31cac813940a69778066be18a8565b094734c73a5fc54749634ab3e1468
3
+ size 1358954716
model-00037-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57e5a9c28a897b2ac80321a1053c02cf610f0d1895ba72ffba47fa4643f9e556
3
+ size 2095203852
model-00038-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce7b84d7e0ede36de80d854d4140cfb8c0f66b5af4977322ec8ade864ae6b964
3
+ size 1358954716
model-00039-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f85733ece4a869c5e4b50647000e04c83ab5867cc0f152165504c1d15b321555
3
+ size 2095203852
model-00040-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d71be466b49c450f5bb49cef853bc0d70e9713c4b88178297d3847bae631808
3
+ size 1358954716
model-00041-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c2efd9d258014378e422ead20ce17e50c3204822092bc9bbc0673fb521057d9
3
+ size 2095203852
model-00042-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0176156bd2ec62eab16e4568e1b2bdb4ecd8e29c6ae09975b254fd439f86e4cc
3
+ size 1358954716
model-00043-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47e072411cf28b82cbc9805fb81a8ee9e4e6480c585f2d4bd25d0268dfd831f1
3
+ size 2095203852
model-00044-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aef2efdcda387a1c9e1b2e16b5d34258fbe1970fc17ede4adec7e2d43e640676
3
+ size 1358954716
model-00045-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64f42af2ad24db779bc5866943455c9c53310db8817ec2244edcb04cb84f562f
3
+ size 2095203852
model-00046-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea9be991f8da98514148b6eca5fe6a66c35775ca2204dc8723c0e9b29c7be89f
3
+ size 1358954716
model-00047-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86c9fa06f9b0bd1d3b092361d662208be9c11b157a13f7c600ddb84f97b925dc
3
+ size 2095203852