Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
eduagarcia
commited on
Commit
•
49da771
1
Parent(s):
91c6e89
update readme model list
Browse files- README.md +104 -0
- model_list.txt +104 -0
- update_models_in_readme.py +1 -0
README.md
CHANGED
@@ -64,6 +64,12 @@ models:
|
|
64 |
- BAAI/Aquila-7B
|
65 |
- BAAI/Aquila2-34B
|
66 |
- BAAI/Aquila2-7B
|
|
|
|
|
|
|
|
|
|
|
|
|
67 |
- Bruno/Caramelinho
|
68 |
- Bruno/Caramelo_7B
|
69 |
- CausalLM/34b-beta
|
@@ -72,11 +78,13 @@ models:
|
|
72 |
- CohereForAI/aya-23-8B
|
73 |
- CohereForAI/c4ai-command-r-plus-4bit
|
74 |
- CohereForAI/c4ai-command-r-v01
|
|
|
75 |
- ConvexAI/Luminex-34B-v0.1
|
76 |
- ConvexAI/Luminex-34B-v0.2
|
77 |
- CultriX/NeuralMona_MoE-4x7B
|
78 |
- DAMO-NLP-MT/polylm-1.7b
|
79 |
- DAMO-NLP-MT/polylm-13b
|
|
|
80 |
- Danielbrdz/Barcenas-Llama3-8b-ORPO
|
81 |
- Deci/DeciLM-7B
|
82 |
- DeepMount00/Llama-3-8b-Ita
|
@@ -101,6 +109,13 @@ models:
|
|
101 |
- EleutherAI/pythia-70m-deduped
|
102 |
- FuseAI/FuseChat-7B-VaRM
|
103 |
- FuseAI/OpenChat-3.5-7B-Solar
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
104 |
- GritLM/GritLM-7B
|
105 |
- GritLM/GritLM-7B-KTO
|
106 |
- GuiCas/Phituguese_FP16
|
@@ -108,6 +123,12 @@ models:
|
|
108 |
- HuggingFaceH4/zephyr-7b-alpha
|
109 |
- HuggingFaceH4/zephyr-7b-beta
|
110 |
- HuggingFaceH4/zephyr-7b-gemma-v0.1
|
|
|
|
|
|
|
|
|
|
|
|
|
111 |
- HuggingFaceTB/cosmo-1b
|
112 |
- Intel/neural-chat-7b-v3-1
|
113 |
- Intel/neural-chat-7b-v3-3
|
@@ -120,17 +141,23 @@ models:
|
|
120 |
- JJhooww/Qwen2-7B_reload_v1
|
121 |
- JosephusCheung/LL7M
|
122 |
- Kquant03/CognitiveFusion2-4x7B-BF16
|
|
|
123 |
- Kukedlc/NeuralLLaMa-3-8b-DT-v0.1
|
124 |
- Kukedlc/NeuralLLaMa-3-8b-ORPO-v0.3
|
125 |
- Kukedlc/NeuralLLaMa-3-8b-ORPO-v0.4
|
126 |
- Kukedlc/NeuralSynthesis-7B-v0.1
|
|
|
127 |
- Kukedlc/NeuralSynthesis-7b-v0.4-slerp
|
|
|
|
|
128 |
- M4-ai/tau-0.5B
|
129 |
- M4-ai/tau-0.5B-instruct-DPOP
|
130 |
- M4-ai/tau-1.8B
|
131 |
- MTSAIR/multi_verse_model
|
|
|
132 |
- MagusCorp/legislinho
|
133 |
- MaziyarPanahi/Calme-4x7B-MoE-v0.1
|
|
|
134 |
- MaziyarPanahi/Llama-3-8B-Instruct-v0.8
|
135 |
- MaziyarPanahi/Mistral-7B-Instruct-Aya-101
|
136 |
- MaziyarPanahi/Mistral-7B-Instruct-v0.3
|
@@ -138,9 +165,11 @@ models:
|
|
138 |
- MaziyarPanahi/Topxtral-4x7B-v0.1
|
139 |
- MulaBR/Mula-4x160-v0.1
|
140 |
- MulaBR/Mula-8x160-v0.1
|
|
|
141 |
- NLPark/AnFeng_v3_Avocet
|
142 |
- NOVA-vision-language/GlorIA-1.3B
|
143 |
- Nexusflow/Starling-LM-7B-beta
|
|
|
144 |
- NotAiLOL/Yi-1.5-dolphin-9B
|
145 |
- NousResearch/Hermes-2-Pro-Llama-3-8B
|
146 |
- NousResearch/Hermes-2-Theta-Llama-3-8B
|
@@ -156,6 +185,7 @@ models:
|
|
156 |
- Oburaco/llama2-qlora-finetunined-ptbr
|
157 |
- Oburaco/ptbr-falcon-7b
|
158 |
- Oburaco/ptbr-falcon-7b-v3
|
|
|
159 |
- OpenBuddy/openbuddy-qwen1.5-32b-v21.1-32k
|
160 |
- OpenBuddy/openbuddy-qwen1.5-32b-v21.2-32k
|
161 |
- OpenLLM-France/Claire-7B-0.1
|
@@ -193,17 +223,23 @@ models:
|
|
193 |
- Qwen/Qwen1.5-MoE-A2.7B-Chat
|
194 |
- Qwen/Qwen2-0.5B
|
195 |
- Qwen/Qwen2-0.5B-Instruct
|
|
|
196 |
- Qwen/Qwen2-72B-Instruct
|
197 |
- Qwen/Qwen2-7B
|
198 |
- Qwen/Qwen2-7B-Instruct
|
199 |
- RLHFlow/LLaMA3-iterative-DPO-final
|
|
|
200 |
- Ramikan-BR/TiamaPY-v30
|
|
|
201 |
- Ramikan-BR/tinyllama-coder-py-4bit-v10
|
202 |
- Ramikan-BR/tinyllama-coder-py-v11
|
203 |
- Ramikan-BR/tinyllama-coder-py-v12
|
204 |
- RogerioPiazzon/alpaca-lora-ptbr-7b
|
|
|
205 |
- SakanaAI/DiscoPOP-zephyr-7b-gemma
|
|
|
206 |
- SeaLLMs/SeaLLM-7B-v2.5
|
|
|
207 |
- SinclairSchneider/zephyr-orpo-141b-A35b-v0.1-bnb-4bit
|
208 |
- Skywork/Skywork-13B-base
|
209 |
- THUDM/LongAlign-7B-64k
|
@@ -224,10 +260,18 @@ models:
|
|
224 |
- TheBloke/zephyr-7B-beta-GPTQ
|
225 |
- TinyLlama/TinyLlama-1.1B-Chat-v1.0
|
226 |
- TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T
|
|
|
227 |
- TinyPixel/Llama-2-7B-bf16-sharded
|
|
|
|
|
|
|
|
|
|
|
|
|
228 |
- Unbabel/TowerBase-7B-v0.1
|
229 |
- VAGOsolutions/Llama-3-SauerkrautLM-8b-Instruct
|
230 |
- VAGOsolutions/SauerkrautLM-Gemma-7b
|
|
|
231 |
- VAGOsolutions/SauerkrautLM-Qwen-32b
|
232 |
- Walmart-the-bag/Misted-v2-7B
|
233 |
- Walmart-the-bag/Quintellect-10.7B
|
@@ -243,6 +287,7 @@ models:
|
|
243 |
- Weni/ZeroShot-3.4.22-Mistral-7b-DPO-1.0.0
|
244 |
- Weni/ZeroShot-Multilanguage-Zephyr-7B
|
245 |
- Weyaxi/Bagel-Hermes-34B-Slerp
|
|
|
246 |
- Weyaxi/Nous-Hermes-2-SUS-Chat-34B-Slerp
|
247 |
- WizardLMTeam/WizardLM-13B-V1.0
|
248 |
- WizardLMTeam/WizardLM-70B-V1.0
|
@@ -250,6 +295,7 @@ models:
|
|
250 |
- Xwin-LM/Xwin-LM-13B-V0.2
|
251 |
- Xwin-LM/Xwin-LM-7B-V0.1
|
252 |
- Xwin-LM/Xwin-LM-7B-V0.2
|
|
|
253 |
- abacusai/Llama-3-Smaug-8B
|
254 |
- abacusai/Smaug-34B-v0.1
|
255 |
- abacusai/Smaug-72B-v0.1
|
@@ -277,6 +323,7 @@ models:
|
|
277 |
- allenai/tulu-2-dpo-13b
|
278 |
- allenai/tulu-2-dpo-70b
|
279 |
- allenai/tulu-2-dpo-7b
|
|
|
280 |
- alpindale/WizardLM-2-8x22B
|
281 |
- alvarobartt/Mistral-7B-v0.1-ORPO
|
282 |
- alvarobartt/mistral-7b-orpo-alignment-handbook
|
@@ -297,17 +344,20 @@ models:
|
|
297 |
- baichuan-inc/Baichuan2-7B-Base
|
298 |
- bardsai/jaskier-7b-dpo-v5.6
|
299 |
- bartowski/internlm2-chat-7b-llama
|
|
|
300 |
- berkeley-nest/Starling-LM-7B-alpha
|
301 |
- bigscience/bloom-1b7
|
302 |
- bigscience/bloom-3b
|
303 |
- bigscience/bloom-560m
|
304 |
- bigscience/bloom-7b1
|
305 |
- botbot-ai/Cabra-72b
|
|
|
306 |
- botbot-ai/CabraLlama3-8b
|
307 |
- botbot-ai/CabraMistral-v3-7b-32k
|
308 |
- botbot-ai/CabraMixtral-8x7b
|
309 |
- cerebras/Cerebras-GPT-1.3B
|
310 |
- cerebras/Cerebras-GPT-111M
|
|
|
311 |
- cerebras/Cerebras-GPT-2.7B
|
312 |
- cerebras/Cerebras-GPT-256M
|
313 |
- cerebras/Cerebras-GPT-590M
|
@@ -317,15 +367,22 @@ models:
|
|
317 |
- chujiezheng/Llama-3-Instruct-8B-SimPO-ExPO
|
318 |
- chujiezheng/Smaug-34B-v0.1-ExPO
|
319 |
- cnmoro/Mistral-7B-Portuguese
|
|
|
320 |
- cognitivecomputations/WizardLM-13B-Uncensored
|
321 |
- cognitivecomputations/WizardLM-7B-Uncensored
|
322 |
- cognitivecomputations/dolphin-2.9-llama3-8b
|
|
|
323 |
- cognitivecomputations/dolphin-2.9.1-mixtral-1x22b
|
324 |
- cognitivecomputations/dolphin-2.9.1-yi-1.5-34b
|
325 |
- cognitivecomputations/dolphin-2.9.1-yi-1.5-9b
|
326 |
- cognitivecomputations/dolphin-2.9.2-Phi-3-Medium
|
327 |
- cognitivecomputations/dolphin-2.9.2-Phi-3-Medium-abliterated
|
328 |
- cognitivecomputations/dolphin-2.9.2-qwen2-7b
|
|
|
|
|
|
|
|
|
|
|
329 |
- cosmicvalor/mistral-orthogonalized
|
330 |
- croissantllm/CroissantLLMBase
|
331 |
- deepseek-ai/DeepSeek-V2-Lite
|
@@ -343,6 +400,13 @@ models:
|
|
343 |
- eduagarcia/mistral-orpo-capybara-3k
|
344 |
- eduagarcia/mistral-orpo-mix-21k
|
345 |
- eduagarcia/mistral-orpo-mix-7k
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
346 |
- eduagarcia/zephyr-pt-phi-3-mini-128k-dpo-v0.1
|
347 |
- eduagarcia/zephyr-pt-phi-3-mini-128k-orpo-v0.1
|
348 |
- eduagarcia/zephyr-pt-phi-3-mini-128k-sft-v0.1
|
@@ -365,13 +429,20 @@ models:
|
|
365 |
- facebook/xglm-4.5B
|
366 |
- facebook/xglm-564M
|
367 |
- facebook/xglm-7.5B
|
|
|
368 |
- failspy/Meta-Llama-3-8B-Instruct-abliterated-v3
|
369 |
- failspy/Phi-3-medium-4k-instruct-abliterated-v3
|
370 |
- fblgit/UNA-SimpleSmaug-34b-v1beta
|
371 |
- fernandosola/bluearara-7B
|
372 |
- fernandosola/bluearara-7B-instruct
|
|
|
|
|
373 |
- google/gemma-1.1-2b-it
|
374 |
- google/gemma-1.1-7b-it
|
|
|
|
|
|
|
|
|
375 |
- google/gemma-2b
|
376 |
- google/gemma-2b-it
|
377 |
- google/gemma-7b
|
@@ -388,8 +459,12 @@ models:
|
|
388 |
- h2oai/h2o-danube2-1.8b-base
|
389 |
- h2oai/h2o-danube2-1.8b-chat
|
390 |
- h2oai/h2o-danube2-1.8b-sft
|
|
|
|
|
|
|
391 |
- haoranxu/ALMA-13B-Pretrain
|
392 |
- haoranxu/ALMA-13B-R
|
|
|
393 |
- heloisy/zephyr-7b-b-cosmosqa-ptbr-text-v2
|
394 |
- heloisy/zephyr-7b-b-cosmosqa-ptbr-text-v3
|
395 |
- heloisy/zephyr-7b-cosmosqa-ptbr_text
|
@@ -399,6 +474,7 @@ models:
|
|
399 |
- huggyllama/llama-30b
|
400 |
- huggyllama/llama-65b
|
401 |
- huggyllama/llama-7b
|
|
|
402 |
- ibivibiv/multimaster-7b-v6
|
403 |
- internlm/internlm-20b
|
404 |
- internlm/internlm-7b
|
@@ -414,6 +490,9 @@ models:
|
|
414 |
- internlm/internlm2-chat-7b
|
415 |
- internlm/internlm2-chat-7b-sft
|
416 |
- internlm/internlm2-wqx-20b
|
|
|
|
|
|
|
417 |
- invalid-coder/Sakura-SOLAR-Instruct-CarbonVillain-en-10.7B-v2-slerp
|
418 |
- jeonsworld/CarbonVillain-en-10.7B-v4
|
419 |
- jondurbin/bagel-8b-v1.0
|
@@ -422,6 +501,7 @@ models:
|
|
422 |
- josu/gpt-neo-pt-1.3B
|
423 |
- josu/gpt-neo-pt-br
|
424 |
- jsfs11/MixtureofMerges-MoE-4x7b-v4
|
|
|
425 |
- kaist-ai/mistral-orpo-capybara-7k
|
426 |
- kaitchup/Qwen1.5-7B-bnb-4bit
|
427 |
- kekmodel/StopCarbon-10.7B-v5
|
@@ -432,16 +512,22 @@ models:
|
|
432 |
- lightblue/suzume-llama-3-8B-multilingual-orpo-borda-half
|
433 |
- lightblue/suzume-llama-3-8B-multilingual-orpo-borda-top25
|
434 |
- lightblue/suzume-llama-3-8B-multilingual-orpo-borda-top75
|
|
|
435 |
- lmsys/vicuna-13b-v1.5
|
436 |
- lmsys/vicuna-7b-v1.5
|
437 |
- lrds-code/boana-7b-instruct
|
438 |
- lrds-code/samba-1.1B
|
|
|
439 |
- lucianosb/boto-7B
|
440 |
- lucianosb/boto-7B-v1.1
|
441 |
- lucianosb/boto-7B-v1.2
|
|
|
|
|
|
|
442 |
- maritaca-ai/sabia-7b
|
443 |
- matheusrdgsf/cesar-ptbr
|
444 |
- matsuo-lab/weblab-10b
|
|
|
445 |
- maywell/Synatra-7B-v0.3-RP
|
446 |
- meraGPT/mera-mix-4x7B
|
447 |
- meta-llama/Llama-2-13b-chat-hf
|
@@ -454,6 +540,10 @@ models:
|
|
454 |
- meta-llama/Meta-Llama-3-70B-Instruct
|
455 |
- meta-llama/Meta-Llama-3-8B
|
456 |
- meta-llama/Meta-Llama-3-8B-Instruct
|
|
|
|
|
|
|
|
|
457 |
- microsoft/Phi-3-medium-128k-instruct
|
458 |
- microsoft/Phi-3-medium-4k-instruct
|
459 |
- microsoft/Phi-3-mini-128k-instruct
|
@@ -464,19 +554,24 @@ models:
|
|
464 |
- microsoft/phi-1_5
|
465 |
- microsoft/phi-2
|
466 |
- migtissera/Tess-M-v1.3
|
|
|
467 |
- mistral-community/Mistral-7B-v0.2
|
468 |
- mistral-community/Mixtral-8x22B-Instruct-v0.1-4bit
|
469 |
- mistral-community/Mixtral-8x22B-v0.1-4bit
|
|
|
470 |
- mistralai/Mistral-7B-Instruct-v0.1
|
471 |
- mistralai/Mistral-7B-Instruct-v0.2
|
472 |
- mistralai/Mistral-7B-Instruct-v0.3
|
473 |
- mistralai/Mistral-7B-v0.1
|
474 |
- mistralai/Mistral-7B-v0.3
|
|
|
|
|
475 |
- mistralai/Mixtral-8x22B-Instruct-v0.1
|
476 |
- mistralai/Mixtral-8x7B-Instruct-v0.1
|
477 |
- mistralai/Mixtral-8x7B-v0.1
|
478 |
- mlabonne/AlphaMonarch-7B
|
479 |
- mlabonne/Beyonder-4x7B-v3
|
|
|
480 |
- mlabonne/Daredevil-8B-abliterated
|
481 |
- mlabonne/Llama-3-8B-Instruct-abliterated-dpomix
|
482 |
- mlabonne/Monarch-7B
|
@@ -499,6 +594,7 @@ models:
|
|
499 |
- nicolasdec/CabraQwen7b
|
500 |
- nicolasdec/Cabramistral7b
|
501 |
- nicolasdec/cabra13b
|
|
|
502 |
- openai-community/gpt2-large
|
503 |
- openai-community/gpt2-medium
|
504 |
- openai-community/gpt2-xl
|
@@ -515,6 +611,7 @@ models:
|
|
515 |
- pedrogengo/gemma-ptbr
|
516 |
- pfnet/plamo-13b
|
517 |
- pierreguillou/gpt2-small-portuguese
|
|
|
518 |
- princeton-nlp/Llama-3-Instruct-8B-SimPO
|
519 |
- princeton-nlp/Mistral-7B-Base-SFT-SimPO
|
520 |
- projecte-aina/FLOR-1.3B
|
@@ -571,6 +668,7 @@ models:
|
|
571 |
- rhaymison/portuguese-tom-cat-13b
|
572 |
- rishiraj/CatPPT
|
573 |
- rishiraj/CatPPT-base
|
|
|
574 |
- royallab/ZephRP-m7b
|
575 |
- saltlux/luxia-21.4b-alignment-v1.0
|
576 |
- saltlux/luxia-21.4b-alignment-v1.2
|
@@ -599,9 +697,12 @@ models:
|
|
599 |
- t5-small
|
600 |
- teknium/OpenHermes-2-Mistral-7B
|
601 |
- teknium/OpenHermes-2.5-Mistral-7B
|
|
|
|
|
602 |
- tiiuae/falcon-11B
|
603 |
- tiiuae/falcon-40b
|
604 |
- tiiuae/falcon-7b
|
|
|
605 |
- togethercomputer/RedPajama-INCITE-7B-Base
|
606 |
- togethercomputer/RedPajama-INCITE-Base-3B-v1
|
607 |
- unicamp-dl/ptt5-base-portuguese-vocab
|
@@ -618,8 +719,10 @@ models:
|
|
618 |
- upstage/SOLAR-10.7B-Instruct-v1.0
|
619 |
- upstage/SOLAR-10.7B-v1.0
|
620 |
- uukuguy/speechless-code-mistral-7b-v1.0
|
|
|
621 |
- uukuguy/zephyr-7b-alpha-dare-0.85
|
622 |
- uygarkurt/llama-3-merged-linear
|
|
|
623 |
- vicgalle/CarbonBeagle-11B-truthy
|
624 |
- vicgalle/Configurable-Hermes-2-Pro-Llama-3-8B
|
625 |
- vicgalle/Configurable-Llama-3-8B-v0.3
|
@@ -639,6 +742,7 @@ models:
|
|
639 |
- xverse/XVERSE-7B
|
640 |
- yahma/llama-7b-hf
|
641 |
- yunconglong/DARE_TIES_13B
|
|
|
642 |
- yunconglong/Truthful_DPO_TomGrc_FusionNet_7Bx2_MoE_13B
|
643 |
- zhengr/MixTAO-7Bx2-MoE-v8.1
|
644 |
---
|
|
|
64 |
- BAAI/Aquila-7B
|
65 |
- BAAI/Aquila2-34B
|
66 |
- BAAI/Aquila2-7B
|
67 |
+
- BAAI/Infinity-Instruct-3M-0613-Mistral-7B
|
68 |
+
- BAAI/Infinity-Instruct-3M-0625-Llama3-8B
|
69 |
+
- BAAI/Infinity-Instruct-3M-0625-Mistral-7B
|
70 |
+
- BAAI/Infinity-Instruct-3M-0625-Qwen2-7B
|
71 |
+
- BAAI/Infinity-Instruct-3M-0625-Yi-1.5-9B
|
72 |
+
- BAAI/Infinity-Instruct-7M-0729-Llama3_1-8B
|
73 |
- Bruno/Caramelinho
|
74 |
- Bruno/Caramelo_7B
|
75 |
- CausalLM/34b-beta
|
|
|
78 |
- CohereForAI/aya-23-8B
|
79 |
- CohereForAI/c4ai-command-r-plus-4bit
|
80 |
- CohereForAI/c4ai-command-r-v01
|
81 |
+
- Columbia-NLP/LION-LLaMA-3-8b-odpo-v1.0
|
82 |
- ConvexAI/Luminex-34B-v0.1
|
83 |
- ConvexAI/Luminex-34B-v0.2
|
84 |
- CultriX/NeuralMona_MoE-4x7B
|
85 |
- DAMO-NLP-MT/polylm-1.7b
|
86 |
- DAMO-NLP-MT/polylm-13b
|
87 |
+
- Danielbrdz/Barcenas-14b-Phi-3-medium-ORPO
|
88 |
- Danielbrdz/Barcenas-Llama3-8b-ORPO
|
89 |
- Deci/DeciLM-7B
|
90 |
- DeepMount00/Llama-3-8b-Ita
|
|
|
109 |
- EleutherAI/pythia-70m-deduped
|
110 |
- FuseAI/FuseChat-7B-VaRM
|
111 |
- FuseAI/OpenChat-3.5-7B-Solar
|
112 |
+
- GeneZC/MiniChat-1.5-3B
|
113 |
+
- GeneZC/MiniChat-2-3B
|
114 |
+
- GeneZC/MiniChat-3B
|
115 |
+
- GeneZC/MiniLoong-3B
|
116 |
+
- GeneZC/MiniMA-2-1B
|
117 |
+
- GeneZC/MiniMA-2-3B
|
118 |
+
- GeneZC/MiniMA-3B
|
119 |
- GritLM/GritLM-7B
|
120 |
- GritLM/GritLM-7B-KTO
|
121 |
- GuiCas/Phituguese_FP16
|
|
|
123 |
- HuggingFaceH4/zephyr-7b-alpha
|
124 |
- HuggingFaceH4/zephyr-7b-beta
|
125 |
- HuggingFaceH4/zephyr-7b-gemma-v0.1
|
126 |
+
- HuggingFaceTB/SmolLM-1.7B
|
127 |
+
- HuggingFaceTB/SmolLM-1.7B-Instruct
|
128 |
+
- HuggingFaceTB/SmolLM-135M
|
129 |
+
- HuggingFaceTB/SmolLM-135M-Instruct
|
130 |
+
- HuggingFaceTB/SmolLM-360M
|
131 |
+
- HuggingFaceTB/SmolLM-360M-Instruct
|
132 |
- HuggingFaceTB/cosmo-1b
|
133 |
- Intel/neural-chat-7b-v3-1
|
134 |
- Intel/neural-chat-7b-v3-3
|
|
|
141 |
- JJhooww/Qwen2-7B_reload_v1
|
142 |
- JosephusCheung/LL7M
|
143 |
- Kquant03/CognitiveFusion2-4x7B-BF16
|
144 |
+
- Kukedlc/NeuralExperiment-7b-MagicCoder-v7.5
|
145 |
- Kukedlc/NeuralLLaMa-3-8b-DT-v0.1
|
146 |
- Kukedlc/NeuralLLaMa-3-8b-ORPO-v0.3
|
147 |
- Kukedlc/NeuralLLaMa-3-8b-ORPO-v0.4
|
148 |
- Kukedlc/NeuralSynthesis-7B-v0.1
|
149 |
+
- Kukedlc/NeuralSynthesis-7B-v0.3
|
150 |
- Kukedlc/NeuralSynthesis-7b-v0.4-slerp
|
151 |
+
- LiteAI/Hare-1.1B-Chat
|
152 |
+
- LiteAI/Hare-1.1B-base
|
153 |
- M4-ai/tau-0.5B
|
154 |
- M4-ai/tau-0.5B-instruct-DPOP
|
155 |
- M4-ai/tau-1.8B
|
156 |
- MTSAIR/multi_verse_model
|
157 |
+
- Magpie-Align/Llama-3-8B-Magpie-Align-v0.3
|
158 |
- MagusCorp/legislinho
|
159 |
- MaziyarPanahi/Calme-4x7B-MoE-v0.1
|
160 |
+
- MaziyarPanahi/Calme-4x7B-MoE-v0.2
|
161 |
- MaziyarPanahi/Llama-3-8B-Instruct-v0.8
|
162 |
- MaziyarPanahi/Mistral-7B-Instruct-Aya-101
|
163 |
- MaziyarPanahi/Mistral-7B-Instruct-v0.3
|
|
|
165 |
- MaziyarPanahi/Topxtral-4x7B-v0.1
|
166 |
- MulaBR/Mula-4x160-v0.1
|
167 |
- MulaBR/Mula-8x160-v0.1
|
168 |
+
- NLPark/AnFeng_v3.1-Avocet
|
169 |
- NLPark/AnFeng_v3_Avocet
|
170 |
- NOVA-vision-language/GlorIA-1.3B
|
171 |
- Nexusflow/Starling-LM-7B-beta
|
172 |
+
- Nos-PT/Carvalho_pt-gl-1.3B
|
173 |
- NotAiLOL/Yi-1.5-dolphin-9B
|
174 |
- NousResearch/Hermes-2-Pro-Llama-3-8B
|
175 |
- NousResearch/Hermes-2-Theta-Llama-3-8B
|
|
|
185 |
- Oburaco/llama2-qlora-finetunined-ptbr
|
186 |
- Oburaco/ptbr-falcon-7b
|
187 |
- Oburaco/ptbr-falcon-7b-v3
|
188 |
+
- OliveiraJLT/Sagui-7B-Instruct-v0.1
|
189 |
- OpenBuddy/openbuddy-qwen1.5-32b-v21.1-32k
|
190 |
- OpenBuddy/openbuddy-qwen1.5-32b-v21.2-32k
|
191 |
- OpenLLM-France/Claire-7B-0.1
|
|
|
223 |
- Qwen/Qwen1.5-MoE-A2.7B-Chat
|
224 |
- Qwen/Qwen2-0.5B
|
225 |
- Qwen/Qwen2-0.5B-Instruct
|
226 |
+
- Qwen/Qwen2-72B
|
227 |
- Qwen/Qwen2-72B-Instruct
|
228 |
- Qwen/Qwen2-7B
|
229 |
- Qwen/Qwen2-7B-Instruct
|
230 |
- RLHFlow/LLaMA3-iterative-DPO-final
|
231 |
+
- Ramikan-BR/Qwen2-0.5B-v5
|
232 |
- Ramikan-BR/TiamaPY-v30
|
233 |
+
- Ramikan-BR/TiamaPY-v31
|
234 |
- Ramikan-BR/tinyllama-coder-py-4bit-v10
|
235 |
- Ramikan-BR/tinyllama-coder-py-v11
|
236 |
- Ramikan-BR/tinyllama-coder-py-v12
|
237 |
- RogerioPiazzon/alpaca-lora-ptbr-7b
|
238 |
+
- RubielLabarta/LogoS-7Bx2-MoE-13B-v0.2
|
239 |
- SakanaAI/DiscoPOP-zephyr-7b-gemma
|
240 |
+
- SeaLLMs/SeaLLM-7B-v2
|
241 |
- SeaLLMs/SeaLLM-7B-v2.5
|
242 |
+
- SeaLLMs/SeaLLMs-v3-7B-Chat
|
243 |
- SinclairSchneider/zephyr-orpo-141b-A35b-v0.1-bnb-4bit
|
244 |
- Skywork/Skywork-13B-base
|
245 |
- THUDM/LongAlign-7B-64k
|
|
|
260 |
- TheBloke/zephyr-7B-beta-GPTQ
|
261 |
- TinyLlama/TinyLlama-1.1B-Chat-v1.0
|
262 |
- TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T
|
263 |
+
- TinyLlama/TinyLlama_v1.1
|
264 |
- TinyPixel/Llama-2-7B-bf16-sharded
|
265 |
+
- UCLA-AGI/Gemma-2-9B-It-SPPO-Iter2
|
266 |
+
- UCLA-AGI/Gemma-2-9B-It-SPPO-Iter3
|
267 |
+
- UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter2
|
268 |
+
- UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter3
|
269 |
+
- UCLA-AGI/Mistral7B-PairRM-SPPO-Iter2
|
270 |
+
- UCLA-AGI/Mistral7B-PairRM-SPPO-Iter3
|
271 |
- Unbabel/TowerBase-7B-v0.1
|
272 |
- VAGOsolutions/Llama-3-SauerkrautLM-8b-Instruct
|
273 |
- VAGOsolutions/SauerkrautLM-Gemma-7b
|
274 |
+
- VAGOsolutions/SauerkrautLM-Nemo-12b-Instruct
|
275 |
- VAGOsolutions/SauerkrautLM-Qwen-32b
|
276 |
- Walmart-the-bag/Misted-v2-7B
|
277 |
- Walmart-the-bag/Quintellect-10.7B
|
|
|
287 |
- Weni/ZeroShot-3.4.22-Mistral-7b-DPO-1.0.0
|
288 |
- Weni/ZeroShot-Multilanguage-Zephyr-7B
|
289 |
- Weyaxi/Bagel-Hermes-34B-Slerp
|
290 |
+
- Weyaxi/Einstein-v7-Qwen2-7B
|
291 |
- Weyaxi/Nous-Hermes-2-SUS-Chat-34B-Slerp
|
292 |
- WizardLMTeam/WizardLM-13B-V1.0
|
293 |
- WizardLMTeam/WizardLM-70B-V1.0
|
|
|
295 |
- Xwin-LM/Xwin-LM-13B-V0.2
|
296 |
- Xwin-LM/Xwin-LM-7B-V0.1
|
297 |
- Xwin-LM/Xwin-LM-7B-V0.2
|
298 |
+
- abacusai/Liberated-Qwen1.5-14B
|
299 |
- abacusai/Llama-3-Smaug-8B
|
300 |
- abacusai/Smaug-34B-v0.1
|
301 |
- abacusai/Smaug-72B-v0.1
|
|
|
323 |
- allenai/tulu-2-dpo-13b
|
324 |
- allenai/tulu-2-dpo-70b
|
325 |
- allenai/tulu-2-dpo-7b
|
326 |
+
- allknowingroger/MultiverseEx26-7B-slerp
|
327 |
- alpindale/WizardLM-2-8x22B
|
328 |
- alvarobartt/Mistral-7B-v0.1-ORPO
|
329 |
- alvarobartt/mistral-7b-orpo-alignment-handbook
|
|
|
344 |
- baichuan-inc/Baichuan2-7B-Base
|
345 |
- bardsai/jaskier-7b-dpo-v5.6
|
346 |
- bartowski/internlm2-chat-7b-llama
|
347 |
+
- beowolx/CodeNinja-1.0-OpenChat-7B
|
348 |
- berkeley-nest/Starling-LM-7B-alpha
|
349 |
- bigscience/bloom-1b7
|
350 |
- bigscience/bloom-3b
|
351 |
- bigscience/bloom-560m
|
352 |
- bigscience/bloom-7b1
|
353 |
- botbot-ai/Cabra-72b
|
354 |
+
- botbot-ai/CabraLlama3-70b
|
355 |
- botbot-ai/CabraLlama3-8b
|
356 |
- botbot-ai/CabraMistral-v3-7b-32k
|
357 |
- botbot-ai/CabraMixtral-8x7b
|
358 |
- cerebras/Cerebras-GPT-1.3B
|
359 |
- cerebras/Cerebras-GPT-111M
|
360 |
+
- cerebras/Cerebras-GPT-13B
|
361 |
- cerebras/Cerebras-GPT-2.7B
|
362 |
- cerebras/Cerebras-GPT-256M
|
363 |
- cerebras/Cerebras-GPT-590M
|
|
|
367 |
- chujiezheng/Llama-3-Instruct-8B-SimPO-ExPO
|
368 |
- chujiezheng/Smaug-34B-v0.1-ExPO
|
369 |
- cnmoro/Mistral-7B-Portuguese
|
370 |
+
- cognitivecomputations/WestLake-7B-v2-laser
|
371 |
- cognitivecomputations/WizardLM-13B-Uncensored
|
372 |
- cognitivecomputations/WizardLM-7B-Uncensored
|
373 |
- cognitivecomputations/dolphin-2.9-llama3-8b
|
374 |
+
- cognitivecomputations/dolphin-2.9.1-llama-3-70b
|
375 |
- cognitivecomputations/dolphin-2.9.1-mixtral-1x22b
|
376 |
- cognitivecomputations/dolphin-2.9.1-yi-1.5-34b
|
377 |
- cognitivecomputations/dolphin-2.9.1-yi-1.5-9b
|
378 |
- cognitivecomputations/dolphin-2.9.2-Phi-3-Medium
|
379 |
- cognitivecomputations/dolphin-2.9.2-Phi-3-Medium-abliterated
|
380 |
- cognitivecomputations/dolphin-2.9.2-qwen2-7b
|
381 |
+
- cognitivecomputations/dolphin-2.9.3-llama-3-8b
|
382 |
+
- cognitivecomputations/dolphin-2.9.3-mistral-7B-32k
|
383 |
+
- cognitivecomputations/dolphin-2.9.3-mistral-nemo-12b
|
384 |
+
- cognitivecomputations/openchat-3.5-0106-laser
|
385 |
+
- cognitivess/bella-1-8b
|
386 |
- cosmicvalor/mistral-orthogonalized
|
387 |
- croissantllm/CroissantLLMBase
|
388 |
- deepseek-ai/DeepSeek-V2-Lite
|
|
|
400 |
- eduagarcia/mistral-orpo-capybara-3k
|
401 |
- eduagarcia/mistral-orpo-mix-21k
|
402 |
- eduagarcia/mistral-orpo-mix-7k
|
403 |
+
- eduagarcia/zephyr-pt-Yi-1.5-9B-orpo-v0.1
|
404 |
+
- eduagarcia/zephyr-pt-Yi-1.5-9B-orpo-v0.2
|
405 |
+
- eduagarcia/zephyr-pt-Yi-1.5-9B-orpo-v0.3
|
406 |
+
- eduagarcia/zephyr-pt-Yi-1.5-9B-orpo-v0.4
|
407 |
+
- eduagarcia/zephyr-pt-Yi-1.5-9B-orpo-v0.5
|
408 |
+
- eduagarcia/zephyr-pt-Yi-1.5-9B-orpo-v0.6
|
409 |
+
- eduagarcia/zephyr-pt-llama-3-8B-orpo-v0.1
|
410 |
- eduagarcia/zephyr-pt-phi-3-mini-128k-dpo-v0.1
|
411 |
- eduagarcia/zephyr-pt-phi-3-mini-128k-orpo-v0.1
|
412 |
- eduagarcia/zephyr-pt-phi-3-mini-128k-sft-v0.1
|
|
|
429 |
- facebook/xglm-4.5B
|
430 |
- facebook/xglm-564M
|
431 |
- facebook/xglm-7.5B
|
432 |
+
- failspy/Codestral-22B-v0.1-abliterated-v3
|
433 |
- failspy/Meta-Llama-3-8B-Instruct-abliterated-v3
|
434 |
- failspy/Phi-3-medium-4k-instruct-abliterated-v3
|
435 |
- fblgit/UNA-SimpleSmaug-34b-v1beta
|
436 |
- fernandosola/bluearara-7B
|
437 |
- fernandosola/bluearara-7B-instruct
|
438 |
+
- freewheelin/free-solar-evo-v0.11
|
439 |
+
- ghost-x/ghost-8b-beta
|
440 |
- google/gemma-1.1-2b-it
|
441 |
- google/gemma-1.1-7b-it
|
442 |
+
- google/gemma-2-27b
|
443 |
+
- google/gemma-2-27b-it
|
444 |
+
- google/gemma-2-9b
|
445 |
+
- google/gemma-2-9b-it
|
446 |
- google/gemma-2b
|
447 |
- google/gemma-2b-it
|
448 |
- google/gemma-7b
|
|
|
459 |
- h2oai/h2o-danube2-1.8b-base
|
460 |
- h2oai/h2o-danube2-1.8b-chat
|
461 |
- h2oai/h2o-danube2-1.8b-sft
|
462 |
+
- h2oai/h2o-danube3-4b-base
|
463 |
+
- h2oai/h2o-danube3-500m-base
|
464 |
+
- h2oai/h2o-danube3-500m-chat
|
465 |
- haoranxu/ALMA-13B-Pretrain
|
466 |
- haoranxu/ALMA-13B-R
|
467 |
+
- haoranxu/ALMA-7B-R
|
468 |
- heloisy/zephyr-7b-b-cosmosqa-ptbr-text-v2
|
469 |
- heloisy/zephyr-7b-b-cosmosqa-ptbr-text-v3
|
470 |
- heloisy/zephyr-7b-cosmosqa-ptbr_text
|
|
|
474 |
- huggyllama/llama-30b
|
475 |
- huggyllama/llama-65b
|
476 |
- huggyllama/llama-7b
|
477 |
+
- ibivibiv/llama-3-nectar-dpo-8B
|
478 |
- ibivibiv/multimaster-7b-v6
|
479 |
- internlm/internlm-20b
|
480 |
- internlm/internlm-7b
|
|
|
490 |
- internlm/internlm2-chat-7b
|
491 |
- internlm/internlm2-chat-7b-sft
|
492 |
- internlm/internlm2-wqx-20b
|
493 |
+
- internlm/internlm2_5-7b
|
494 |
+
- internlm/internlm2_5-7b-chat
|
495 |
+
- internlm/internlm2_5-7b-chat-1m
|
496 |
- invalid-coder/Sakura-SOLAR-Instruct-CarbonVillain-en-10.7B-v2-slerp
|
497 |
- jeonsworld/CarbonVillain-en-10.7B-v4
|
498 |
- jondurbin/bagel-8b-v1.0
|
|
|
501 |
- josu/gpt-neo-pt-1.3B
|
502 |
- josu/gpt-neo-pt-br
|
503 |
- jsfs11/MixtureofMerges-MoE-4x7b-v4
|
504 |
+
- jsfs11/MixtureofMerges-MoE-4x7b-v5
|
505 |
- kaist-ai/mistral-orpo-capybara-7k
|
506 |
- kaitchup/Qwen1.5-7B-bnb-4bit
|
507 |
- kekmodel/StopCarbon-10.7B-v5
|
|
|
512 |
- lightblue/suzume-llama-3-8B-multilingual-orpo-borda-half
|
513 |
- lightblue/suzume-llama-3-8B-multilingual-orpo-borda-top25
|
514 |
- lightblue/suzume-llama-3-8B-multilingual-orpo-borda-top75
|
515 |
+
- liminerity/M7-7b
|
516 |
- lmsys/vicuna-13b-v1.5
|
517 |
- lmsys/vicuna-7b-v1.5
|
518 |
- lrds-code/boana-7b-instruct
|
519 |
- lrds-code/samba-1.1B
|
520 |
+
- lucianosb/boto-27B
|
521 |
- lucianosb/boto-7B
|
522 |
- lucianosb/boto-7B-v1.1
|
523 |
- lucianosb/boto-7B-v1.2
|
524 |
+
- lucianosb/boto-9B
|
525 |
+
- lucianosb/boto-9B-it
|
526 |
+
- macadeliccc/Samantha-Qwen-2-7B
|
527 |
- maritaca-ai/sabia-7b
|
528 |
- matheusrdgsf/cesar-ptbr
|
529 |
- matsuo-lab/weblab-10b
|
530 |
+
- maywell/Qwen2-7B-Multilingual-RP
|
531 |
- maywell/Synatra-7B-v0.3-RP
|
532 |
- meraGPT/mera-mix-4x7B
|
533 |
- meta-llama/Llama-2-13b-chat-hf
|
|
|
540 |
- meta-llama/Meta-Llama-3-70B-Instruct
|
541 |
- meta-llama/Meta-Llama-3-8B
|
542 |
- meta-llama/Meta-Llama-3-8B-Instruct
|
543 |
+
- meta-llama/Meta-Llama-3.1-70B
|
544 |
+
- meta-llama/Meta-Llama-3.1-70B-Instruct
|
545 |
+
- meta-llama/Meta-Llama-3.1-8B
|
546 |
+
- meta-llama/Meta-Llama-3.1-8B-Instruct
|
547 |
- microsoft/Phi-3-medium-128k-instruct
|
548 |
- microsoft/Phi-3-medium-4k-instruct
|
549 |
- microsoft/Phi-3-mini-128k-instruct
|
|
|
554 |
- microsoft/phi-1_5
|
555 |
- microsoft/phi-2
|
556 |
- migtissera/Tess-M-v1.3
|
557 |
+
- migtissera/Tess-v2.5-Phi-3-medium-128k-14B
|
558 |
- mistral-community/Mistral-7B-v0.2
|
559 |
- mistral-community/Mixtral-8x22B-Instruct-v0.1-4bit
|
560 |
- mistral-community/Mixtral-8x22B-v0.1-4bit
|
561 |
+
- mistralai/Codestral-22B-v0.1
|
562 |
- mistralai/Mistral-7B-Instruct-v0.1
|
563 |
- mistralai/Mistral-7B-Instruct-v0.2
|
564 |
- mistralai/Mistral-7B-Instruct-v0.3
|
565 |
- mistralai/Mistral-7B-v0.1
|
566 |
- mistralai/Mistral-7B-v0.3
|
567 |
+
- mistralai/Mistral-Nemo-Base-2407
|
568 |
+
- mistralai/Mistral-Nemo-Instruct-2407
|
569 |
- mistralai/Mixtral-8x22B-Instruct-v0.1
|
570 |
- mistralai/Mixtral-8x7B-Instruct-v0.1
|
571 |
- mistralai/Mixtral-8x7B-v0.1
|
572 |
- mlabonne/AlphaMonarch-7B
|
573 |
- mlabonne/Beyonder-4x7B-v3
|
574 |
+
- mlabonne/ChimeraLlama-3-8B-v3
|
575 |
- mlabonne/Daredevil-8B-abliterated
|
576 |
- mlabonne/Llama-3-8B-Instruct-abliterated-dpomix
|
577 |
- mlabonne/Monarch-7B
|
|
|
594 |
- nicolasdec/CabraQwen7b
|
595 |
- nicolasdec/Cabramistral7b
|
596 |
- nicolasdec/cabra13b
|
597 |
+
- nvidia/Nemotron-4-340B-Instruct
|
598 |
- openai-community/gpt2-large
|
599 |
- openai-community/gpt2-medium
|
600 |
- openai-community/gpt2-xl
|
|
|
611 |
- pedrogengo/gemma-ptbr
|
612 |
- pfnet/plamo-13b
|
613 |
- pierreguillou/gpt2-small-portuguese
|
614 |
+
- premai-io/prem-1B-chat
|
615 |
- princeton-nlp/Llama-3-Instruct-8B-SimPO
|
616 |
- princeton-nlp/Mistral-7B-Base-SFT-SimPO
|
617 |
- projecte-aina/FLOR-1.3B
|
|
|
668 |
- rhaymison/portuguese-tom-cat-13b
|
669 |
- rishiraj/CatPPT
|
670 |
- rishiraj/CatPPT-base
|
671 |
+
- rombodawg/Everyone-Coder-4x7b-Base
|
672 |
- royallab/ZephRP-m7b
|
673 |
- saltlux/luxia-21.4b-alignment-v1.0
|
674 |
- saltlux/luxia-21.4b-alignment-v1.2
|
|
|
697 |
- t5-small
|
698 |
- teknium/OpenHermes-2-Mistral-7B
|
699 |
- teknium/OpenHermes-2.5-Mistral-7B
|
700 |
+
- tensoropera/Fox-1-1.6B
|
701 |
+
- tensoropera/Fox-1-1.6B-Instruct-v0.1
|
702 |
- tiiuae/falcon-11B
|
703 |
- tiiuae/falcon-40b
|
704 |
- tiiuae/falcon-7b
|
705 |
+
- tobiaspires/command-r-p11-fn
|
706 |
- togethercomputer/RedPajama-INCITE-7B-Base
|
707 |
- togethercomputer/RedPajama-INCITE-Base-3B-v1
|
708 |
- unicamp-dl/ptt5-base-portuguese-vocab
|
|
|
719 |
- upstage/SOLAR-10.7B-Instruct-v1.0
|
720 |
- upstage/SOLAR-10.7B-v1.0
|
721 |
- uukuguy/speechless-code-mistral-7b-v1.0
|
722 |
+
- uukuguy/speechless-zephyr-code-functionary-7b
|
723 |
- uukuguy/zephyr-7b-alpha-dare-0.85
|
724 |
- uygarkurt/llama-3-merged-linear
|
725 |
+
- vicgalle/CarbonBeagle-11B
|
726 |
- vicgalle/CarbonBeagle-11B-truthy
|
727 |
- vicgalle/Configurable-Hermes-2-Pro-Llama-3-8B
|
728 |
- vicgalle/Configurable-Llama-3-8B-v0.3
|
|
|
742 |
- xverse/XVERSE-7B
|
743 |
- yahma/llama-7b-hf
|
744 |
- yunconglong/DARE_TIES_13B
|
745 |
+
- yunconglong/MoE_13B_DPO
|
746 |
- yunconglong/Truthful_DPO_TomGrc_FusionNet_7Bx2_MoE_13B
|
747 |
- zhengr/MixTAO-7Bx2-MoE-v8.1
|
748 |
---
|
model_list.txt
CHANGED
@@ -35,6 +35,12 @@
|
|
35 |
- BAAI/Aquila-7B
|
36 |
- BAAI/Aquila2-34B
|
37 |
- BAAI/Aquila2-7B
|
|
|
|
|
|
|
|
|
|
|
|
|
38 |
- Bruno/Caramelinho
|
39 |
- Bruno/Caramelo_7B
|
40 |
- CausalLM/34b-beta
|
@@ -43,11 +49,13 @@
|
|
43 |
- CohereForAI/aya-23-8B
|
44 |
- CohereForAI/c4ai-command-r-plus-4bit
|
45 |
- CohereForAI/c4ai-command-r-v01
|
|
|
46 |
- ConvexAI/Luminex-34B-v0.1
|
47 |
- ConvexAI/Luminex-34B-v0.2
|
48 |
- CultriX/NeuralMona_MoE-4x7B
|
49 |
- DAMO-NLP-MT/polylm-1.7b
|
50 |
- DAMO-NLP-MT/polylm-13b
|
|
|
51 |
- Danielbrdz/Barcenas-Llama3-8b-ORPO
|
52 |
- Deci/DeciLM-7B
|
53 |
- DeepMount00/Llama-3-8b-Ita
|
@@ -72,6 +80,13 @@
|
|
72 |
- EleutherAI/pythia-70m-deduped
|
73 |
- FuseAI/FuseChat-7B-VaRM
|
74 |
- FuseAI/OpenChat-3.5-7B-Solar
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
75 |
- GritLM/GritLM-7B
|
76 |
- GritLM/GritLM-7B-KTO
|
77 |
- GuiCas/Phituguese_FP16
|
@@ -79,6 +94,12 @@
|
|
79 |
- HuggingFaceH4/zephyr-7b-alpha
|
80 |
- HuggingFaceH4/zephyr-7b-beta
|
81 |
- HuggingFaceH4/zephyr-7b-gemma-v0.1
|
|
|
|
|
|
|
|
|
|
|
|
|
82 |
- HuggingFaceTB/cosmo-1b
|
83 |
- Intel/neural-chat-7b-v3-1
|
84 |
- Intel/neural-chat-7b-v3-3
|
@@ -91,17 +112,23 @@
|
|
91 |
- JJhooww/Qwen2-7B_reload_v1
|
92 |
- JosephusCheung/LL7M
|
93 |
- Kquant03/CognitiveFusion2-4x7B-BF16
|
|
|
94 |
- Kukedlc/NeuralLLaMa-3-8b-DT-v0.1
|
95 |
- Kukedlc/NeuralLLaMa-3-8b-ORPO-v0.3
|
96 |
- Kukedlc/NeuralLLaMa-3-8b-ORPO-v0.4
|
97 |
- Kukedlc/NeuralSynthesis-7B-v0.1
|
|
|
98 |
- Kukedlc/NeuralSynthesis-7b-v0.4-slerp
|
|
|
|
|
99 |
- M4-ai/tau-0.5B
|
100 |
- M4-ai/tau-0.5B-instruct-DPOP
|
101 |
- M4-ai/tau-1.8B
|
102 |
- MTSAIR/multi_verse_model
|
|
|
103 |
- MagusCorp/legislinho
|
104 |
- MaziyarPanahi/Calme-4x7B-MoE-v0.1
|
|
|
105 |
- MaziyarPanahi/Llama-3-8B-Instruct-v0.8
|
106 |
- MaziyarPanahi/Mistral-7B-Instruct-Aya-101
|
107 |
- MaziyarPanahi/Mistral-7B-Instruct-v0.3
|
@@ -109,9 +136,11 @@
|
|
109 |
- MaziyarPanahi/Topxtral-4x7B-v0.1
|
110 |
- MulaBR/Mula-4x160-v0.1
|
111 |
- MulaBR/Mula-8x160-v0.1
|
|
|
112 |
- NLPark/AnFeng_v3_Avocet
|
113 |
- NOVA-vision-language/GlorIA-1.3B
|
114 |
- Nexusflow/Starling-LM-7B-beta
|
|
|
115 |
- NotAiLOL/Yi-1.5-dolphin-9B
|
116 |
- NousResearch/Hermes-2-Pro-Llama-3-8B
|
117 |
- NousResearch/Hermes-2-Theta-Llama-3-8B
|
@@ -127,6 +156,7 @@
|
|
127 |
- Oburaco/llama2-qlora-finetunined-ptbr
|
128 |
- Oburaco/ptbr-falcon-7b
|
129 |
- Oburaco/ptbr-falcon-7b-v3
|
|
|
130 |
- OpenBuddy/openbuddy-qwen1.5-32b-v21.1-32k
|
131 |
- OpenBuddy/openbuddy-qwen1.5-32b-v21.2-32k
|
132 |
- OpenLLM-France/Claire-7B-0.1
|
@@ -164,17 +194,23 @@
|
|
164 |
- Qwen/Qwen1.5-MoE-A2.7B-Chat
|
165 |
- Qwen/Qwen2-0.5B
|
166 |
- Qwen/Qwen2-0.5B-Instruct
|
|
|
167 |
- Qwen/Qwen2-72B-Instruct
|
168 |
- Qwen/Qwen2-7B
|
169 |
- Qwen/Qwen2-7B-Instruct
|
170 |
- RLHFlow/LLaMA3-iterative-DPO-final
|
|
|
171 |
- Ramikan-BR/TiamaPY-v30
|
|
|
172 |
- Ramikan-BR/tinyllama-coder-py-4bit-v10
|
173 |
- Ramikan-BR/tinyllama-coder-py-v11
|
174 |
- Ramikan-BR/tinyllama-coder-py-v12
|
175 |
- RogerioPiazzon/alpaca-lora-ptbr-7b
|
|
|
176 |
- SakanaAI/DiscoPOP-zephyr-7b-gemma
|
|
|
177 |
- SeaLLMs/SeaLLM-7B-v2.5
|
|
|
178 |
- SinclairSchneider/zephyr-orpo-141b-A35b-v0.1-bnb-4bit
|
179 |
- Skywork/Skywork-13B-base
|
180 |
- THUDM/LongAlign-7B-64k
|
@@ -195,10 +231,18 @@
|
|
195 |
- TheBloke/zephyr-7B-beta-GPTQ
|
196 |
- TinyLlama/TinyLlama-1.1B-Chat-v1.0
|
197 |
- TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T
|
|
|
198 |
- TinyPixel/Llama-2-7B-bf16-sharded
|
|
|
|
|
|
|
|
|
|
|
|
|
199 |
- Unbabel/TowerBase-7B-v0.1
|
200 |
- VAGOsolutions/Llama-3-SauerkrautLM-8b-Instruct
|
201 |
- VAGOsolutions/SauerkrautLM-Gemma-7b
|
|
|
202 |
- VAGOsolutions/SauerkrautLM-Qwen-32b
|
203 |
- Walmart-the-bag/Misted-v2-7B
|
204 |
- Walmart-the-bag/Quintellect-10.7B
|
@@ -214,6 +258,7 @@
|
|
214 |
- Weni/ZeroShot-3.4.22-Mistral-7b-DPO-1.0.0
|
215 |
- Weni/ZeroShot-Multilanguage-Zephyr-7B
|
216 |
- Weyaxi/Bagel-Hermes-34B-Slerp
|
|
|
217 |
- Weyaxi/Nous-Hermes-2-SUS-Chat-34B-Slerp
|
218 |
- WizardLMTeam/WizardLM-13B-V1.0
|
219 |
- WizardLMTeam/WizardLM-70B-V1.0
|
@@ -221,6 +266,7 @@
|
|
221 |
- Xwin-LM/Xwin-LM-13B-V0.2
|
222 |
- Xwin-LM/Xwin-LM-7B-V0.1
|
223 |
- Xwin-LM/Xwin-LM-7B-V0.2
|
|
|
224 |
- abacusai/Llama-3-Smaug-8B
|
225 |
- abacusai/Smaug-34B-v0.1
|
226 |
- abacusai/Smaug-72B-v0.1
|
@@ -248,6 +294,7 @@
|
|
248 |
- allenai/tulu-2-dpo-13b
|
249 |
- allenai/tulu-2-dpo-70b
|
250 |
- allenai/tulu-2-dpo-7b
|
|
|
251 |
- alpindale/WizardLM-2-8x22B
|
252 |
- alvarobartt/Mistral-7B-v0.1-ORPO
|
253 |
- alvarobartt/mistral-7b-orpo-alignment-handbook
|
@@ -268,17 +315,20 @@
|
|
268 |
- baichuan-inc/Baichuan2-7B-Base
|
269 |
- bardsai/jaskier-7b-dpo-v5.6
|
270 |
- bartowski/internlm2-chat-7b-llama
|
|
|
271 |
- berkeley-nest/Starling-LM-7B-alpha
|
272 |
- bigscience/bloom-1b7
|
273 |
- bigscience/bloom-3b
|
274 |
- bigscience/bloom-560m
|
275 |
- bigscience/bloom-7b1
|
276 |
- botbot-ai/Cabra-72b
|
|
|
277 |
- botbot-ai/CabraLlama3-8b
|
278 |
- botbot-ai/CabraMistral-v3-7b-32k
|
279 |
- botbot-ai/CabraMixtral-8x7b
|
280 |
- cerebras/Cerebras-GPT-1.3B
|
281 |
- cerebras/Cerebras-GPT-111M
|
|
|
282 |
- cerebras/Cerebras-GPT-2.7B
|
283 |
- cerebras/Cerebras-GPT-256M
|
284 |
- cerebras/Cerebras-GPT-590M
|
@@ -288,15 +338,22 @@
|
|
288 |
- chujiezheng/Llama-3-Instruct-8B-SimPO-ExPO
|
289 |
- chujiezheng/Smaug-34B-v0.1-ExPO
|
290 |
- cnmoro/Mistral-7B-Portuguese
|
|
|
291 |
- cognitivecomputations/WizardLM-13B-Uncensored
|
292 |
- cognitivecomputations/WizardLM-7B-Uncensored
|
293 |
- cognitivecomputations/dolphin-2.9-llama3-8b
|
|
|
294 |
- cognitivecomputations/dolphin-2.9.1-mixtral-1x22b
|
295 |
- cognitivecomputations/dolphin-2.9.1-yi-1.5-34b
|
296 |
- cognitivecomputations/dolphin-2.9.1-yi-1.5-9b
|
297 |
- cognitivecomputations/dolphin-2.9.2-Phi-3-Medium
|
298 |
- cognitivecomputations/dolphin-2.9.2-Phi-3-Medium-abliterated
|
299 |
- cognitivecomputations/dolphin-2.9.2-qwen2-7b
|
|
|
|
|
|
|
|
|
|
|
300 |
- cosmicvalor/mistral-orthogonalized
|
301 |
- croissantllm/CroissantLLMBase
|
302 |
- deepseek-ai/DeepSeek-V2-Lite
|
@@ -314,6 +371,13 @@
|
|
314 |
- eduagarcia/mistral-orpo-capybara-3k
|
315 |
- eduagarcia/mistral-orpo-mix-21k
|
316 |
- eduagarcia/mistral-orpo-mix-7k
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
317 |
- eduagarcia/zephyr-pt-phi-3-mini-128k-dpo-v0.1
|
318 |
- eduagarcia/zephyr-pt-phi-3-mini-128k-orpo-v0.1
|
319 |
- eduagarcia/zephyr-pt-phi-3-mini-128k-sft-v0.1
|
@@ -336,13 +400,20 @@
|
|
336 |
- facebook/xglm-4.5B
|
337 |
- facebook/xglm-564M
|
338 |
- facebook/xglm-7.5B
|
|
|
339 |
- failspy/Meta-Llama-3-8B-Instruct-abliterated-v3
|
340 |
- failspy/Phi-3-medium-4k-instruct-abliterated-v3
|
341 |
- fblgit/UNA-SimpleSmaug-34b-v1beta
|
342 |
- fernandosola/bluearara-7B
|
343 |
- fernandosola/bluearara-7B-instruct
|
|
|
|
|
344 |
- google/gemma-1.1-2b-it
|
345 |
- google/gemma-1.1-7b-it
|
|
|
|
|
|
|
|
|
346 |
- google/gemma-2b
|
347 |
- google/gemma-2b-it
|
348 |
- google/gemma-7b
|
@@ -359,8 +430,12 @@
|
|
359 |
- h2oai/h2o-danube2-1.8b-base
|
360 |
- h2oai/h2o-danube2-1.8b-chat
|
361 |
- h2oai/h2o-danube2-1.8b-sft
|
|
|
|
|
|
|
362 |
- haoranxu/ALMA-13B-Pretrain
|
363 |
- haoranxu/ALMA-13B-R
|
|
|
364 |
- heloisy/zephyr-7b-b-cosmosqa-ptbr-text-v2
|
365 |
- heloisy/zephyr-7b-b-cosmosqa-ptbr-text-v3
|
366 |
- heloisy/zephyr-7b-cosmosqa-ptbr_text
|
@@ -370,6 +445,7 @@
|
|
370 |
- huggyllama/llama-30b
|
371 |
- huggyllama/llama-65b
|
372 |
- huggyllama/llama-7b
|
|
|
373 |
- ibivibiv/multimaster-7b-v6
|
374 |
- internlm/internlm-20b
|
375 |
- internlm/internlm-7b
|
@@ -385,6 +461,9 @@
|
|
385 |
- internlm/internlm2-chat-7b
|
386 |
- internlm/internlm2-chat-7b-sft
|
387 |
- internlm/internlm2-wqx-20b
|
|
|
|
|
|
|
388 |
- invalid-coder/Sakura-SOLAR-Instruct-CarbonVillain-en-10.7B-v2-slerp
|
389 |
- jeonsworld/CarbonVillain-en-10.7B-v4
|
390 |
- jondurbin/bagel-8b-v1.0
|
@@ -393,6 +472,7 @@
|
|
393 |
- josu/gpt-neo-pt-1.3B
|
394 |
- josu/gpt-neo-pt-br
|
395 |
- jsfs11/MixtureofMerges-MoE-4x7b-v4
|
|
|
396 |
- kaist-ai/mistral-orpo-capybara-7k
|
397 |
- kaitchup/Qwen1.5-7B-bnb-4bit
|
398 |
- kekmodel/StopCarbon-10.7B-v5
|
@@ -403,16 +483,22 @@
|
|
403 |
- lightblue/suzume-llama-3-8B-multilingual-orpo-borda-half
|
404 |
- lightblue/suzume-llama-3-8B-multilingual-orpo-borda-top25
|
405 |
- lightblue/suzume-llama-3-8B-multilingual-orpo-borda-top75
|
|
|
406 |
- lmsys/vicuna-13b-v1.5
|
407 |
- lmsys/vicuna-7b-v1.5
|
408 |
- lrds-code/boana-7b-instruct
|
409 |
- lrds-code/samba-1.1B
|
|
|
410 |
- lucianosb/boto-7B
|
411 |
- lucianosb/boto-7B-v1.1
|
412 |
- lucianosb/boto-7B-v1.2
|
|
|
|
|
|
|
413 |
- maritaca-ai/sabia-7b
|
414 |
- matheusrdgsf/cesar-ptbr
|
415 |
- matsuo-lab/weblab-10b
|
|
|
416 |
- maywell/Synatra-7B-v0.3-RP
|
417 |
- meraGPT/mera-mix-4x7B
|
418 |
- meta-llama/Llama-2-13b-chat-hf
|
@@ -425,6 +511,10 @@
|
|
425 |
- meta-llama/Meta-Llama-3-70B-Instruct
|
426 |
- meta-llama/Meta-Llama-3-8B
|
427 |
- meta-llama/Meta-Llama-3-8B-Instruct
|
|
|
|
|
|
|
|
|
428 |
- microsoft/Phi-3-medium-128k-instruct
|
429 |
- microsoft/Phi-3-medium-4k-instruct
|
430 |
- microsoft/Phi-3-mini-128k-instruct
|
@@ -435,19 +525,24 @@
|
|
435 |
- microsoft/phi-1_5
|
436 |
- microsoft/phi-2
|
437 |
- migtissera/Tess-M-v1.3
|
|
|
438 |
- mistral-community/Mistral-7B-v0.2
|
439 |
- mistral-community/Mixtral-8x22B-Instruct-v0.1-4bit
|
440 |
- mistral-community/Mixtral-8x22B-v0.1-4bit
|
|
|
441 |
- mistralai/Mistral-7B-Instruct-v0.1
|
442 |
- mistralai/Mistral-7B-Instruct-v0.2
|
443 |
- mistralai/Mistral-7B-Instruct-v0.3
|
444 |
- mistralai/Mistral-7B-v0.1
|
445 |
- mistralai/Mistral-7B-v0.3
|
|
|
|
|
446 |
- mistralai/Mixtral-8x22B-Instruct-v0.1
|
447 |
- mistralai/Mixtral-8x7B-Instruct-v0.1
|
448 |
- mistralai/Mixtral-8x7B-v0.1
|
449 |
- mlabonne/AlphaMonarch-7B
|
450 |
- mlabonne/Beyonder-4x7B-v3
|
|
|
451 |
- mlabonne/Daredevil-8B-abliterated
|
452 |
- mlabonne/Llama-3-8B-Instruct-abliterated-dpomix
|
453 |
- mlabonne/Monarch-7B
|
@@ -470,6 +565,7 @@
|
|
470 |
- nicolasdec/CabraQwen7b
|
471 |
- nicolasdec/Cabramistral7b
|
472 |
- nicolasdec/cabra13b
|
|
|
473 |
- openai-community/gpt2-large
|
474 |
- openai-community/gpt2-medium
|
475 |
- openai-community/gpt2-xl
|
@@ -486,6 +582,7 @@
|
|
486 |
- pedrogengo/gemma-ptbr
|
487 |
- pfnet/plamo-13b
|
488 |
- pierreguillou/gpt2-small-portuguese
|
|
|
489 |
- princeton-nlp/Llama-3-Instruct-8B-SimPO
|
490 |
- princeton-nlp/Mistral-7B-Base-SFT-SimPO
|
491 |
- projecte-aina/FLOR-1.3B
|
@@ -542,6 +639,7 @@
|
|
542 |
- rhaymison/portuguese-tom-cat-13b
|
543 |
- rishiraj/CatPPT
|
544 |
- rishiraj/CatPPT-base
|
|
|
545 |
- royallab/ZephRP-m7b
|
546 |
- saltlux/luxia-21.4b-alignment-v1.0
|
547 |
- saltlux/luxia-21.4b-alignment-v1.2
|
@@ -570,9 +668,12 @@
|
|
570 |
- t5-small
|
571 |
- teknium/OpenHermes-2-Mistral-7B
|
572 |
- teknium/OpenHermes-2.5-Mistral-7B
|
|
|
|
|
573 |
- tiiuae/falcon-11B
|
574 |
- tiiuae/falcon-40b
|
575 |
- tiiuae/falcon-7b
|
|
|
576 |
- togethercomputer/RedPajama-INCITE-7B-Base
|
577 |
- togethercomputer/RedPajama-INCITE-Base-3B-v1
|
578 |
- unicamp-dl/ptt5-base-portuguese-vocab
|
@@ -589,8 +690,10 @@
|
|
589 |
- upstage/SOLAR-10.7B-Instruct-v1.0
|
590 |
- upstage/SOLAR-10.7B-v1.0
|
591 |
- uukuguy/speechless-code-mistral-7b-v1.0
|
|
|
592 |
- uukuguy/zephyr-7b-alpha-dare-0.85
|
593 |
- uygarkurt/llama-3-merged-linear
|
|
|
594 |
- vicgalle/CarbonBeagle-11B-truthy
|
595 |
- vicgalle/Configurable-Hermes-2-Pro-Llama-3-8B
|
596 |
- vicgalle/Configurable-Llama-3-8B-v0.3
|
@@ -610,5 +713,6 @@
|
|
610 |
- xverse/XVERSE-7B
|
611 |
- yahma/llama-7b-hf
|
612 |
- yunconglong/DARE_TIES_13B
|
|
|
613 |
- yunconglong/Truthful_DPO_TomGrc_FusionNet_7Bx2_MoE_13B
|
614 |
- zhengr/MixTAO-7Bx2-MoE-v8.1
|
|
|
35 |
- BAAI/Aquila-7B
|
36 |
- BAAI/Aquila2-34B
|
37 |
- BAAI/Aquila2-7B
|
38 |
+
- BAAI/Infinity-Instruct-3M-0613-Mistral-7B
|
39 |
+
- BAAI/Infinity-Instruct-3M-0625-Llama3-8B
|
40 |
+
- BAAI/Infinity-Instruct-3M-0625-Mistral-7B
|
41 |
+
- BAAI/Infinity-Instruct-3M-0625-Qwen2-7B
|
42 |
+
- BAAI/Infinity-Instruct-3M-0625-Yi-1.5-9B
|
43 |
+
- BAAI/Infinity-Instruct-7M-0729-Llama3_1-8B
|
44 |
- Bruno/Caramelinho
|
45 |
- Bruno/Caramelo_7B
|
46 |
- CausalLM/34b-beta
|
|
|
49 |
- CohereForAI/aya-23-8B
|
50 |
- CohereForAI/c4ai-command-r-plus-4bit
|
51 |
- CohereForAI/c4ai-command-r-v01
|
52 |
+
- Columbia-NLP/LION-LLaMA-3-8b-odpo-v1.0
|
53 |
- ConvexAI/Luminex-34B-v0.1
|
54 |
- ConvexAI/Luminex-34B-v0.2
|
55 |
- CultriX/NeuralMona_MoE-4x7B
|
56 |
- DAMO-NLP-MT/polylm-1.7b
|
57 |
- DAMO-NLP-MT/polylm-13b
|
58 |
+
- Danielbrdz/Barcenas-14b-Phi-3-medium-ORPO
|
59 |
- Danielbrdz/Barcenas-Llama3-8b-ORPO
|
60 |
- Deci/DeciLM-7B
|
61 |
- DeepMount00/Llama-3-8b-Ita
|
|
|
80 |
- EleutherAI/pythia-70m-deduped
|
81 |
- FuseAI/FuseChat-7B-VaRM
|
82 |
- FuseAI/OpenChat-3.5-7B-Solar
|
83 |
+
- GeneZC/MiniChat-1.5-3B
|
84 |
+
- GeneZC/MiniChat-2-3B
|
85 |
+
- GeneZC/MiniChat-3B
|
86 |
+
- GeneZC/MiniLoong-3B
|
87 |
+
- GeneZC/MiniMA-2-1B
|
88 |
+
- GeneZC/MiniMA-2-3B
|
89 |
+
- GeneZC/MiniMA-3B
|
90 |
- GritLM/GritLM-7B
|
91 |
- GritLM/GritLM-7B-KTO
|
92 |
- GuiCas/Phituguese_FP16
|
|
|
94 |
- HuggingFaceH4/zephyr-7b-alpha
|
95 |
- HuggingFaceH4/zephyr-7b-beta
|
96 |
- HuggingFaceH4/zephyr-7b-gemma-v0.1
|
97 |
+
- HuggingFaceTB/SmolLM-1.7B
|
98 |
+
- HuggingFaceTB/SmolLM-1.7B-Instruct
|
99 |
+
- HuggingFaceTB/SmolLM-135M
|
100 |
+
- HuggingFaceTB/SmolLM-135M-Instruct
|
101 |
+
- HuggingFaceTB/SmolLM-360M
|
102 |
+
- HuggingFaceTB/SmolLM-360M-Instruct
|
103 |
- HuggingFaceTB/cosmo-1b
|
104 |
- Intel/neural-chat-7b-v3-1
|
105 |
- Intel/neural-chat-7b-v3-3
|
|
|
112 |
- JJhooww/Qwen2-7B_reload_v1
|
113 |
- JosephusCheung/LL7M
|
114 |
- Kquant03/CognitiveFusion2-4x7B-BF16
|
115 |
+
- Kukedlc/NeuralExperiment-7b-MagicCoder-v7.5
|
116 |
- Kukedlc/NeuralLLaMa-3-8b-DT-v0.1
|
117 |
- Kukedlc/NeuralLLaMa-3-8b-ORPO-v0.3
|
118 |
- Kukedlc/NeuralLLaMa-3-8b-ORPO-v0.4
|
119 |
- Kukedlc/NeuralSynthesis-7B-v0.1
|
120 |
+
- Kukedlc/NeuralSynthesis-7B-v0.3
|
121 |
- Kukedlc/NeuralSynthesis-7b-v0.4-slerp
|
122 |
+
- LiteAI/Hare-1.1B-Chat
|
123 |
+
- LiteAI/Hare-1.1B-base
|
124 |
- M4-ai/tau-0.5B
|
125 |
- M4-ai/tau-0.5B-instruct-DPOP
|
126 |
- M4-ai/tau-1.8B
|
127 |
- MTSAIR/multi_verse_model
|
128 |
+
- Magpie-Align/Llama-3-8B-Magpie-Align-v0.3
|
129 |
- MagusCorp/legislinho
|
130 |
- MaziyarPanahi/Calme-4x7B-MoE-v0.1
|
131 |
+
- MaziyarPanahi/Calme-4x7B-MoE-v0.2
|
132 |
- MaziyarPanahi/Llama-3-8B-Instruct-v0.8
|
133 |
- MaziyarPanahi/Mistral-7B-Instruct-Aya-101
|
134 |
- MaziyarPanahi/Mistral-7B-Instruct-v0.3
|
|
|
136 |
- MaziyarPanahi/Topxtral-4x7B-v0.1
|
137 |
- MulaBR/Mula-4x160-v0.1
|
138 |
- MulaBR/Mula-8x160-v0.1
|
139 |
+
- NLPark/AnFeng_v3.1-Avocet
|
140 |
- NLPark/AnFeng_v3_Avocet
|
141 |
- NOVA-vision-language/GlorIA-1.3B
|
142 |
- Nexusflow/Starling-LM-7B-beta
|
143 |
+
- Nos-PT/Carvalho_pt-gl-1.3B
|
144 |
- NotAiLOL/Yi-1.5-dolphin-9B
|
145 |
- NousResearch/Hermes-2-Pro-Llama-3-8B
|
146 |
- NousResearch/Hermes-2-Theta-Llama-3-8B
|
|
|
156 |
- Oburaco/llama2-qlora-finetunined-ptbr
|
157 |
- Oburaco/ptbr-falcon-7b
|
158 |
- Oburaco/ptbr-falcon-7b-v3
|
159 |
+
- OliveiraJLT/Sagui-7B-Instruct-v0.1
|
160 |
- OpenBuddy/openbuddy-qwen1.5-32b-v21.1-32k
|
161 |
- OpenBuddy/openbuddy-qwen1.5-32b-v21.2-32k
|
162 |
- OpenLLM-France/Claire-7B-0.1
|
|
|
194 |
- Qwen/Qwen1.5-MoE-A2.7B-Chat
|
195 |
- Qwen/Qwen2-0.5B
|
196 |
- Qwen/Qwen2-0.5B-Instruct
|
197 |
+
- Qwen/Qwen2-72B
|
198 |
- Qwen/Qwen2-72B-Instruct
|
199 |
- Qwen/Qwen2-7B
|
200 |
- Qwen/Qwen2-7B-Instruct
|
201 |
- RLHFlow/LLaMA3-iterative-DPO-final
|
202 |
+
- Ramikan-BR/Qwen2-0.5B-v5
|
203 |
- Ramikan-BR/TiamaPY-v30
|
204 |
+
- Ramikan-BR/TiamaPY-v31
|
205 |
- Ramikan-BR/tinyllama-coder-py-4bit-v10
|
206 |
- Ramikan-BR/tinyllama-coder-py-v11
|
207 |
- Ramikan-BR/tinyllama-coder-py-v12
|
208 |
- RogerioPiazzon/alpaca-lora-ptbr-7b
|
209 |
+
- RubielLabarta/LogoS-7Bx2-MoE-13B-v0.2
|
210 |
- SakanaAI/DiscoPOP-zephyr-7b-gemma
|
211 |
+
- SeaLLMs/SeaLLM-7B-v2
|
212 |
- SeaLLMs/SeaLLM-7B-v2.5
|
213 |
+
- SeaLLMs/SeaLLMs-v3-7B-Chat
|
214 |
- SinclairSchneider/zephyr-orpo-141b-A35b-v0.1-bnb-4bit
|
215 |
- Skywork/Skywork-13B-base
|
216 |
- THUDM/LongAlign-7B-64k
|
|
|
231 |
- TheBloke/zephyr-7B-beta-GPTQ
|
232 |
- TinyLlama/TinyLlama-1.1B-Chat-v1.0
|
233 |
- TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T
|
234 |
+
- TinyLlama/TinyLlama_v1.1
|
235 |
- TinyPixel/Llama-2-7B-bf16-sharded
|
236 |
+
- UCLA-AGI/Gemma-2-9B-It-SPPO-Iter2
|
237 |
+
- UCLA-AGI/Gemma-2-9B-It-SPPO-Iter3
|
238 |
+
- UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter2
|
239 |
+
- UCLA-AGI/Llama-3-Instruct-8B-SPPO-Iter3
|
240 |
+
- UCLA-AGI/Mistral7B-PairRM-SPPO-Iter2
|
241 |
+
- UCLA-AGI/Mistral7B-PairRM-SPPO-Iter3
|
242 |
- Unbabel/TowerBase-7B-v0.1
|
243 |
- VAGOsolutions/Llama-3-SauerkrautLM-8b-Instruct
|
244 |
- VAGOsolutions/SauerkrautLM-Gemma-7b
|
245 |
+
- VAGOsolutions/SauerkrautLM-Nemo-12b-Instruct
|
246 |
- VAGOsolutions/SauerkrautLM-Qwen-32b
|
247 |
- Walmart-the-bag/Misted-v2-7B
|
248 |
- Walmart-the-bag/Quintellect-10.7B
|
|
|
258 |
- Weni/ZeroShot-3.4.22-Mistral-7b-DPO-1.0.0
|
259 |
- Weni/ZeroShot-Multilanguage-Zephyr-7B
|
260 |
- Weyaxi/Bagel-Hermes-34B-Slerp
|
261 |
+
- Weyaxi/Einstein-v7-Qwen2-7B
|
262 |
- Weyaxi/Nous-Hermes-2-SUS-Chat-34B-Slerp
|
263 |
- WizardLMTeam/WizardLM-13B-V1.0
|
264 |
- WizardLMTeam/WizardLM-70B-V1.0
|
|
|
266 |
- Xwin-LM/Xwin-LM-13B-V0.2
|
267 |
- Xwin-LM/Xwin-LM-7B-V0.1
|
268 |
- Xwin-LM/Xwin-LM-7B-V0.2
|
269 |
+
- abacusai/Liberated-Qwen1.5-14B
|
270 |
- abacusai/Llama-3-Smaug-8B
|
271 |
- abacusai/Smaug-34B-v0.1
|
272 |
- abacusai/Smaug-72B-v0.1
|
|
|
294 |
- allenai/tulu-2-dpo-13b
|
295 |
- allenai/tulu-2-dpo-70b
|
296 |
- allenai/tulu-2-dpo-7b
|
297 |
+
- allknowingroger/MultiverseEx26-7B-slerp
|
298 |
- alpindale/WizardLM-2-8x22B
|
299 |
- alvarobartt/Mistral-7B-v0.1-ORPO
|
300 |
- alvarobartt/mistral-7b-orpo-alignment-handbook
|
|
|
315 |
- baichuan-inc/Baichuan2-7B-Base
|
316 |
- bardsai/jaskier-7b-dpo-v5.6
|
317 |
- bartowski/internlm2-chat-7b-llama
|
318 |
+
- beowolx/CodeNinja-1.0-OpenChat-7B
|
319 |
- berkeley-nest/Starling-LM-7B-alpha
|
320 |
- bigscience/bloom-1b7
|
321 |
- bigscience/bloom-3b
|
322 |
- bigscience/bloom-560m
|
323 |
- bigscience/bloom-7b1
|
324 |
- botbot-ai/Cabra-72b
|
325 |
+
- botbot-ai/CabraLlama3-70b
|
326 |
- botbot-ai/CabraLlama3-8b
|
327 |
- botbot-ai/CabraMistral-v3-7b-32k
|
328 |
- botbot-ai/CabraMixtral-8x7b
|
329 |
- cerebras/Cerebras-GPT-1.3B
|
330 |
- cerebras/Cerebras-GPT-111M
|
331 |
+
- cerebras/Cerebras-GPT-13B
|
332 |
- cerebras/Cerebras-GPT-2.7B
|
333 |
- cerebras/Cerebras-GPT-256M
|
334 |
- cerebras/Cerebras-GPT-590M
|
|
|
338 |
- chujiezheng/Llama-3-Instruct-8B-SimPO-ExPO
|
339 |
- chujiezheng/Smaug-34B-v0.1-ExPO
|
340 |
- cnmoro/Mistral-7B-Portuguese
|
341 |
+
- cognitivecomputations/WestLake-7B-v2-laser
|
342 |
- cognitivecomputations/WizardLM-13B-Uncensored
|
343 |
- cognitivecomputations/WizardLM-7B-Uncensored
|
344 |
- cognitivecomputations/dolphin-2.9-llama3-8b
|
345 |
+
- cognitivecomputations/dolphin-2.9.1-llama-3-70b
|
346 |
- cognitivecomputations/dolphin-2.9.1-mixtral-1x22b
|
347 |
- cognitivecomputations/dolphin-2.9.1-yi-1.5-34b
|
348 |
- cognitivecomputations/dolphin-2.9.1-yi-1.5-9b
|
349 |
- cognitivecomputations/dolphin-2.9.2-Phi-3-Medium
|
350 |
- cognitivecomputations/dolphin-2.9.2-Phi-3-Medium-abliterated
|
351 |
- cognitivecomputations/dolphin-2.9.2-qwen2-7b
|
352 |
+
- cognitivecomputations/dolphin-2.9.3-llama-3-8b
|
353 |
+
- cognitivecomputations/dolphin-2.9.3-mistral-7B-32k
|
354 |
+
- cognitivecomputations/dolphin-2.9.3-mistral-nemo-12b
|
355 |
+
- cognitivecomputations/openchat-3.5-0106-laser
|
356 |
+
- cognitivess/bella-1-8b
|
357 |
- cosmicvalor/mistral-orthogonalized
|
358 |
- croissantllm/CroissantLLMBase
|
359 |
- deepseek-ai/DeepSeek-V2-Lite
|
|
|
371 |
- eduagarcia/mistral-orpo-capybara-3k
|
372 |
- eduagarcia/mistral-orpo-mix-21k
|
373 |
- eduagarcia/mistral-orpo-mix-7k
|
374 |
+
- eduagarcia/zephyr-pt-Yi-1.5-9B-orpo-v0.1
|
375 |
+
- eduagarcia/zephyr-pt-Yi-1.5-9B-orpo-v0.2
|
376 |
+
- eduagarcia/zephyr-pt-Yi-1.5-9B-orpo-v0.3
|
377 |
+
- eduagarcia/zephyr-pt-Yi-1.5-9B-orpo-v0.4
|
378 |
+
- eduagarcia/zephyr-pt-Yi-1.5-9B-orpo-v0.5
|
379 |
+
- eduagarcia/zephyr-pt-Yi-1.5-9B-orpo-v0.6
|
380 |
+
- eduagarcia/zephyr-pt-llama-3-8B-orpo-v0.1
|
381 |
- eduagarcia/zephyr-pt-phi-3-mini-128k-dpo-v0.1
|
382 |
- eduagarcia/zephyr-pt-phi-3-mini-128k-orpo-v0.1
|
383 |
- eduagarcia/zephyr-pt-phi-3-mini-128k-sft-v0.1
|
|
|
400 |
- facebook/xglm-4.5B
|
401 |
- facebook/xglm-564M
|
402 |
- facebook/xglm-7.5B
|
403 |
+
- failspy/Codestral-22B-v0.1-abliterated-v3
|
404 |
- failspy/Meta-Llama-3-8B-Instruct-abliterated-v3
|
405 |
- failspy/Phi-3-medium-4k-instruct-abliterated-v3
|
406 |
- fblgit/UNA-SimpleSmaug-34b-v1beta
|
407 |
- fernandosola/bluearara-7B
|
408 |
- fernandosola/bluearara-7B-instruct
|
409 |
+
- freewheelin/free-solar-evo-v0.11
|
410 |
+
- ghost-x/ghost-8b-beta
|
411 |
- google/gemma-1.1-2b-it
|
412 |
- google/gemma-1.1-7b-it
|
413 |
+
- google/gemma-2-27b
|
414 |
+
- google/gemma-2-27b-it
|
415 |
+
- google/gemma-2-9b
|
416 |
+
- google/gemma-2-9b-it
|
417 |
- google/gemma-2b
|
418 |
- google/gemma-2b-it
|
419 |
- google/gemma-7b
|
|
|
430 |
- h2oai/h2o-danube2-1.8b-base
|
431 |
- h2oai/h2o-danube2-1.8b-chat
|
432 |
- h2oai/h2o-danube2-1.8b-sft
|
433 |
+
- h2oai/h2o-danube3-4b-base
|
434 |
+
- h2oai/h2o-danube3-500m-base
|
435 |
+
- h2oai/h2o-danube3-500m-chat
|
436 |
- haoranxu/ALMA-13B-Pretrain
|
437 |
- haoranxu/ALMA-13B-R
|
438 |
+
- haoranxu/ALMA-7B-R
|
439 |
- heloisy/zephyr-7b-b-cosmosqa-ptbr-text-v2
|
440 |
- heloisy/zephyr-7b-b-cosmosqa-ptbr-text-v3
|
441 |
- heloisy/zephyr-7b-cosmosqa-ptbr_text
|
|
|
445 |
- huggyllama/llama-30b
|
446 |
- huggyllama/llama-65b
|
447 |
- huggyllama/llama-7b
|
448 |
+
- ibivibiv/llama-3-nectar-dpo-8B
|
449 |
- ibivibiv/multimaster-7b-v6
|
450 |
- internlm/internlm-20b
|
451 |
- internlm/internlm-7b
|
|
|
461 |
- internlm/internlm2-chat-7b
|
462 |
- internlm/internlm2-chat-7b-sft
|
463 |
- internlm/internlm2-wqx-20b
|
464 |
+
- internlm/internlm2_5-7b
|
465 |
+
- internlm/internlm2_5-7b-chat
|
466 |
+
- internlm/internlm2_5-7b-chat-1m
|
467 |
- invalid-coder/Sakura-SOLAR-Instruct-CarbonVillain-en-10.7B-v2-slerp
|
468 |
- jeonsworld/CarbonVillain-en-10.7B-v4
|
469 |
- jondurbin/bagel-8b-v1.0
|
|
|
472 |
- josu/gpt-neo-pt-1.3B
|
473 |
- josu/gpt-neo-pt-br
|
474 |
- jsfs11/MixtureofMerges-MoE-4x7b-v4
|
475 |
+
- jsfs11/MixtureofMerges-MoE-4x7b-v5
|
476 |
- kaist-ai/mistral-orpo-capybara-7k
|
477 |
- kaitchup/Qwen1.5-7B-bnb-4bit
|
478 |
- kekmodel/StopCarbon-10.7B-v5
|
|
|
483 |
- lightblue/suzume-llama-3-8B-multilingual-orpo-borda-half
|
484 |
- lightblue/suzume-llama-3-8B-multilingual-orpo-borda-top25
|
485 |
- lightblue/suzume-llama-3-8B-multilingual-orpo-borda-top75
|
486 |
+
- liminerity/M7-7b
|
487 |
- lmsys/vicuna-13b-v1.5
|
488 |
- lmsys/vicuna-7b-v1.5
|
489 |
- lrds-code/boana-7b-instruct
|
490 |
- lrds-code/samba-1.1B
|
491 |
+
- lucianosb/boto-27B
|
492 |
- lucianosb/boto-7B
|
493 |
- lucianosb/boto-7B-v1.1
|
494 |
- lucianosb/boto-7B-v1.2
|
495 |
+
- lucianosb/boto-9B
|
496 |
+
- lucianosb/boto-9B-it
|
497 |
+
- macadeliccc/Samantha-Qwen-2-7B
|
498 |
- maritaca-ai/sabia-7b
|
499 |
- matheusrdgsf/cesar-ptbr
|
500 |
- matsuo-lab/weblab-10b
|
501 |
+
- maywell/Qwen2-7B-Multilingual-RP
|
502 |
- maywell/Synatra-7B-v0.3-RP
|
503 |
- meraGPT/mera-mix-4x7B
|
504 |
- meta-llama/Llama-2-13b-chat-hf
|
|
|
511 |
- meta-llama/Meta-Llama-3-70B-Instruct
|
512 |
- meta-llama/Meta-Llama-3-8B
|
513 |
- meta-llama/Meta-Llama-3-8B-Instruct
|
514 |
+
- meta-llama/Meta-Llama-3.1-70B
|
515 |
+
- meta-llama/Meta-Llama-3.1-70B-Instruct
|
516 |
+
- meta-llama/Meta-Llama-3.1-8B
|
517 |
+
- meta-llama/Meta-Llama-3.1-8B-Instruct
|
518 |
- microsoft/Phi-3-medium-128k-instruct
|
519 |
- microsoft/Phi-3-medium-4k-instruct
|
520 |
- microsoft/Phi-3-mini-128k-instruct
|
|
|
525 |
- microsoft/phi-1_5
|
526 |
- microsoft/phi-2
|
527 |
- migtissera/Tess-M-v1.3
|
528 |
+
- migtissera/Tess-v2.5-Phi-3-medium-128k-14B
|
529 |
- mistral-community/Mistral-7B-v0.2
|
530 |
- mistral-community/Mixtral-8x22B-Instruct-v0.1-4bit
|
531 |
- mistral-community/Mixtral-8x22B-v0.1-4bit
|
532 |
+
- mistralai/Codestral-22B-v0.1
|
533 |
- mistralai/Mistral-7B-Instruct-v0.1
|
534 |
- mistralai/Mistral-7B-Instruct-v0.2
|
535 |
- mistralai/Mistral-7B-Instruct-v0.3
|
536 |
- mistralai/Mistral-7B-v0.1
|
537 |
- mistralai/Mistral-7B-v0.3
|
538 |
+
- mistralai/Mistral-Nemo-Base-2407
|
539 |
+
- mistralai/Mistral-Nemo-Instruct-2407
|
540 |
- mistralai/Mixtral-8x22B-Instruct-v0.1
|
541 |
- mistralai/Mixtral-8x7B-Instruct-v0.1
|
542 |
- mistralai/Mixtral-8x7B-v0.1
|
543 |
- mlabonne/AlphaMonarch-7B
|
544 |
- mlabonne/Beyonder-4x7B-v3
|
545 |
+
- mlabonne/ChimeraLlama-3-8B-v3
|
546 |
- mlabonne/Daredevil-8B-abliterated
|
547 |
- mlabonne/Llama-3-8B-Instruct-abliterated-dpomix
|
548 |
- mlabonne/Monarch-7B
|
|
|
565 |
- nicolasdec/CabraQwen7b
|
566 |
- nicolasdec/Cabramistral7b
|
567 |
- nicolasdec/cabra13b
|
568 |
+
- nvidia/Nemotron-4-340B-Instruct
|
569 |
- openai-community/gpt2-large
|
570 |
- openai-community/gpt2-medium
|
571 |
- openai-community/gpt2-xl
|
|
|
582 |
- pedrogengo/gemma-ptbr
|
583 |
- pfnet/plamo-13b
|
584 |
- pierreguillou/gpt2-small-portuguese
|
585 |
+
- premai-io/prem-1B-chat
|
586 |
- princeton-nlp/Llama-3-Instruct-8B-SimPO
|
587 |
- princeton-nlp/Mistral-7B-Base-SFT-SimPO
|
588 |
- projecte-aina/FLOR-1.3B
|
|
|
639 |
- rhaymison/portuguese-tom-cat-13b
|
640 |
- rishiraj/CatPPT
|
641 |
- rishiraj/CatPPT-base
|
642 |
+
- rombodawg/Everyone-Coder-4x7b-Base
|
643 |
- royallab/ZephRP-m7b
|
644 |
- saltlux/luxia-21.4b-alignment-v1.0
|
645 |
- saltlux/luxia-21.4b-alignment-v1.2
|
|
|
668 |
- t5-small
|
669 |
- teknium/OpenHermes-2-Mistral-7B
|
670 |
- teknium/OpenHermes-2.5-Mistral-7B
|
671 |
+
- tensoropera/Fox-1-1.6B
|
672 |
+
- tensoropera/Fox-1-1.6B-Instruct-v0.1
|
673 |
- tiiuae/falcon-11B
|
674 |
- tiiuae/falcon-40b
|
675 |
- tiiuae/falcon-7b
|
676 |
+
- tobiaspires/command-r-p11-fn
|
677 |
- togethercomputer/RedPajama-INCITE-7B-Base
|
678 |
- togethercomputer/RedPajama-INCITE-Base-3B-v1
|
679 |
- unicamp-dl/ptt5-base-portuguese-vocab
|
|
|
690 |
- upstage/SOLAR-10.7B-Instruct-v1.0
|
691 |
- upstage/SOLAR-10.7B-v1.0
|
692 |
- uukuguy/speechless-code-mistral-7b-v1.0
|
693 |
+
- uukuguy/speechless-zephyr-code-functionary-7b
|
694 |
- uukuguy/zephyr-7b-alpha-dare-0.85
|
695 |
- uygarkurt/llama-3-merged-linear
|
696 |
+
- vicgalle/CarbonBeagle-11B
|
697 |
- vicgalle/CarbonBeagle-11B-truthy
|
698 |
- vicgalle/Configurable-Hermes-2-Pro-Llama-3-8B
|
699 |
- vicgalle/Configurable-Llama-3-8B-v0.3
|
|
|
713 |
- xverse/XVERSE-7B
|
714 |
- yahma/llama-7b-hf
|
715 |
- yunconglong/DARE_TIES_13B
|
716 |
+
- yunconglong/MoE_13B_DPO
|
717 |
- yunconglong/Truthful_DPO_TomGrc_FusionNet_7Bx2_MoE_13B
|
718 |
- zhengr/MixTAO-7Bx2-MoE-v8.1
|
update_models_in_readme.py
CHANGED
@@ -18,6 +18,7 @@ import json
|
|
18 |
|
19 |
snapshot_download(repo_id=QUEUE_REPO, local_dir=EVAL_REQUESTS_PATH, repo_type="dataset", tqdm_class=None, etag_timeout=30)
|
20 |
all_models = []
|
|
|
21 |
for filepath in glob.glob(os.path.join(EVAL_REQUESTS_PATH, '**/*.json'), recursive=True):
|
22 |
with open(filepath, 'r') as f:
|
23 |
model_data = json.load(f)
|
|
|
18 |
|
19 |
snapshot_download(repo_id=QUEUE_REPO, local_dir=EVAL_REQUESTS_PATH, repo_type="dataset", tqdm_class=None, etag_timeout=30)
|
20 |
all_models = []
|
21 |
+
all_models.append('nvidia/Nemotron-4-340B-Instruct')
|
22 |
for filepath in glob.glob(os.path.join(EVAL_REQUESTS_PATH, '**/*.json'), recursive=True):
|
23 |
with open(filepath, 'r') as f:
|
24 |
model_data = json.load(f)
|