{
  "architectures": [
    "AceCalisto3"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 1024,
  "initializer_range": 0.02,
  "intermediate_size": 4096,
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 512,
  "model_type": "acecalisto3",
  "num_attention_heads": 16,
  "num_hidden_layers": 24,
  "pad_token_id": 1,
  "vocab_size": 50257,
  "use_cache": true,
  "gradient_checkpointing": false,
  "is_decoder": true,
  "is_encoder_decoder": false,
  "tie_word_embeddings": false,
  "use_bias": true,
  "vocab_path": "vocab.json",
  "use_bf16": false,
  "use_fp16": false,
  "use_m32": false,
  "use_m64": false,
  "use_m128": false,
  "use_sharded_weights": false,
  "use_mps": false,
  "use_xpu": false,
  "use_tpu": false,
  "use_fast_gelu": false,
  "use_gelu_new": false,
  "torchscript": false,
  "load_in_8bit": false,
  "load_in_4bit": false,
  "quantization_config": {
    "bits": 8,
    "mode": "static",
    "use_fp16": false
  },
  "trust_remote_code": false,
  "use_slow_tokenizer": false,
  "revision": "main",
  "cache_dir": "./model_cache",
  "resume_download": true,
  "proxies": null,
  "local_files_only": false,
  "force_download": false,
  "token": null,
  "repo_id": "acecalisto3/InstructiPhi",
  "repo_type": "model",
  "use_cdn": true,
  "force_http": false,
  "max_retries": 5,
  "timeout": 60,
  "ignore_download_warnings": false,
  "offline_mode": false,
  "use_fast_tokenizer": true,
  "use_fast": true,
  "low_cpu": false,
  "pad_to_max_length": false,
  "model_max_length": 512,
  "model_kwargs": {}
}