Skip to content
Snippets Groups Projects
Commit cdc25d0f authored by zverkov
Browse files

Ptuned model

parent fdb36e31
No related branches found
No related tags found
No related merge requests found
{
"auto_mapping": null,
"base_model_name_or_path": "teknium/OpenHermes-2.5-Mistral-7B",
"encoder_dropout": 0.0,
"encoder_hidden_size": 128,
"encoder_num_layers": 2,
"encoder_reparameterization_type": "MLP",
"inference_mode": true,
"num_attention_heads": 32,
"num_layers": 32,
"num_transformer_submodules": 1,
"num_virtual_tokens": 20,
"peft_type": "P_TUNING",
"revision": null,
"task_type": "CAUSAL_LM",
"token_dim": 4096
}
\ No newline at end of file
File added
......@@ -24,7 +24,7 @@ class MistralAgent(object):
torch.cuda.manual_seed(0)
# model_name = "teknium/OpenHermes-2.5-Mistral-7B"
- adapter_model_id = "./agents/mistral_adapter"
+ adapter_model_id = "./agents/hermes_ptuned"
compute_dtype = getattr(torch, "float16")
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment