neural-coder committed on
Commit
dfd954b
·
verified ·
1 Parent(s): 9d1f32f

Delete training_params.json

Browse files
Files changed (1) hide show
  1. training_params.json +0 -49
training_params.json DELETED
@@ -1,49 +0,0 @@
1
- {
2
- "model": "Team-ACE/ToolACE-2-Llama-3.1-8B",
3
- "project_name": "llama-3-8b-ft",
4
- "data_path": "llama-3-8b-ft/autotrain-data",
5
- "train_split": "train",
6
- "valid_split": null,
7
- "add_eos_token": true,
8
- "block_size": -1,
9
- "model_max_length": 2048,
10
- "padding": "right",
11
- "trainer": "sft",
12
- "use_flash_attention_2": false,
13
- "log": "none",
14
- "disable_gradient_checkpointing": false,
15
- "logging_steps": 5,
16
- "eval_strategy": "epoch",
17
- "save_total_limit": 3,
18
- "auto_find_batch_size": false,
19
- "mixed_precision": null,
20
- "lr": 5e-06,
21
- "epochs": 1,
22
- "batch_size": 1,
23
- "warmup_ratio": 0.1,
24
- "gradient_accumulation": 1,
25
- "optimizer": "adamw_torch",
26
- "scheduler": "cosine_with_restarts",
27
- "weight_decay": 0.0001,
28
- "max_grad_norm": 0.3,
29
- "seed": 42,
30
- "chat_template": null,
31
- "quantization": "int8",
32
- "target_modules": "q_proj,k_proj,v_proj,o_proj,gate_proj,up_proj,down_proj",
33
- "merge_adapter": true,
34
- "peft": true,
35
- "lora_r": 128,
36
- "lora_alpha": 256,
37
- "lora_dropout": 0.05,
38
- "model_ref": null,
39
- "dpo_beta": 0.1,
40
- "max_prompt_length": 128,
41
- "max_completion_length": null,
42
- "prompt_text_column": "autotrain_prompt",
43
- "text_column": "autotrain_text",
44
- "rejected_text_column": "autotrain_rejected_text",
45
- "push_to_hub": true,
46
- "username": "neural-coder",
47
- "unsloth": false,
48
- "distributed_backend": null
49
- }