diff --git a/llama-factory/config/models/Qwen2.5-3B-Instruct.yaml b/llama-factory/config/models/Qwen2.5-3B-Instruct.yaml new file mode 100644 index 0000000000000000000000000000000000000000..c4636aee16d5a6d75509df72f281207c2f155831 --- /dev/null +++ b/llama-factory/config/models/Qwen2.5-3B-Instruct.yaml @@ -0,0 +1,43 @@ +### model +model_name_or_path: Qwen/Qwen2.5-3B-Instruct + +### method +stage: sft +do_train: true +finetuning_type: lora +lora_target: all + +### dataset +dataset: alpaca_mgtv_p2 +template: qwen +cutoff_len: 8192 +max_samples: 25000 +overwrite_cache: true +preprocessing_num_workers: 16 + +### output +output_dir: saves/Qwen2.5-3B-Instruct +logging_steps: 5 +save_steps: 35 +plot_loss: true +# overwrite_output_dir: true + +### train +per_device_train_batch_size: 16 +gradient_accumulation_steps: 8 +learning_rate: 1.0e-4 +num_train_epochs: 2.0 +lr_scheduler_type: cosine +warmup_ratio: 0.1 +bf16: true +ddp_timeout: 180000000 + +### eval +val_size: 0.1 +per_device_eval_batch_size: 1 +eval_strategy: steps +eval_steps: 35 + +# report_to: wandb +report_to: none +run_name: Qwen2.5-3B-Instruct_lora_sft diff --git a/llama-factory/config/models/Qwen2.5-7B-Instruct.yaml b/llama-factory/config/models/Qwen2.5-7B-Instruct.yaml new file mode 100644 index 0000000000000000000000000000000000000000..9c14bbeb73b1859b4ed83474d5a5becc2a9cf079 --- /dev/null +++ b/llama-factory/config/models/Qwen2.5-7B-Instruct.yaml @@ -0,0 +1,43 @@ +### model +model_name_or_path: Qwen/Qwen2.5-7B-Instruct + +### method +stage: sft +do_train: true +finetuning_type: lora +lora_target: all + +### dataset +dataset: alpaca_mgtv_p2 +template: qwen +cutoff_len: 8192 +max_samples: 25000 +overwrite_cache: true +preprocessing_num_workers: 16 + +### output +output_dir: saves/Qwen2.5-7B-Instruct +logging_steps: 5 +save_steps: 35 +plot_loss: true +# overwrite_output_dir: true + +### train +per_device_train_batch_size: 16 +gradient_accumulation_steps: 8 +learning_rate: 1.0e-4 +num_train_epochs: 2.0 +lr_scheduler_type: cosine +warmup_ratio: 0.1 +bf16: true +ddp_timeout: 180000000 + +### eval +val_size: 0.1 +per_device_eval_batch_size: 1 +eval_strategy: steps +eval_steps: 35 + +# report_to: wandb +report_to: none +run_name: Qwen2.5-7B-Instruct_lora_sft diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/README.md b/llama-factory/saves/Qwen2.5-3B-Instruct/README.md new file mode 100644 index 0000000000000000000000000000000000000000..3d3ba8007a2eb97b1da88e4fd5ae3c159e83e9a6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/README.md @@ -0,0 +1,73 @@ +--- +license: other +library_name: peft +tags: +- llama-factory +- lora +- generated_from_trainer +base_model: Qwen/Qwen2.5-3B-Instruct +model-index: +- name: Qwen2.5-3B-Instruct + results: [] +--- + + + +# Qwen2.5-3B-Instruct + +This model is a fine-tuned version of [Qwen/Qwen2.5-3B-Instruct](https://huggingface.co/Qwen/Qwen2.5-3B-Instruct) on the alpaca_mgtv_p2 dataset. +It achieves the following results on the evaluation set: +- Loss: 0.2272 + +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 0.0001 +- train_batch_size: 16 +- eval_batch_size: 1 +- seed: 42 +- gradient_accumulation_steps: 8 +- total_train_batch_size: 128 +- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08 +- lr_scheduler_type: cosine +- lr_scheduler_warmup_ratio: 0.1 +- num_epochs: 2.0 + +### Training results + +| Training Loss | Epoch | Step | Validation Loss | +|:-------------:|:------:|:----:|:---------------:| +| 0.3533 | 0.1990 | 35 | 0.3218 | +| 0.2926 | 0.3980 | 70 | 0.2747 | +| 0.277 | 0.5970 | 105 | 0.2519 | +| 0.2691 | 0.7960 | 140 | 0.2480 | +| 0.2597 | 0.9950 | 175 | 0.2401 | +| 0.2218 | 1.1940 | 210 | 0.2376 | +| 0.2594 | 1.3930 | 245 | 0.2271 | +| 0.2232 | 1.5920 | 280 | 0.2287 | +| 0.2145 | 1.7910 | 315 | 0.2291 | +| 0.2284 | 1.9900 | 350 | 0.2272 | + + +### Framework versions + +- PEFT 0.11.1 +- Transformers 4.43.3 +- Pytorch 2.4.0+cu121 +- Datasets 2.19.1 +- Tokenizers 0.19.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/adapter_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..03f49183e24abb461ddebc53b6eee34823b55388 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d680391ed23a325a2b7e6b51a17eb4dcb88cf61df37394e05b692c992356ca +size 725 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-3B-Instruct/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2c68459e47ae78072892c7f2184ea30a82ae493d --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:833899af6e9af5bb8a1c023a6502457c19c493606ba65cd9d6597b689ff23e32 +size 59933632 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/added_tokens.json b/llama-factory/saves/Qwen2.5-3B-Instruct/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/all_results.json b/llama-factory/saves/Qwen2.5-3B-Instruct/all_results.json new file mode 100644 index 0000000000000000000000000000000000000000..d339ed01af8a3065841af89e700a816a544c1cdd --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/all_results.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbd40c54055d514e430a719a0bf2a2b0f4b49ec7e20b8a6db48d1612d28a171d +size 366 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/README.md b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/README.md new file mode 100644 index 0000000000000000000000000000000000000000..0ccaae0d48afac305415af2524c8599ffb6a2a53 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-3B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/adapter_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..03f49183e24abb461ddebc53b6eee34823b55388 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d680391ed23a325a2b7e6b51a17eb4dcb88cf61df37394e05b692c992356ca +size 725 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..55d0f75e932d38c559ceaf2b97dbcdbffb7342c9 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47388c5e53572d952b4a8710caa6d32a842afa38fd5dc109d0ea86174639131c +size 59933632 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/added_tokens.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/merges.txt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/optimizer.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..130a1737de0da2060c547fbdeec8d9c9ec056b0e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b07158a18093274cb446983f77c98a4e0994470f525e1a42d5f6038d0d488262 +size 120158586 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/rng_state.pth b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..0a11d850e4f9ddde03041fb0f3247ef616fbda77 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d138cfe3a4adf21f048848ee35837c9a757a0a3616ff7adbb45b69aac247435 +size 14244 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/scheduler.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..31341807bd31628f4c98a98fdf9521811486cae0 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1df35574ae0ca5dc85d2b83a77932ee5ca941a642bbe53370339fdfdc60d04fe +size 1064 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/special_tokens_map.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/tokenizer.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/tokenizer_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/trainer_state.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..d80c2c62b2bb81f2ef66778d6e460be72df97832 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba681b4f5e5fd5e8d26acbecdc8b3a1b6a63bba736c8bf83d4eccead6590f628 +size 5010 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/training_args.bin b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..981f1f6f7f04ed3103d92392cee9deb2c11a7a77 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8ee63c342cd8f1feefb8bbe844c83b88e9da16a420145b45e5834855105c5a +size 5368 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/vocab.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-105/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/README.md b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/README.md new file mode 100644 index 0000000000000000000000000000000000000000..0ccaae0d48afac305415af2524c8599ffb6a2a53 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-3B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/adapter_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..03f49183e24abb461ddebc53b6eee34823b55388 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d680391ed23a325a2b7e6b51a17eb4dcb88cf61df37394e05b692c992356ca +size 725 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e229bc85ae3fac141b179252b3874ebab7967c34 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f2683d010df801251bddec17066f2a38243e46eb8aaf9d7f7dc34e4d01d3624 +size 59933632 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/added_tokens.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/merges.txt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/optimizer.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cc5ce3fc36c4358797a197e276cd22c92d37597 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d39f76226016291c4a1381f630eed60b8c5d5cea1a859d1e8af65de532475abd +size 120158586 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/rng_state.pth b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..06c25b71551e4830f82f7687d2345c7fbd987daa --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b3ee827a7a00012c0a116546df467feee35e70376d81a7a85b1a70eb90414d3 +size 14244 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/scheduler.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..61cce90db59762d086e6d3b6852a405fa6be19b9 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d84219d2b98872e152b7eefd22ea5f06fe28a80c80055cd7d460c7c6e20ea10 +size 1064 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/special_tokens_map.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/tokenizer.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/tokenizer_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/trainer_state.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..ed3bfb6c8bd8fed41d385d2540cfcdd34cd12e60 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d910db61d8d6a7019ed56759df96fd605a1ecc51c1bd83dbd6cbd8683fcb179f +size 6435 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/training_args.bin b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..981f1f6f7f04ed3103d92392cee9deb2c11a7a77 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8ee63c342cd8f1feefb8bbe844c83b88e9da16a420145b45e5834855105c5a +size 5368 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/vocab.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-140/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/README.md b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/README.md new file mode 100644 index 0000000000000000000000000000000000000000..0ccaae0d48afac305415af2524c8599ffb6a2a53 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-3B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/adapter_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..03f49183e24abb461ddebc53b6eee34823b55388 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d680391ed23a325a2b7e6b51a17eb4dcb88cf61df37394e05b692c992356ca +size 725 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..782b81ca395e41c779fae9afb9d9d0d840bc1bf0 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e342dbd975c5396f38767848a0fd9bbef7b68ad93236bc41e0c0ccbf2651f979 +size 59933632 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/added_tokens.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/merges.txt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/optimizer.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ab18bef1951ac6981388e3d53480467357ddd91 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d5ecc4cf15e7bff02ca7f99ad30e0baf82bb2a8783c01485594eaa14ee9d068 +size 120158586 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/rng_state.pth b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..41dfa7d7903dea42d227bad638c2c750928d590c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c062f7f375beded48b5337f5a3f3a5cb38807fa3e85dbf3e294c0ab6b627bfc2 +size 14244 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/scheduler.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..caf175aaec2f1527a696c358e4aa29e516403eb7 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c52b9ccde85457c1de9dfacdf0248d968713afb8256de2ba990f67de54c96d00 +size 1064 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/special_tokens_map.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/tokenizer.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/tokenizer_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/trainer_state.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..71b88e88225d956bcd838564a178d4f2f80f75f4 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9f4d824b13c70c35c23cac6b053c351b5d934779a5913195de5450c7b3d5b25 +size 7864 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/training_args.bin b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..981f1f6f7f04ed3103d92392cee9deb2c11a7a77 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8ee63c342cd8f1feefb8bbe844c83b88e9da16a420145b45e5834855105c5a +size 5368 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/vocab.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-175/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/README.md b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/README.md new file mode 100644 index 0000000000000000000000000000000000000000..0ccaae0d48afac305415af2524c8599ffb6a2a53 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-3B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/adapter_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..03f49183e24abb461ddebc53b6eee34823b55388 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d680391ed23a325a2b7e6b51a17eb4dcb88cf61df37394e05b692c992356ca +size 725 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..09a7ddd43f8cbabf14b7f049912213fe833db1ef --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fff8c5728ba148d975626e02702d269d776cc0cb90f52817660e0e3160d870f9 +size 59933632 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/added_tokens.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/merges.txt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/optimizer.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..507b2822d915eb823937ed0782c503a3fa81bc8c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b21eccee189f2aa1537fad6b8b1a4829a19509249480890d338f6f7a3263b858 +size 120158586 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/rng_state.pth b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..407e47abbdfb90afd3e1f979b5c0260135d2050e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9899ccda7f0d8d9511991180b93aab508ce6e8489de708c88ad1188e7e1d90d6 +size 14244 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/scheduler.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..419b1e14bcc9207421651855b0ff80e2794ef324 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:899dadd74ba016d8a701a0e5dc593ac31e21ddf1b80316db30ef9fa873894423 +size 1064 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/special_tokens_map.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/tokenizer.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/tokenizer_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/trainer_state.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..3ea409d7e27537a37cc42bbd14560d4c35e9763d --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d12f2d58485d6848dd314143163e8524ce31862792df27edcd9425ecc81e52ca +size 9287 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/training_args.bin b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..981f1f6f7f04ed3103d92392cee9deb2c11a7a77 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8ee63c342cd8f1feefb8bbe844c83b88e9da16a420145b45e5834855105c5a +size 5368 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/vocab.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-210/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/README.md b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/README.md new file mode 100644 index 0000000000000000000000000000000000000000..0ccaae0d48afac305415af2524c8599ffb6a2a53 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-3B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/adapter_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..03f49183e24abb461ddebc53b6eee34823b55388 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d680391ed23a325a2b7e6b51a17eb4dcb88cf61df37394e05b692c992356ca +size 725 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5d9723a169cb6b8ccedf6a282e784701f1bf22c4 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7312757482868afe20aa957d1d531d350f7fb46c9268af809825076cc6dda4d9 +size 59933632 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/added_tokens.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/merges.txt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/optimizer.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e9121bf9791b184d3d471802ecf9bd381a85438 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbff4b22dcfbe384a2032c33742185c8c27c60ac11fcc689eb5faf9116ce6099 +size 120158586 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/rng_state.pth b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..585f2a6a28a143f55b2a0574f949d7f87bb22a65 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48ee9b73399c28d7e668360bf1d5a4d11095c4738bf96c13f7bb6fbff59f8ccb +size 14244 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/scheduler.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..06881b899f23cfe38e114beffd6a2057ea8fadf6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bce9fd37ac7a73d2e522f6aa056fe3582cfe6e7367584d378837991de3ebbf16 +size 1064 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/special_tokens_map.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/tokenizer.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/tokenizer_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/trainer_state.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..dffe280bccd72f9082791d3636b8a72dc9a8f1ad --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c61aa0527623e25b5ec64936925dd55d78cdbe408b9e1d8f60fa87861d3f431 +size 10718 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/training_args.bin b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..981f1f6f7f04ed3103d92392cee9deb2c11a7a77 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8ee63c342cd8f1feefb8bbe844c83b88e9da16a420145b45e5834855105c5a +size 5368 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/vocab.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-245/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/README.md b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/README.md new file mode 100644 index 0000000000000000000000000000000000000000..0ccaae0d48afac305415af2524c8599ffb6a2a53 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-3B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/adapter_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..03f49183e24abb461ddebc53b6eee34823b55388 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d680391ed23a325a2b7e6b51a17eb4dcb88cf61df37394e05b692c992356ca +size 725 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4636c786b253c99623df85f73c5f5fa8d0a2cb5c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df3eb88d3fe3bade7129a8370bc75015339b1a94ba5f164789c08e499dbb622b +size 59933632 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/added_tokens.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/merges.txt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/optimizer.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..071f82c51d4e4a7c6d753e57551a567824edb68b --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc87df2fe9cd9892e9e9108ff4cbd52424abb7c840f17a6abf0b44c368778c8 +size 120158586 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/rng_state.pth b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..87383f4346e5c6eea0e725de97c392797ed938b5 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d245e05e72192c132e0f2edb6fdcae0c578c890f0fe912f17ec7b0bba2d38cc3 +size 14244 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/scheduler.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..8524c54f7e80c306ab69001ab3e5ce83c067a269 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48872d731120fe18674f751953b72c38d9a966768719eb9601a17faaf31a5957 +size 1064 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/special_tokens_map.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/tokenizer.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/tokenizer_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/trainer_state.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..d7a8ece4b0b841cad3974c4d79690a0bb05483f9 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65306c92e96dd85b99b030434b600e82b1cc754a5ae47540aa8fb91fdd4df1c1 +size 12149 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/training_args.bin b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..981f1f6f7f04ed3103d92392cee9deb2c11a7a77 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8ee63c342cd8f1feefb8bbe844c83b88e9da16a420145b45e5834855105c5a +size 5368 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/vocab.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-280/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/README.md b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/README.md new file mode 100644 index 0000000000000000000000000000000000000000..0ccaae0d48afac305415af2524c8599ffb6a2a53 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-3B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/adapter_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..03f49183e24abb461ddebc53b6eee34823b55388 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d680391ed23a325a2b7e6b51a17eb4dcb88cf61df37394e05b692c992356ca +size 725 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..02e271e020e80629eea131063d83dd76d68147dd --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:203188cca3f961aaf0510a667257fdc8b487ce8fad5c89db83ea528cf449d1b2 +size 59933632 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/added_tokens.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/merges.txt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/optimizer.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a83e9b098a4e90d60b696a54f4691ce9ffe3f5a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c46d4e83becfdb5ecbe22d2791c06b96f7db18dae5cbbc012457b7e2d0bf1a4f +size 120158586 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/rng_state.pth b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..87571ba044576778d1d6e555eff20ea04c20bbab --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5edb34d031c0c2b447f3eaadb401a4c1e7e7e6d8c096e28b7092e01a8bd48c92 +size 14244 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/scheduler.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e862fd38e2c7cdddf014a017679cfb606782bbfd --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d3743edaf33aa6d682b5e3cd55c73686d21dd7b15b0ef47ae54db03259173ce +size 1064 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/special_tokens_map.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/tokenizer.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/tokenizer_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/trainer_state.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..8d2365eac6806a6aa0b6b0f3b627e41d76bef804 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:396b8e537875112730d4f1eeed0e6fe6866d124a1410d22bb182e1968a60482f +size 13579 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/training_args.bin b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..981f1f6f7f04ed3103d92392cee9deb2c11a7a77 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8ee63c342cd8f1feefb8bbe844c83b88e9da16a420145b45e5834855105c5a +size 5368 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/vocab.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-315/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/README.md b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/README.md new file mode 100644 index 0000000000000000000000000000000000000000..0ccaae0d48afac305415af2524c8599ffb6a2a53 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-3B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/adapter_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..03f49183e24abb461ddebc53b6eee34823b55388 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d680391ed23a325a2b7e6b51a17eb4dcb88cf61df37394e05b692c992356ca +size 725 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dfb67b48cb06c7b3caf85f2e997df3bfe0690a90 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9155b39dd96f3be64b1c20cbf7007422416d94add481ad2014fd71dcef022a16 +size 59933632 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/added_tokens.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/merges.txt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/optimizer.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b9defdc1be1a7f1050f11ad535caf7daad4cb45 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e750ef489584d90ee66005c55b7cd7f7ba889ba2c4124732bc530f135096369a +size 120158586 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/rng_state.pth b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..33cefe6919222ddfa3c3946df69b8e5c5a17a0fc --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ff264f99d31b522cc7e2a4eac9d38606d0c58a34c0adc74d71e0ca8b371dc36 +size 14244 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/scheduler.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..73bbef1c4091057200c13a251b858c508a5f73cf --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:713eaf28d14874341960ad352a5374454ad5735a0a3ccca502696adbb018f8cd +size 1064 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/special_tokens_map.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/tokenizer.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/tokenizer_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/trainer_state.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..9ce6d553f81dba1a23bd7045131f63e37176b186 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:817ad183483cba9f325d43859d78d5af3e5c7ee4b1571a2672e4166aabca19f7 +size 2167 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/training_args.bin b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..981f1f6f7f04ed3103d92392cee9deb2c11a7a77 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8ee63c342cd8f1feefb8bbe844c83b88e9da16a420145b45e5834855105c5a +size 5368 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/vocab.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-35/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/README.md b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/README.md new file mode 100644 index 0000000000000000000000000000000000000000..0ccaae0d48afac305415af2524c8599ffb6a2a53 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-3B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/adapter_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..03f49183e24abb461ddebc53b6eee34823b55388 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d680391ed23a325a2b7e6b51a17eb4dcb88cf61df37394e05b692c992356ca +size 725 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..2c68459e47ae78072892c7f2184ea30a82ae493d --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:833899af6e9af5bb8a1c023a6502457c19c493606ba65cd9d6597b689ff23e32 +size 59933632 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/added_tokens.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/merges.txt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/optimizer.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea059e72a0d32ef5c044912547bac79aa43d4960 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59b3f5bb99711c441be073c4ce89dee32f488270ba37985d3691cb1b779cb543 +size 120158586 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/rng_state.pth b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..58d17c224a6607097f486f1f48f823a1a17c6ef9 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3e5d946241df2516b06d7074d8779088eae7607173ad780df56583910a9589b +size 14244 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/scheduler.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..f76c07a3f0e64c9417333cce47e5b470958a860d --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70732dec4f14211b78555ce1acfc091b59c12a05595924c42e5da10d3a62cd6d +size 1064 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/special_tokens_map.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/tokenizer.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/tokenizer_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/trainer_state.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..752d6e491b42a15d06f1bda911bd8fdb2a433805 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65e02ef34aed9cb0b8250b7d9f5bc5acfe6af36eb08422929f913301e65410b5 +size 14985 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/training_args.bin b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..981f1f6f7f04ed3103d92392cee9deb2c11a7a77 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8ee63c342cd8f1feefb8bbe844c83b88e9da16a420145b45e5834855105c5a +size 5368 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/vocab.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-350/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/README.md b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/README.md new file mode 100644 index 0000000000000000000000000000000000000000..0ccaae0d48afac305415af2524c8599ffb6a2a53 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-3B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/adapter_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..03f49183e24abb461ddebc53b6eee34823b55388 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84d680391ed23a325a2b7e6b51a17eb4dcb88cf61df37394e05b692c992356ca +size 725 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..16b6ac322d0b6d2f0b871ffb767e35a56bab951c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c55a67c9057857ea103177acafb00519d11ef94a857afabf1c1dad89a03a1ca +size 59933632 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/added_tokens.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/merges.txt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/optimizer.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7294e6d3468a782eb60f4a04a0dc30992c3b14e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac34c6196e4bdb5d24cdb40823d5aea5bc9327079ab34000803cd1fdac5d7e7f +size 120158586 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/rng_state.pth b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..323d589b0258d085c7a07b0c4f97b26796e865c5 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9196a1e708bf24d6abba41cce3f8558820acc3e50f9394c5955e29eb41ffea3d +size 14244 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/scheduler.pt b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..43271f9b860a5a3e1ca9e072a5f84047795b51de --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1a6560ee67f398abb4366caa0f28dce005bfe2be169777509fc1f459e63edc6 +size 1064 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/special_tokens_map.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/tokenizer.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/tokenizer_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/trainer_state.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..24d3f5500241ba3f0ceb6d8e63479e0717f5ebf2 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:214ec1114841e4e0b57a87a854b92fd589083501b17f90b079782b0da83a51c0 +size 3589 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/training_args.bin b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..981f1f6f7f04ed3103d92392cee9deb2c11a7a77 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8ee63c342cd8f1feefb8bbe844c83b88e9da16a420145b45e5834855105c5a +size 5368 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/vocab.json b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/checkpoint-70/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/eval_results.json b/llama-factory/saves/Qwen2.5-3B-Instruct/eval_results.json new file mode 100644 index 0000000000000000000000000000000000000000..d29f9f2c8d06f153aa4d3e1b9e94ace32610be77 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/eval_results.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93f6f0347df8fd22d9547a7d58e773d3b30819b653e6a9921fea7aa318fb6929 +size 177 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/merges.txt b/llama-factory/saves/Qwen2.5-3B-Instruct/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/special_tokens_map.json b/llama-factory/saves/Qwen2.5-3B-Instruct/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/tokenizer.json b/llama-factory/saves/Qwen2.5-3B-Instruct/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/tokenizer_config.json b/llama-factory/saves/Qwen2.5-3B-Instruct/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/train_results.json b/llama-factory/saves/Qwen2.5-3B-Instruct/train_results.json new file mode 100644 index 0000000000000000000000000000000000000000..796861c96d0877d586608f4e07a38d8b6cb6e1c5 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/train_results.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b3527ddf7539db4918f7ad445de7c126ef6b8e5562cf2bb70c252e65f898885 +size 224 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/trainer_log.jsonl b/llama-factory/saves/Qwen2.5-3B-Instruct/trainer_log.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e47d69f65e482830e91dea3c8aad8b7801945653 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/trainer_log.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cd698eedeabeea988e5a05d58d366522aa14b62031352699cc4871d92e98e77 +size 19576 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/trainer_state.json b/llama-factory/saves/Qwen2.5-3B-Instruct/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..4180977fe764b22c43fe4d05fd2e468bd4913f75 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0511d73e70e975bf8b14c26a3d8b202aa0bc128ab754fee6356bc098033b566 +size 15250 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/training_args.bin b/llama-factory/saves/Qwen2.5-3B-Instruct/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..981f1f6f7f04ed3103d92392cee9deb2c11a7a77 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b8ee63c342cd8f1feefb8bbe844c83b88e9da16a420145b45e5834855105c5a +size 5368 diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/training_eval_loss.png b/llama-factory/saves/Qwen2.5-3B-Instruct/training_eval_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..88ce096a0e95ab9b72efc6fee990df1f34ba6fff Binary files /dev/null and b/llama-factory/saves/Qwen2.5-3B-Instruct/training_eval_loss.png differ diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/training_loss.png b/llama-factory/saves/Qwen2.5-3B-Instruct/training_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..a27ad2791804da25102e5936dffa47b95fe947cd Binary files /dev/null and b/llama-factory/saves/Qwen2.5-3B-Instruct/training_loss.png differ diff --git a/llama-factory/saves/Qwen2.5-3B-Instruct/vocab.json b/llama-factory/saves/Qwen2.5-3B-Instruct/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-3B-Instruct/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/README.md b/llama-factory/saves/Qwen2.5-7B-Instruct/README.md new file mode 100644 index 0000000000000000000000000000000000000000..d0728964988ae7e4f69b383f0d5ffc92fce2e036 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/README.md @@ -0,0 +1,73 @@ +--- +license: other +library_name: peft +tags: +- llama-factory +- lora +- generated_from_trainer +base_model: Qwen/Qwen2.5-7B-Instruct +model-index: +- name: Qwen2.5-7B-Instruct + results: [] +--- + + + +# Qwen2.5-7B-Instruct + +This model is a fine-tuned version of [Qwen/Qwen2.5-7B-Instruct](https://huggingface.co/Qwen/Qwen2.5-7B-Instruct) on the alpaca_mgtv_p2 dataset. +It achieves the following results on the evaluation set: +- Loss: 0.2167 + +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 0.0001 +- train_batch_size: 16 +- eval_batch_size: 1 +- seed: 42 +- gradient_accumulation_steps: 8 +- total_train_batch_size: 128 +- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08 +- lr_scheduler_type: cosine +- lr_scheduler_warmup_ratio: 0.1 +- num_epochs: 2.0 + +### Training results + +| Training Loss | Epoch | Step | Validation Loss | +|:-------------:|:------:|:----:|:---------------:| +| 0.345 | 0.1990 | 35 | 0.3033 | +| 0.2741 | 0.3980 | 70 | 0.2615 | +| 0.2521 | 0.5970 | 105 | 0.2490 | +| 0.2631 | 0.7960 | 140 | 0.2443 | +| 0.242 | 0.9950 | 175 | 0.2242 | +| 0.2162 | 1.1940 | 210 | 0.2290 | +| 0.2395 | 1.3930 | 245 | 0.2209 | +| 0.2179 | 1.5920 | 280 | 0.2177 | +| 0.2109 | 1.7910 | 315 | 0.2156 | +| 0.2179 | 1.9900 | 350 | 0.2167 | + + +### Framework versions + +- PEFT 0.11.1 +- Transformers 4.43.3 +- Pytorch 2.4.0+cu121 +- Datasets 2.19.1 +- Tokenizers 0.19.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/adapter_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..61e1ca0933b6b165a54ea5f25c681e9c8efcf7ca --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc011490518ef823de33b3f4568e93a526c7cd6dc3da300f8a81c58080cb83c0 +size 725 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-7B-Instruct/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c1a624e9f42f2f50f9cf39aa27acb79a7bebedff --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de28c7c82e4785adaa27a74ad5c24dd086ea551bc22152501a979eefae8bd951 +size 80792096 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/added_tokens.json b/llama-factory/saves/Qwen2.5-7B-Instruct/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/all_results.json b/llama-factory/saves/Qwen2.5-7B-Instruct/all_results.json new file mode 100644 index 0000000000000000000000000000000000000000..d65ccfdb17deb5bcf5501be7489e1721cef43f32 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/all_results.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f354757c0f5e3ef2eed47380cd3cd5325e022f6e048266623fc35ec4a49bf3c +size 365 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/README.md b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/README.md new file mode 100644 index 0000000000000000000000000000000000000000..c706a035a44604a790ca8a761c4514546bae42bc --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-7B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/adapter_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..61e1ca0933b6b165a54ea5f25c681e9c8efcf7ca --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc011490518ef823de33b3f4568e93a526c7cd6dc3da300f8a81c58080cb83c0 +size 725 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..7120f62203928ceddb6070ec07c3aed8869c4d68 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da6a9ef647f558a71d0c6b33aa9203adf93419c8e4f80c5c8b194e45f7ab25d4 +size 80792096 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/added_tokens.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/merges.txt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/optimizer.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f5cb432337e42c466e33410ed07747db1736688 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:499e4391974225dc4941f96a7f0531597b2da5dd6f1b5475295686d5a00892a4 +size 161810282 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/rng_state.pth b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..0a11d850e4f9ddde03041fb0f3247ef616fbda77 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d138cfe3a4adf21f048848ee35837c9a757a0a3616ff7adbb45b69aac247435 +size 14244 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/scheduler.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..31341807bd31628f4c98a98fdf9521811486cae0 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1df35574ae0ca5dc85d2b83a77932ee5ca941a642bbe53370339fdfdc60d04fe +size 1064 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/special_tokens_map.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/tokenizer.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/tokenizer_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/trainer_state.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..d532e15403178e7c6b71bae7a63ac610d6e4722b --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6549aa906d130eb1030ee196805a5fc80005ccb1c3db2ce2cb1d8b49014d0446 +size 5003 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/training_args.bin b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..23a5f9953cc91f706c066c5411874b0478d6ec3c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039c4b57de20a49fd93bb328a7925705bf9d70e83568f1c084c3a5abf085e686 +size 5368 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/vocab.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-105/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/README.md b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/README.md new file mode 100644 index 0000000000000000000000000000000000000000..c706a035a44604a790ca8a761c4514546bae42bc --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-7B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/adapter_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..61e1ca0933b6b165a54ea5f25c681e9c8efcf7ca --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc011490518ef823de33b3f4568e93a526c7cd6dc3da300f8a81c58080cb83c0 +size 725 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c3311725edd84c2f196a7aa24383bcd65bca3afc --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d5149d4e278f167b5e3eaa05b6cb2b80fd2b8c8cba90f4891401061c557d413 +size 80792096 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/added_tokens.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/merges.txt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/optimizer.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..58c17d86f47433659edfa9fe038946bc597014ac --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6263d0c6a7141d0f5f977f7ca9f372c87dd38bae19d0e15f9a15e45838bc352 +size 161810282 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/rng_state.pth b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..06c25b71551e4830f82f7687d2345c7fbd987daa --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b3ee827a7a00012c0a116546df467feee35e70376d81a7a85b1a70eb90414d3 +size 14244 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/scheduler.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..61cce90db59762d086e6d3b6852a405fa6be19b9 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d84219d2b98872e152b7eefd22ea5f06fe28a80c80055cd7d460c7c6e20ea10 +size 1064 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/special_tokens_map.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/tokenizer.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/tokenizer_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/trainer_state.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..446a9cb219a911f6a83163ab91b7a73d83deddf4 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93a279ee56e5b28cc3f14c7c955e04ce13863bba68eb2328a8ba5a8265d57e64 +size 6426 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/training_args.bin b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..23a5f9953cc91f706c066c5411874b0478d6ec3c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039c4b57de20a49fd93bb328a7925705bf9d70e83568f1c084c3a5abf085e686 +size 5368 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/vocab.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-140/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/README.md b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/README.md new file mode 100644 index 0000000000000000000000000000000000000000..c706a035a44604a790ca8a761c4514546bae42bc --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-7B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/adapter_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..61e1ca0933b6b165a54ea5f25c681e9c8efcf7ca --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc011490518ef823de33b3f4568e93a526c7cd6dc3da300f8a81c58080cb83c0 +size 725 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e8b71ddc9ed8434d4086effcf891ac60665d5ffc --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7007ec3c5117990290b70a468fb4693f74f03d9c86817d10600f46ed65f36f26 +size 80792096 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/added_tokens.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/merges.txt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/optimizer.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d85a44968844395607c1c0b3a39945720412578 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bb7f85c217c405d3290cb37bb939bfc3c0eab6cfbe98a87f8d73d674d03efb1 +size 161810282 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/rng_state.pth b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..41dfa7d7903dea42d227bad638c2c750928d590c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c062f7f375beded48b5337f5a3f3a5cb38807fa3e85dbf3e294c0ab6b627bfc2 +size 14244 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/scheduler.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..caf175aaec2f1527a696c358e4aa29e516403eb7 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c52b9ccde85457c1de9dfacdf0248d968713afb8256de2ba990f67de54c96d00 +size 1064 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/special_tokens_map.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/tokenizer.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/tokenizer_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/trainer_state.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..bc1c2b3a6983b9f66632dae64744dc09bdc9d042 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6e54a35701ad3f3ee45943f08061ec28bac4c7197ff8bde0c42053ca00f5133 +size 7851 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/training_args.bin b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..23a5f9953cc91f706c066c5411874b0478d6ec3c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039c4b57de20a49fd93bb328a7925705bf9d70e83568f1c084c3a5abf085e686 +size 5368 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/vocab.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-175/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/README.md b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/README.md new file mode 100644 index 0000000000000000000000000000000000000000..c706a035a44604a790ca8a761c4514546bae42bc --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-7B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/adapter_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..61e1ca0933b6b165a54ea5f25c681e9c8efcf7ca --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc011490518ef823de33b3f4568e93a526c7cd6dc3da300f8a81c58080cb83c0 +size 725 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..9e7a4c36449087d2995a043a57269359740a7a72 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dad66c6518b8799af179dc4f0b949c69d611ef498f26ebe8f7ff6a932d7a77c9 +size 80792096 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/added_tokens.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/merges.txt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/optimizer.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0e053c0d98d142415ba5e0e8c888ce51fbbed97 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c6c40d434813f00dfb79c011c642e8d04c7b138a0262a2a762370757056c3db +size 161810282 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/rng_state.pth b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..407e47abbdfb90afd3e1f979b5c0260135d2050e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9899ccda7f0d8d9511991180b93aab508ce6e8489de708c88ad1188e7e1d90d6 +size 14244 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/scheduler.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..419b1e14bcc9207421651855b0ff80e2794ef324 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:899dadd74ba016d8a701a0e5dc593ac31e21ddf1b80316db30ef9fa873894423 +size 1064 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/special_tokens_map.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/tokenizer.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/tokenizer_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/trainer_state.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..07b405c55dda757337d50aa121621c0979e0a2f0 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:432ff1f4bed446c2d8d058bb53fa8cfa576503b5d16696e9cf844edee7881a32 +size 9279 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/training_args.bin b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..23a5f9953cc91f706c066c5411874b0478d6ec3c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039c4b57de20a49fd93bb328a7925705bf9d70e83568f1c084c3a5abf085e686 +size 5368 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/vocab.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-210/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/README.md b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/README.md new file mode 100644 index 0000000000000000000000000000000000000000..c706a035a44604a790ca8a761c4514546bae42bc --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-7B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/adapter_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..61e1ca0933b6b165a54ea5f25c681e9c8efcf7ca --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc011490518ef823de33b3f4568e93a526c7cd6dc3da300f8a81c58080cb83c0 +size 725 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..810c8229103b46646f9e36f4aa495876b8de0b67 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00d1d4413949074d097b60555a2b384269ceb76d05656abd676523996a3249df +size 80792096 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/added_tokens.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/merges.txt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/optimizer.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..f161009664c8fd601ab09845dfd576f44b74269f --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d993a7b8d9fdfef459caa8035a272a90c2968dd8f197c03d1be5b790fd6877b3 +size 161810282 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/rng_state.pth b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..585f2a6a28a143f55b2a0574f949d7f87bb22a65 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48ee9b73399c28d7e668360bf1d5a4d11095c4738bf96c13f7bb6fbff59f8ccb +size 14244 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/scheduler.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..06881b899f23cfe38e114beffd6a2057ea8fadf6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bce9fd37ac7a73d2e522f6aa056fe3582cfe6e7367584d378837991de3ebbf16 +size 1064 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/special_tokens_map.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/tokenizer.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/tokenizer_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/trainer_state.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..40d2867e8dc892b2637322ad1b846e53e7ae21dd --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14b69cda7b2deb31b1b01b4437c2674ab1611cc5a43807774aa6988e0afd0715 +size 10709 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/training_args.bin b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..23a5f9953cc91f706c066c5411874b0478d6ec3c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039c4b57de20a49fd93bb328a7925705bf9d70e83568f1c084c3a5abf085e686 +size 5368 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/vocab.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-245/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/README.md b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/README.md new file mode 100644 index 0000000000000000000000000000000000000000..c706a035a44604a790ca8a761c4514546bae42bc --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-7B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/adapter_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..61e1ca0933b6b165a54ea5f25c681e9c8efcf7ca --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc011490518ef823de33b3f4568e93a526c7cd6dc3da300f8a81c58080cb83c0 +size 725 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..fdf8c6ade0bb0545e021ff13aa9a2205c3bc39ff --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e0f8da2473d646e669b0115ec3767599a5e15ad719c0c13647f0deeb4ea1b69 +size 80792096 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/added_tokens.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/merges.txt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/optimizer.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..92c7dc6c55ec78392c34853171f66d06c5e38fd6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee7565f005e58f44512c1a484329e6e9892124823a03984dcbeaf7439b239a74 +size 161810282 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/rng_state.pth b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..87383f4346e5c6eea0e725de97c392797ed938b5 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d245e05e72192c132e0f2edb6fdcae0c578c890f0fe912f17ec7b0bba2d38cc3 +size 14244 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/scheduler.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..8524c54f7e80c306ab69001ab3e5ce83c067a269 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48872d731120fe18674f751953b72c38d9a966768719eb9601a17faaf31a5957 +size 1064 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/special_tokens_map.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/tokenizer.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/tokenizer_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/trainer_state.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..2e1056d3b2e5c86282c4bb53133b9b38798b3f12 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:456b10f422da2885f65f2f6b0ebd863493f2b24744b034769932bf95fe20d8b2 +size 12142 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/training_args.bin b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..23a5f9953cc91f706c066c5411874b0478d6ec3c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039c4b57de20a49fd93bb328a7925705bf9d70e83568f1c084c3a5abf085e686 +size 5368 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/vocab.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-280/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/README.md b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/README.md new file mode 100644 index 0000000000000000000000000000000000000000..c706a035a44604a790ca8a761c4514546bae42bc --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-7B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/adapter_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..61e1ca0933b6b165a54ea5f25c681e9c8efcf7ca --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc011490518ef823de33b3f4568e93a526c7cd6dc3da300f8a81c58080cb83c0 +size 725 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0cca12d080506374cebffd79714e219816b153cc --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec57d80c02d37b70b7525ba0a6d5a55c7d8d235b83367d4caa6750e53bfb7dbd +size 80792096 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/added_tokens.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/merges.txt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/optimizer.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f772333277204a6ef9afe288235c5626e837cd1 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7c9e504640518d802a9cca989a39091525d5b45446f2a3bb337dda0ddb76d0c +size 161810282 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/rng_state.pth b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..87571ba044576778d1d6e555eff20ea04c20bbab --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5edb34d031c0c2b447f3eaadb401a4c1e7e7e6d8c096e28b7092e01a8bd48c92 +size 14244 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/scheduler.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..e862fd38e2c7cdddf014a017679cfb606782bbfd --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d3743edaf33aa6d682b5e3cd55c73686d21dd7b15b0ef47ae54db03259173ce +size 1064 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/special_tokens_map.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/tokenizer.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/tokenizer_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/trainer_state.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..55fe2433cf1e2191cc2d0c78f9566b6378785e42 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be99ec418a3936f357be81d0cf3d0f4e11cc847ff2564b11887841bcb76ecde3 +size 13573 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/training_args.bin b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..23a5f9953cc91f706c066c5411874b0478d6ec3c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039c4b57de20a49fd93bb328a7925705bf9d70e83568f1c084c3a5abf085e686 +size 5368 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/vocab.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-315/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/README.md b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/README.md new file mode 100644 index 0000000000000000000000000000000000000000..c706a035a44604a790ca8a761c4514546bae42bc --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-7B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/adapter_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..61e1ca0933b6b165a54ea5f25c681e9c8efcf7ca --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc011490518ef823de33b3f4568e93a526c7cd6dc3da300f8a81c58080cb83c0 +size 725 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a81ec5a47762ffdaff20b37116eef0f997bbeecf --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6db2cdc0e01c3c5b25822b3be775d01a54c0c083349b7e72e39fe9c467d41939 +size 80792096 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/added_tokens.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/merges.txt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/optimizer.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb676dc8b40b6c1efa620de78d29ea7a31a38d09 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71a02f684333c48937dbff8fe6d149fbcac468cddefc5ba31e680ee25888e620 +size 161810282 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/rng_state.pth b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..33cefe6919222ddfa3c3946df69b8e5c5a17a0fc --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ff264f99d31b522cc7e2a4eac9d38606d0c58a34c0adc74d71e0ca8b371dc36 +size 14244 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/scheduler.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..73bbef1c4091057200c13a251b858c508a5f73cf --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:713eaf28d14874341960ad352a5374454ad5735a0a3ccca502696adbb018f8cd +size 1064 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/special_tokens_map.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/tokenizer.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/tokenizer_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/trainer_state.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..9dde316d325932cf646ee266787b4ae6dda34e1c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14129eba65f376102725f9d3f2b837f69470533af1027cc9aa3e86073a45a45e +size 2168 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/training_args.bin b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..23a5f9953cc91f706c066c5411874b0478d6ec3c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039c4b57de20a49fd93bb328a7925705bf9d70e83568f1c084c3a5abf085e686 +size 5368 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/vocab.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-35/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/README.md b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/README.md new file mode 100644 index 0000000000000000000000000000000000000000..c706a035a44604a790ca8a761c4514546bae42bc --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-7B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/adapter_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..61e1ca0933b6b165a54ea5f25c681e9c8efcf7ca --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc011490518ef823de33b3f4568e93a526c7cd6dc3da300f8a81c58080cb83c0 +size 725 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..c1a624e9f42f2f50f9cf39aa27acb79a7bebedff --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de28c7c82e4785adaa27a74ad5c24dd086ea551bc22152501a979eefae8bd951 +size 80792096 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/added_tokens.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/merges.txt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/optimizer.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..e55497bb6116414b4f153b31133b0035a612cb22 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6d1b61835c611e26d6f802adf379dbe70c6349026044a32737297c7ca7551b2 +size 161810282 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/rng_state.pth b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..58d17c224a6607097f486f1f48f823a1a17c6ef9 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3e5d946241df2516b06d7074d8779088eae7607173ad780df56583910a9589b +size 14244 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/scheduler.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..f76c07a3f0e64c9417333cce47e5b470958a860d --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70732dec4f14211b78555ce1acfc091b59c12a05595924c42e5da10d3a62cd6d +size 1064 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/special_tokens_map.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/tokenizer.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/tokenizer_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/trainer_state.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..80a1e35f9b349608d59c4c6e5d66742789ca2dd3 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5d5632fc6ae70b022f381d9d24ee80463d3af6e2ee5f115be0b896a8505b8e0 +size 14983 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/training_args.bin b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..23a5f9953cc91f706c066c5411874b0478d6ec3c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039c4b57de20a49fd93bb328a7925705bf9d70e83568f1c084c3a5abf085e686 +size 5368 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/vocab.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-350/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/README.md b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/README.md new file mode 100644 index 0000000000000000000000000000000000000000..c706a035a44604a790ca8a761c4514546bae42bc --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/README.md @@ -0,0 +1,202 @@ +--- +library_name: peft +base_model: Qwen/Qwen2.5-7B-Instruct +--- + +# Model Card for Model ID + + + + + +## Model Details + +### Model Description + + + + + +- **Developed by:** [More Information Needed] +- **Funded by [optional]:** [More Information Needed] +- **Shared by [optional]:** [More Information Needed] +- **Model type:** [More Information Needed] +- **Language(s) (NLP):** [More Information Needed] +- **License:** [More Information Needed] +- **Finetuned from model [optional]:** [More Information Needed] + +### Model Sources [optional] + + + +- **Repository:** [More Information Needed] +- **Paper [optional]:** [More Information Needed] +- **Demo [optional]:** [More Information Needed] + +## Uses + + + +### Direct Use + + + +[More Information Needed] + +### Downstream Use [optional] + + + +[More Information Needed] + +### Out-of-Scope Use + + + +[More Information Needed] + +## Bias, Risks, and Limitations + + + +[More Information Needed] + +### Recommendations + + + +Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations. + +## How to Get Started with the Model + +Use the code below to get started with the model. + +[More Information Needed] + +## Training Details + +### Training Data + + + +[More Information Needed] + +### Training Procedure + + + +#### Preprocessing [optional] + +[More Information Needed] + + +#### Training Hyperparameters + +- **Training regime:** [More Information Needed] + +#### Speeds, Sizes, Times [optional] + + + +[More Information Needed] + +## Evaluation + + + +### Testing Data, Factors & Metrics + +#### Testing Data + + + +[More Information Needed] + +#### Factors + + + +[More Information Needed] + +#### Metrics + + + +[More Information Needed] + +### Results + +[More Information Needed] + +#### Summary + + + +## Model Examination [optional] + + + +[More Information Needed] + +## Environmental Impact + + + +Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700). + +- **Hardware Type:** [More Information Needed] +- **Hours used:** [More Information Needed] +- **Cloud Provider:** [More Information Needed] +- **Compute Region:** [More Information Needed] +- **Carbon Emitted:** [More Information Needed] + +## Technical Specifications [optional] + +### Model Architecture and Objective + +[More Information Needed] + +### Compute Infrastructure + +[More Information Needed] + +#### Hardware + +[More Information Needed] + +#### Software + +[More Information Needed] + +## Citation [optional] + + + +**BibTeX:** + +[More Information Needed] + +**APA:** + +[More Information Needed] + +## Glossary [optional] + + + +[More Information Needed] + +## More Information [optional] + +[More Information Needed] + +## Model Card Authors [optional] + +[More Information Needed] + +## Model Card Contact + +[More Information Needed] +### Framework versions + +- PEFT 0.11.1 \ No newline at end of file diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/adapter_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/adapter_config.json new file mode 100644 index 0000000000000000000000000000000000000000..61e1ca0933b6b165a54ea5f25c681e9c8efcf7ca --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/adapter_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc011490518ef823de33b3f4568e93a526c7cd6dc3da300f8a81c58080cb83c0 +size 725 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/adapter_model.safetensors b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/adapter_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..cace93b31ab635a8ba1a4f5f23fa13952585a325 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/adapter_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdfba72ae23a8c2b484137c2820748edd02a7c509d98c22d35362e3c59743917 +size 80792096 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/added_tokens.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..cc13ea617def6b99e484e257e68cda43fa549161 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/added_tokens.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b54bbe36fc752f79a24a271ef66a0a0830054b4dfad94bde757d851968060b +size 605 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/merges.txt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/optimizer.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/optimizer.pt new file mode 100644 index 0000000000000000000000000000000000000000..476dc988cba93928e024dd51e600d7921dfc79d2 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/optimizer.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3ab196511bb8329679f082018baa6e06a1d67ebb513685c027efacd0abf2a72 +size 161810282 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/rng_state.pth b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/rng_state.pth new file mode 100644 index 0000000000000000000000000000000000000000..323d589b0258d085c7a07b0c4f97b26796e865c5 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/rng_state.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9196a1e708bf24d6abba41cce3f8558820acc3e50f9394c5955e29eb41ffea3d +size 14244 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/scheduler.pt b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/scheduler.pt new file mode 100644 index 0000000000000000000000000000000000000000..43271f9b860a5a3e1ca9e072a5f84047795b51de --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/scheduler.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1a6560ee67f398abb4366caa0f28dce005bfe2be169777509fc1f459e63edc6 +size 1064 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/special_tokens_map.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/tokenizer.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/tokenizer_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/trainer_state.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..b1ba37376540cb6fc66ecf4b771805a051076737 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ace5b1c1a4412392d394bcd6eaa7b1568170b342a437d27695d4bb509b08cc0 +size 3588 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/training_args.bin b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..23a5f9953cc91f706c066c5411874b0478d6ec3c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039c4b57de20a49fd93bb328a7925705bf9d70e83568f1c084c3a5abf085e686 +size 5368 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/vocab.json b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/checkpoint-70/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/eval_results.json b/llama-factory/saves/Qwen2.5-7B-Instruct/eval_results.json new file mode 100644 index 0000000000000000000000000000000000000000..a0098c049c0aa8d6d2a0613f5455e8a3aa0f2d5d --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/eval_results.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e408e4ecc64585ffcc3fcf24c751d803bcca5447b2a295e3b5bfd365f12fb19 +size 177 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/merges.txt b/llama-factory/saves/Qwen2.5-7B-Instruct/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..80c1a19fae38f8f4c9ab32cc9d4e145c241147e6 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8831e4f1a044471340f7c0a83d7bd71306a5b867e95fd870f74d0c5308a904d5 +size 1671853 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/special_tokens_map.json b/llama-factory/saves/Qwen2.5-7B-Instruct/special_tokens_map.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3f6af3ba18b7d721f02bdf3fbca2814b7eda35 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/special_tokens_map.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76862e765266b85aa9459767e33cbaf13970f327a0e88d1c65846c2ddd3a1ecd +size 613 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/tokenizer.json b/llama-factory/saves/Qwen2.5-7B-Instruct/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..7ebe2829a5954e029cfeb28ed919a1bd4096886a --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8506e7111b80c6d8635951a02eab0f4e1a8e4e5772da83846579e97b16f61bf +size 7031673 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/tokenizer_config.json b/llama-factory/saves/Qwen2.5-7B-Instruct/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..c81b15160a2b1f478a64526aaebb4596bdd6071e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/tokenizer_config.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca15adc168b881d165c75baa466706e504887a8867b86da3f83a851c76352686 +size 5246 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/train_results.json b/llama-factory/saves/Qwen2.5-7B-Instruct/train_results.json new file mode 100644 index 0000000000000000000000000000000000000000..9f7fcd0de4a6ac0f5a7b7b85e888bdd0a6df4904 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/train_results.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ceed29c2815ce1357c19eeb57aaa680a16b7072aabb0223324c747a474c029a +size 223 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/trainer_log.jsonl b/llama-factory/saves/Qwen2.5-7B-Instruct/trainer_log.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8b517eb49b7a735da79b08be51878694e9f57e5e --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/trainer_log.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a678c8c426e69ecfe230db8c437c7433bd42cbec7da01724e681acc7e3ba4744 +size 19573 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/trainer_state.json b/llama-factory/saves/Qwen2.5-7B-Instruct/trainer_state.json new file mode 100644 index 0000000000000000000000000000000000000000..7c3dfeefc941cd6e3dbfc91daf09518e28b8b2b8 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/trainer_state.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a7ebdad5abf91510e0fd1acc357a56796a9cf41c24bc50049bd23d2801b87ca +size 15247 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/training_args.bin b/llama-factory/saves/Qwen2.5-7B-Instruct/training_args.bin new file mode 100644 index 0000000000000000000000000000000000000000..23a5f9953cc91f706c066c5411874b0478d6ec3c --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/training_args.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039c4b57de20a49fd93bb328a7925705bf9d70e83568f1c084c3a5abf085e686 +size 5368 diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/training_eval_loss.png b/llama-factory/saves/Qwen2.5-7B-Instruct/training_eval_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..cced33a436380bd9593d2faedb1143d278bcd2b5 Binary files /dev/null and b/llama-factory/saves/Qwen2.5-7B-Instruct/training_eval_loss.png differ diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/training_loss.png b/llama-factory/saves/Qwen2.5-7B-Instruct/training_loss.png new file mode 100644 index 0000000000000000000000000000000000000000..f17d50717201af46804987ffcfc58b3a101f2caf Binary files /dev/null and b/llama-factory/saves/Qwen2.5-7B-Instruct/training_loss.png differ diff --git a/llama-factory/saves/Qwen2.5-7B-Instruct/vocab.json b/llama-factory/saves/Qwen2.5-7B-Instruct/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..6c49fc63bcb109de13abe49e58f85a4cdba7b679 --- /dev/null +++ b/llama-factory/saves/Qwen2.5-7B-Instruct/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca10d7e9fb3ed18575dd1e277a2579c16d108e32f27439684afa0e10b1440910 +size 2776833