Instructions to use evgmaslov/Mistral-Nemo-Instruct-2407-cars with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- PEFT
How to use evgmaslov/Mistral-Nemo-Instruct-2407-cars with PEFT:
```python
from peft import PeftModel
from transformers import AutoModelForCausalLM

base_model = AutoModelForCausalLM.from_pretrained("mistralai/Mistral-Nemo-Instruct-2407")
model = PeftModel.from_pretrained(base_model, "evgmaslov/Mistral-Nemo-Instruct-2407-cars")
```
- Notebooks
- Google Colab
- Kaggle
Training in progress, step 300, checkpoint
Browse files
- last-checkpoint/adapter_model.safetensors +1 -1
- last-checkpoint/optimizer.pt +2 -2
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/rng_state_4.pth +1 -1
- last-checkpoint/rng_state_5.pth +1 -1
- last-checkpoint/rng_state_6.pth +1 -1
- last-checkpoint/rng_state_7.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +13 -5
last-checkpoint/adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 157308096
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af13b68fa43378eeb1d9477887e1f4b280a05be96737b5750839609cdd90a6d8
|
| 3 |
size 157308096
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8ab7c0f5a4a81699b122c49904d07e780819ce82f6ed8f06b2193f1320c4453f
|
| 3 |
+
size 314671226
|
last-checkpoint/rng_state_0.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15920
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9afbf9b2cc7ffb82e39603ea3e9793624776e974898f71cddb75c50b95a8ff20
|
| 3 |
size 15920
|
last-checkpoint/rng_state_1.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15920
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca4fa167ac420fbc12a0b1225ad375db648a55f16b7e4866651104ea0cc00a49
|
| 3 |
size 15920
|
last-checkpoint/rng_state_2.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15920
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e799329eb62e1eb372f5e1a106e0710d002dddfe0cb96b7478769d095e752b5f
|
| 3 |
size 15920
|
last-checkpoint/rng_state_3.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15920
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:148ecc351dae84aea8cdc86447e26d57a1165551634773232252cd35029fec44
|
| 3 |
size 15920
|
last-checkpoint/rng_state_4.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15920
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a6c737fa9218e50ea3ce9320b640c05dff0f18b8b0409fe5e3f6340fa144ae6f
|
| 3 |
size 15920
|
last-checkpoint/rng_state_5.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15920
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:40fdcad7ba51bcc458150b1d4b2c87d4dee4fcbb7619ccd347b91ff0f61763b2
|
| 3 |
size 15920
|
last-checkpoint/rng_state_6.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15920
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3d21b509f3e70f8a0fe13164c8b6d889c6ab04755a1218812e3a6427ea94537
|
| 3 |
size 15920
|
last-checkpoint/rng_state_7.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 15920
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1304350d7f8258aaa5c749bd82f5c7ddf08eafecb5eb5f18652eb3f7d1198b19
|
| 3 |
size 15920
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1d0bcc3306c506981564a07ff3b261b32731741ed53940e879827feb4c6814eb
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
{
|
| 2 |
-
"best_metric": 0.
|
| 3 |
-
"best_model_checkpoint": "evgmaslov/Mistral-Nemo-Instruct-2407-cars/checkpoint-
|
| 4 |
-
"epoch": 0.
|
| 5 |
"eval_steps": 100,
|
| 6 |
-
"global_step":
|
| 7 |
"is_hyper_param_search": false,
|
| 8 |
"is_local_process_zero": true,
|
| 9 |
"is_world_process_zero": true,
|
|
@@ -23,6 +23,14 @@
|
|
| 23 |
"eval_samples_per_second": 6.015,
|
| 24 |
"eval_steps_per_second": 0.376,
|
| 25 |
"step": 200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 26 |
}
|
| 27 |
],
|
| 28 |
"logging_steps": 500,
|
|
@@ -42,7 +50,7 @@
|
|
| 42 |
"attributes": {}
|
| 43 |
}
|
| 44 |
},
|
| 45 |
-
"total_flos":
|
| 46 |
"train_batch_size": 2,
|
| 47 |
"trial_name": null,
|
| 48 |
"trial_params": null
|
|
|
|
| 1 |
{
|
| 2 |
+
"best_metric": 0.05055840685963631,
|
| 3 |
+
"best_model_checkpoint": "evgmaslov/Mistral-Nemo-Instruct-2407-cars/checkpoint-300",
|
| 4 |
+
"epoch": 0.37546933667083854,
|
| 5 |
"eval_steps": 100,
|
| 6 |
+
"global_step": 300,
|
| 7 |
"is_hyper_param_search": false,
|
| 8 |
"is_local_process_zero": true,
|
| 9 |
"is_world_process_zero": true,
|
|
|
|
| 23 |
"eval_samples_per_second": 6.015,
|
| 24 |
"eval_steps_per_second": 0.376,
|
| 25 |
"step": 200
|
| 26 |
+
},
|
| 27 |
+
{
|
| 28 |
+
"epoch": 0.37546933667083854,
|
| 29 |
+
"eval_loss": 0.05055840685963631,
|
| 30 |
+
"eval_runtime": 5.3195,
|
| 31 |
+
"eval_samples_per_second": 6.016,
|
| 32 |
+
"eval_steps_per_second": 0.376,
|
| 33 |
+
"step": 300
|
| 34 |
}
|
| 35 |
],
|
| 36 |
"logging_steps": 500,
|
|
|
|
| 50 |
"attributes": {}
|
| 51 |
}
|
| 52 |
},
|
| 53 |
+
"total_flos": 3.425702422511616e+17,
|
| 54 |
"train_batch_size": 2,
|
| 55 |
"trial_name": null,
|
| 56 |
"trial_params": null
|