Instructions to use Howard881010/epidemiology_sft_10000_mcq_2epoch with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- PEFT
How to use Howard881010/epidemiology_sft_10000_mcq_2epoch with PEFT:
```python
from peft import PeftModel
from transformers import AutoModelForCausalLM

base_model = AutoModelForCausalLM.from_pretrained("mistralai/Mistral-Nemo-Instruct-2407")
model = PeftModel.from_pretrained(base_model, "Howard881010/epidemiology_sft_10000_mcq_2epoch")
```
- Notebooks
- Google Colab
- Kaggle
| {"current_steps": 10, "total_steps": 450, "loss": 0.3008, "lr": 9.987820251299122e-05, "epoch": 0.044444444444444446, "percentage": 2.22, "elapsed_time": "0:02:02", "remaining_time": "1:30:03"} | |
| {"current_steps": 20, "total_steps": 450, "loss": 0.0061, "lr": 9.951340343707852e-05, "epoch": 0.08888888888888889, "percentage": 4.44, "elapsed_time": "0:04:05", "remaining_time": "1:28:05"} | |
| {"current_steps": 30, "total_steps": 450, "loss": 0.0042, "lr": 9.890738003669029e-05, "epoch": 0.13333333333333333, "percentage": 6.67, "elapsed_time": "0:06:08", "remaining_time": "1:26:04"} | |
| {"current_steps": 30, "total_steps": 450, "eval_loss": 0.004080221988260746, "epoch": 0.13333333333333333, "percentage": 6.67, "elapsed_time": "0:07:45", "remaining_time": "1:48:39"} | |
| {"current_steps": 40, "total_steps": 450, "loss": 0.0039, "lr": 9.806308479691595e-05, "epoch": 0.17777777777777778, "percentage": 8.89, "elapsed_time": "0:09:48", "remaining_time": "1:40:34"} | |
| {"current_steps": 50, "total_steps": 450, "loss": 0.0039, "lr": 9.698463103929542e-05, "epoch": 0.2222222222222222, "percentage": 11.11, "elapsed_time": "0:11:51", "remaining_time": "1:34:55"} | |
| {"current_steps": 60, "total_steps": 450, "loss": 0.0039, "lr": 9.567727288213005e-05, "epoch": 0.26666666666666666, "percentage": 13.33, "elapsed_time": "0:13:55", "remaining_time": "1:30:28"} | |
| {"current_steps": 60, "total_steps": 450, "eval_loss": 0.003909846767783165, "epoch": 0.26666666666666666, "percentage": 13.33, "elapsed_time": "0:15:31", "remaining_time": "1:40:57"} | |
| {"current_steps": 70, "total_steps": 450, "loss": 0.0039, "lr": 9.414737964294636e-05, "epoch": 0.3111111111111111, "percentage": 15.56, "elapsed_time": "0:17:35", "remaining_time": "1:35:27"} | |
| {"current_steps": 80, "total_steps": 450, "loss": 0.0039, "lr": 9.24024048078213e-05, "epoch": 0.35555555555555557, "percentage": 17.78, "elapsed_time": "0:19:38", "remaining_time": "1:30:49"} | |
| {"current_steps": 90, "total_steps": 450, "loss": 0.0039, "lr": 9.045084971874738e-05, "epoch": 0.4, "percentage": 20.0, "elapsed_time": "0:21:41", "remaining_time": "1:26:46"} | |
| {"current_steps": 90, "total_steps": 450, "eval_loss": 0.0038871022406965494, "epoch": 0.4, "percentage": 20.0, "elapsed_time": "0:23:18", "remaining_time": "1:33:13"} | |
| {"current_steps": 100, "total_steps": 450, "loss": 0.0039, "lr": 8.83022221559489e-05, "epoch": 0.4444444444444444, "percentage": 22.22, "elapsed_time": "0:25:21", "remaining_time": "1:28:45"} | |
| {"current_steps": 110, "total_steps": 450, "loss": 0.0039, "lr": 8.596699001693255e-05, "epoch": 0.4888888888888889, "percentage": 24.44, "elapsed_time": "0:27:24", "remaining_time": "1:24:44"} | |
| {"current_steps": 120, "total_steps": 450, "loss": 0.0039, "lr": 8.345653031794292e-05, "epoch": 0.5333333333333333, "percentage": 26.67, "elapsed_time": "0:29:27", "remaining_time": "1:21:01"} | |
| {"current_steps": 120, "total_steps": 450, "eval_loss": 0.0038501631934195757, "epoch": 0.5333333333333333, "percentage": 26.67, "elapsed_time": "0:31:04", "remaining_time": "1:25:28"} | |
| {"current_steps": 130, "total_steps": 450, "loss": 0.0038, "lr": 8.07830737662829e-05, "epoch": 0.5777777777777777, "percentage": 28.89, "elapsed_time": "0:33:07", "remaining_time": "1:21:33"} | |
| {"current_steps": 140, "total_steps": 450, "loss": 0.0037, "lr": 7.795964517353735e-05, "epoch": 0.6222222222222222, "percentage": 31.11, "elapsed_time": "0:35:10", "remaining_time": "1:17:54"} | |
| {"current_steps": 150, "total_steps": 450, "loss": 0.0033, "lr": 7.500000000000001e-05, "epoch": 0.6666666666666666, "percentage": 33.33, "elapsed_time": "0:37:14", "remaining_time": "1:14:28"} | |
| {"current_steps": 150, "total_steps": 450, "eval_loss": 0.0030691924039274454, "epoch": 0.6666666666666666, "percentage": 33.33, "elapsed_time": "0:38:51", "remaining_time": "1:17:42"} | |
| {"current_steps": 160, "total_steps": 450, "loss": 0.0031, "lr": 7.191855733945387e-05, "epoch": 0.7111111111111111, "percentage": 35.56, "elapsed_time": "0:40:54", "remaining_time": "1:14:08"} | |
| {"current_steps": 170, "total_steps": 450, "loss": 0.0031, "lr": 6.873032967079561e-05, "epoch": 0.7555555555555555, "percentage": 37.78, "elapsed_time": "0:42:57", "remaining_time": "1:10:45"} | |
| {"current_steps": 180, "total_steps": 450, "loss": 0.0029, "lr": 6.545084971874738e-05, "epoch": 0.8, "percentage": 40.0, "elapsed_time": "0:45:00", "remaining_time": "1:07:30"} | |
| {"current_steps": 180, "total_steps": 450, "eval_loss": 0.0029199642594903708, "epoch": 0.8, "percentage": 40.0, "elapsed_time": "0:46:37", "remaining_time": "1:09:56"} | |
| {"current_steps": 190, "total_steps": 450, "loss": 0.0029, "lr": 6.209609477998338e-05, "epoch": 0.8444444444444444, "percentage": 42.22, "elapsed_time": "0:48:40", "remaining_time": "1:06:36"} | |
| {"current_steps": 200, "total_steps": 450, "loss": 0.0028, "lr": 5.868240888334653e-05, "epoch": 0.8888888888888888, "percentage": 44.44, "elapsed_time": "0:50:43", "remaining_time": "1:03:24"} | |
| {"current_steps": 210, "total_steps": 450, "loss": 0.0028, "lr": 5.522642316338268e-05, "epoch": 0.9333333333333333, "percentage": 46.67, "elapsed_time": "0:52:47", "remaining_time": "1:00:19"} | |
| {"current_steps": 210, "total_steps": 450, "eval_loss": 0.002507995581254363, "epoch": 0.9333333333333333, "percentage": 46.67, "elapsed_time": "0:54:23", "remaining_time": "1:02:10"} | |
| {"current_steps": 220, "total_steps": 450, "loss": 0.0026, "lr": 5.174497483512506e-05, "epoch": 0.9777777777777777, "percentage": 48.89, "elapsed_time": "0:56:26", "remaining_time": "0:59:00"} | |
| {"current_steps": 230, "total_steps": 450, "loss": 0.0028, "lr": 4.825502516487497e-05, "epoch": 1.0222222222222221, "percentage": 51.11, "elapsed_time": "0:58:30", "remaining_time": "0:55:57"} | |
| {"current_steps": 240, "total_steps": 450, "loss": 0.0025, "lr": 4.477357683661734e-05, "epoch": 1.0666666666666667, "percentage": 53.33, "elapsed_time": "1:00:33", "remaining_time": "0:52:59"} | |
| {"current_steps": 240, "total_steps": 450, "eval_loss": 0.0024458724074065685, "epoch": 1.0666666666666667, "percentage": 53.33, "elapsed_time": "1:02:10", "remaining_time": "0:54:23"} | |
| {"current_steps": 250, "total_steps": 450, "loss": 0.0025, "lr": 4.131759111665349e-05, "epoch": 1.1111111111111112, "percentage": 55.56, "elapsed_time": "1:04:13", "remaining_time": "0:51:22"} | |
| {"current_steps": 260, "total_steps": 450, "loss": 0.0026, "lr": 3.790390522001662e-05, "epoch": 1.1555555555555554, "percentage": 57.78, "elapsed_time": "1:06:16", "remaining_time": "0:48:25"} | |
| {"current_steps": 270, "total_steps": 450, "loss": 0.0024, "lr": 3.4549150281252636e-05, "epoch": 1.2, "percentage": 60.0, "elapsed_time": "1:08:19", "remaining_time": "0:45:33"} | |
| {"current_steps": 270, "total_steps": 450, "eval_loss": 0.002419873373582959, "epoch": 1.2, "percentage": 60.0, "elapsed_time": "1:09:56", "remaining_time": "0:46:37"} | |
| {"current_steps": 280, "total_steps": 450, "loss": 0.0026, "lr": 3.12696703292044e-05, "epoch": 1.2444444444444445, "percentage": 62.22, "elapsed_time": "1:12:00", "remaining_time": "0:43:42"} | |
| {"current_steps": 290, "total_steps": 450, "loss": 0.0026, "lr": 2.8081442660546125e-05, "epoch": 1.2888888888888888, "percentage": 64.44, "elapsed_time": "1:14:03", "remaining_time": "0:40:51"} | |
| {"current_steps": 300, "total_steps": 450, "loss": 0.0027, "lr": 2.500000000000001e-05, "epoch": 1.3333333333333333, "percentage": 66.67, "elapsed_time": "1:16:06", "remaining_time": "0:38:03"} | |
| {"current_steps": 300, "total_steps": 450, "eval_loss": 0.0023624880705028772, "epoch": 1.3333333333333333, "percentage": 66.67, "elapsed_time": "1:17:43", "remaining_time": "0:38:51"} | |
| {"current_steps": 310, "total_steps": 450, "loss": 0.0024, "lr": 2.2040354826462668e-05, "epoch": 1.3777777777777778, "percentage": 68.89, "elapsed_time": "1:19:46", "remaining_time": "0:36:01"} | |
| {"current_steps": 320, "total_steps": 450, "loss": 0.0025, "lr": 1.9216926233717085e-05, "epoch": 1.4222222222222223, "percentage": 71.11, "elapsed_time": "1:21:49", "remaining_time": "0:33:14"} | |
| {"current_steps": 330, "total_steps": 450, "loss": 0.0025, "lr": 1.6543469682057106e-05, "epoch": 1.4666666666666668, "percentage": 73.33, "elapsed_time": "1:23:53", "remaining_time": "0:30:30"} | |
| {"current_steps": 330, "total_steps": 450, "eval_loss": 0.0022804364562034607, "epoch": 1.4666666666666668, "percentage": 73.33, "elapsed_time": "1:25:30", "remaining_time": "0:31:05"} | |
| {"current_steps": 340, "total_steps": 450, "loss": 0.0024, "lr": 1.4033009983067452e-05, "epoch": 1.511111111111111, "percentage": 75.56, "elapsed_time": "1:27:33", "remaining_time": "0:28:19"} | |
| {"current_steps": 350, "total_steps": 450, "loss": 0.0027, "lr": 1.1697777844051105e-05, "epoch": 1.5555555555555556, "percentage": 77.78, "elapsed_time": "1:29:36", "remaining_time": "0:25:36"} | |
| {"current_steps": 360, "total_steps": 450, "loss": 0.0023, "lr": 9.549150281252633e-06, "epoch": 1.6, "percentage": 80.0, "elapsed_time": "1:31:39", "remaining_time": "0:22:54"} | |
| {"current_steps": 360, "total_steps": 450, "eval_loss": 0.002201332012191415, "epoch": 1.6, "percentage": 80.0, "elapsed_time": "1:33:16", "remaining_time": "0:23:19"} | |
| {"current_steps": 370, "total_steps": 450, "loss": 0.0025, "lr": 7.597595192178702e-06, "epoch": 1.6444444444444444, "percentage": 82.22, "elapsed_time": "1:35:19", "remaining_time": "0:20:36"} | |
| {"current_steps": 380, "total_steps": 450, "loss": 0.0022, "lr": 5.852620357053651e-06, "epoch": 1.6888888888888889, "percentage": 84.44, "elapsed_time": "1:37:22", "remaining_time": "0:17:56"} | |
| {"current_steps": 390, "total_steps": 450, "loss": 0.0023, "lr": 4.322727117869951e-06, "epoch": 1.7333333333333334, "percentage": 86.67, "elapsed_time": "1:39:25", "remaining_time": "0:15:17"} | |
| {"current_steps": 390, "total_steps": 450, "eval_loss": 0.002075706608593464, "epoch": 1.7333333333333334, "percentage": 86.67, "elapsed_time": "1:41:02", "remaining_time": "0:15:32"} | |
| {"current_steps": 400, "total_steps": 450, "loss": 0.002, "lr": 3.0153689607045845e-06, "epoch": 1.7777777777777777, "percentage": 88.89, "elapsed_time": "1:43:05", "remaining_time": "0:12:53"} | |
| {"current_steps": 410, "total_steps": 450, "loss": 0.002, "lr": 1.9369152030840556e-06, "epoch": 1.8222222222222222, "percentage": 91.11, "elapsed_time": "1:45:09", "remaining_time": "0:10:15"} | |
| {"current_steps": 420, "total_steps": 450, "loss": 0.002, "lr": 1.0926199633097157e-06, "epoch": 1.8666666666666667, "percentage": 93.33, "elapsed_time": "1:47:12", "remaining_time": "0:07:39"} | |
| {"current_steps": 420, "total_steps": 450, "eval_loss": 0.0020291407126933336, "epoch": 1.8666666666666667, "percentage": 93.33, "elapsed_time": "1:48:49", "remaining_time": "0:07:46"} | |
| {"current_steps": 430, "total_steps": 450, "loss": 0.002, "lr": 4.865965629214819e-07, "epoch": 1.911111111111111, "percentage": 95.56, "elapsed_time": "1:50:52", "remaining_time": "0:05:09"} | |
| {"current_steps": 440, "total_steps": 450, "loss": 0.0025, "lr": 1.2179748700879012e-07, "epoch": 1.9555555555555557, "percentage": 97.78, "elapsed_time": "1:52:56", "remaining_time": "0:02:34"} | |
| {"current_steps": 450, "total_steps": 450, "loss": 0.0022, "lr": 0.0, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "1:54:59", "remaining_time": "0:00:00"} | |
| {"current_steps": 450, "total_steps": 450, "eval_loss": 0.0020088243763893843, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "1:56:36", "remaining_time": "0:00:00"} | |
| {"current_steps": 450, "total_steps": 450, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "1:56:37", "remaining_time": "0:00:00"} | |