rstudioweb's picture
Upload logs/6_log.txt with huggingface_hub
c7d2729 verified
raw
history blame
133 kB
Running 1 job
{
"type": "diffusion_trainer",
"training_folder": "/teamspace/studios/this_studio/ai-toolkit/output",
"sqlite_db_path": "/teamspace/studios/this_studio/ai-toolkit/aitk_db.db",
"device": "cuda",
"trigger_word": "xtishaz1",
"performance_log_every": 10,
"network": {
"type": "lora",
"linear": 32,
"linear_alpha": 32,
"conv": 16,
"conv_alpha": 16,
"lokr_full_rank": true,
"lokr_factor": -1,
"network_kwargs": {
"ignore_if_contains": []
}
},
"save": {
"dtype": "bf16",
"save_every": 500,
"max_step_saves_to_keep": 8,
"save_format": "diffusers",
"push_to_hub": false
},
"datasets": [
{
"folder_path": "/teamspace/studios/this_studio/ai-toolkit/datasets/nishani",
"mask_path": null,
"mask_min_value": 0.1,
"default_caption": "Indian 18y nude girl",
"caption_ext": "txt",
"caption_dropout_rate": 0.05,
"cache_latents_to_disk": false,
"is_reg": false,
"network_weight": 1,
"resolution": [
1024,
512,
768
],
"controls": [],
"shrink_video_to_frames": true,
"num_frames": 1,
"do_i2v": true,
"flip_x": false,
"flip_y": false
}
],
"train": {
"batch_size": 1,
"bypass_guidance_embedding": false,
"steps": 6000,
"gradient_accumulation": 1,
"train_unet": true,
"train_text_encoder": false,
"gradient_checkpointing": true,
"noise_scheduler": "flowmatch",
"optimizer": "adamw8bit",
"timestep_type": "weighted",
"content_or_style": "balanced",
"optimizer_params": {
"weight_decay": 0.0001
},
"unload_text_encoder": true,
"cache_text_embeddings": false,
"lr": 0.0001,
"ema_config": {
"use_ema": false,
"ema_decay": 0.99
},
"skip_first_sample": false,
"force_first_sample": false,
"disable_sampling": false,
"dtype": "bf16",
"diff_output_preservation": false,
"diff_output_preservation_multiplier": 1,
"diff_output_preservation_class": "person",
"switch_boundary_every": 1,
"loss_type": "mse",
"do_differential_guidance": true,
"differential_guidance_scale": 3
},
"model": {
"name_or_path": "Tongyi-MAI/Z-Image-Turbo",
"quantize": true,
"qtype": "qfloat8",
"quantize_te": true,
"qtype_te": "qfloat8",
"arch": "zimage:turbo",
"low_vram": true,
"model_kwargs": {},
"layer_offloading": false,
"layer_offloading_text_encoder_percent": 1,
"layer_offloading_transformer_percent": 1,
"assistant_lora_path": "ostris/zimage_turbo_training_adapter/zimage_turbo_training_adapter_v1.safetensors"
},
"sample": {
"sampler": "flowmatch",
"sample_every": 250,
"width": 1024,
"height": 1024,
"samples": [
{
"prompt": "xtishaz1, A young nude woman with a soft oval face shape, smooth light-to-medium warm skin tone, and clear glowing complexion, large expressive almond-shaped dark brown eyes, well-defined natural eyebrows, a small straight nose, and full pink lips with a gentle smile, long straight silky black hair styled with volume at the crown (slight puffed front) flowing past the shoulders, with a youthful, fresh, and naturally elegant appearance and balanced facial symmetry, is captured in a moment of intense intimacy as she leans forward with her eyes closed in pleasure, her tongue delicately exploring the base of a man\u2019s erect penis, her head tilted back slightly, her left hand gently cradling the back of her head while her right arm rests along his torso, the man\u2019s tattooed forearm adorned with a black dagger design rests possessively on her head, his body partially visible with defined musculature and natural body hair, the scene bathed in warm, golden-orange ambient lighting that casts soft shadows and highlights the contours of their skin, the background blurred into a smooth gradient of rich amber tones with subtle bokeh lights, creating a shallow depth of field that draws focus entirely to the couple\u2019s connection, the camera positioned at a close, slightly low angle to emphasize the intimacy and raw emotion of the moment, the woman\u2019s delicate gold hoop earring and thin gold chain necklace catching the light, adding a touch of elegance to the sensual scene, the overall composition exudes a sense of passion, trust, and natural beauty, rendered in ultra-high detail with a realistic, NSFW, adult, Z-Image Turbo optimized aesthetic."
},
{
"prompt": "xtishaz1, A young nude woman with a soft oval face shape, smooth light-to-medium warm skin tone, and clear glowing complexion, large expressive almond-shaped dark brown eyes, well-defined natural eyebrows, a small straight nose, and full pink lips with a gentle smile, long straight silky black hair styled with volume at the crown (slight puffed front) flowing past the shoulders, with a youthful, fresh, and naturally elegant appearance and balanced facial symmetry, is captured in a moment of intense intimacy, kneeling on a plush white quilted bed, her body arched gracefully as she leans forward, one hand resting possessively on her hip while the other is gently placed on her thigh, her skin glistening with natural moisture under the soft, diffused natural light filtering through sheer white curtains and a wooden-framed window in the background, the warm beige walls and a wicker basket subtly visible in the corner adding to the serene, private atmosphere, the camera angle is low and intimate, emphasizing the curves of her body and the sensual tension of the moment, the depth of field is shallow, blurring the background slightly to draw focus to her form and the subtle interplay of light and shadow across her skin, creating a highly detailed, realistic, NSFW, adult, Z-Image Turbo optimized scene that exudes passion, elegance, and natural beauty."
},
{
"prompt": "xtishaz1, Photo of a nude Indian woman 21y old with a soft oval face shape, smooth light-to-medium warm skin tone, and clear glowing complexion, large expressive almond-shaped dark brown eyes, well-defined natural eyebrows, a small straight nose, and full pink lips with a gentle smile, long straight silky black hair styled with volume at the crown (slight puffed front) flowing past the shoulders, with a youthful, fresh, and naturally elegant appearance and balanced facial symmetry, is captured in a moment of intense intimacy as she standing in a bedroom, facing the camera, medium wide shot, full body, black hair, dark eyes, medium breasts, slender physique, medium skin tone, brown eyes, dark eyebrows, small areola, standing with her legs together , perfect feet, hands at her sides, perfect fingers, visible clitoris, pussy, looking at the camera, natural lighting, bright and airy room, white walls, large window with sheer white curtains, white bed with a wooden frame, white bed linens, wooden floor, potted plant in the background, casual and relaxed pose, confident expression, soft shadows, high quality, jpeg artifacts, no watermark, perfectly optimized for Z-Image Turbo."
},
{
"prompt": "xtishaz1, A young nude woman with a soft oval face shape, smooth light-to-medium warm skin tone, and clear glowing complexion, large expressive almond-shaped dark brown eyes, well-defined natural eyebrows, a small straight nose, and full pink lips with a gentle smile, long straight silky black hair styled with volume at the crown (slight puffed front) flowing past the shoulders, with a youthful, fresh, and naturally elegant appearance and balanced facial symmetry, reclines provocatively atop a plush, deep purple satin couch, her legs spread wide in a bold, sensual pose that accentuates her curves and natural beauty, her tongue playfully extended in a teasing expression, the rich, velvety texture of the couch contrasting with the smooth, glistening skin of her body, the ambient lighting casting soft, warm highlights across her form, the background revealing a cozy, intimate room with a purple wall, a bookshelf filled with books and decorative items, and a vintage-style lamp casting a gentle glow, the depth of field keeps the focus sharply on her figure while softly blurring the background elements, creating a luxurious, NSFW, adult, Z-Image Turbo optimized scene that exudes confidence, allure, and raw sensuality."
},
{
"prompt": "xtishaz1, Photo of a Indian 21y woman with a soft oval face shape, smooth light-to-medium warm skin tone, and clear glowing complexion, large expressive almond-shaped dark brown eyes, well-defined natural eyebrows, a small straight nose, and full pink lips with a gentle smile, long straight silky black hair styled with volume at the crown (slight puffed front) flowing past the shoulders, with a youthful, fresh, and naturally elegant appearance and balanced facial symmetry, is captured in a moment of intense intimacy as she on her knees in a bathroom, giving a blowjob to a man standing in front of her. The woman has long black hair and a slender physique, with medium-sized breasts. The man is naked, with a large erected penis. The woman is performing oral sex on the man, with her eyes closed and her lips wrapped around his penis. The bathroom has a modern design, a wooden floor. The lighting is soft and warm, with a gentle glow on the woman's skin. The image is high quality and has a watermark in the bottom right corner"
}
],
"neg": "",
"seed": 42,
"walk_seed": true,
"guidance_scale": 1,
"sample_steps": 8,
"num_frames": 1,
"fps": 1
},
"logging": {
"log_every": 1,
"use_ui_logger": true
}
}
Using SQLite database at /teamspace/studios/this_studio/ai-toolkit/aitk_db.db
Job ID: "f7eb6cbb-a54a-4f3a-92b0-66455621336c"
#############################################
# Running job: my_first_lora_v6
#############################################
Running 1 process
Loading ZImage model
Loading transformer
Loading checkpoint shards: 0%| | 0/3 [00:00<?, ?it/s] Loading checkpoint shards: 0%| | 0/3 [00:00<?, ?it/s] Loading checkpoint shards: 33%|###3 | 1/3 [00:00<00:01, 1.22it/s] Loading checkpoint shards: 33%|###3 | 1/3 [00:00<00:01, 1.22it/s] Loading checkpoint shards: 67%|######6 | 2/3 [00:01<00:00, 1.20it/s] Loading checkpoint shards: 67%|######6 | 2/3 [00:01<00:00, 1.20it/s] Loading checkpoint shards: 100%|##########| 3/3 [00:05<00:00, 2.00s/it] Loading checkpoint shards: 100%|##########| 3/3 [00:05<00:00, 2.00s/it] Loading checkpoint shards: 100%|##########| 3/3 [00:05<00:00, 1.68s/it] Loading checkpoint shards: 100%|##########| 3/3 [00:05<00:00, 1.68s/it]
Loading assistant LoRA
create LoRA network. base dim (rank): 32, alpha: 32
neuron dropout: p=None, rank dropout: p=None, module dropout: p=None
create LoRA for Text Encoder: 0 modules.
create LoRA for U-Net: 276 modules.
enable LoRA for U-Net
Merging in assistant LoRA
Missing keys: []
Quantizing Transformer
- quantizing 30 transformer blocks
0%| | 0/30 [00:00<?, ?it/s] 0%| | 0/30 [00:00<?, ?it/s] 3%|3 | 1/30 [00:00<00:04, 6.58it/s] 3%|3 | 1/30 [00:00<00:04, 6.58it/s] 7%|6 | 2/30 [00:00<00:03, 7.79it/s] 7%|6 | 2/30 [00:00<00:03, 7.79it/s] 10%|# | 3/30 [00:00<00:03, 8.28it/s] 10%|# | 3/30 [00:00<00:03, 8.28it/s] 13%|#3 | 4/30 [00:00<00:03, 8.53it/s] 13%|#3 | 4/30 [00:00<00:03, 8.53it/s] 17%|#6 | 5/30 [00:00<00:02, 8.69it/s] 17%|#6 | 5/30 [00:00<00:02, 8.69it/s] 20%|## | 6/30 [00:00<00:02, 8.79it/s] 20%|## | 6/30 [00:00<00:02, 8.79it/s] 23%|##3 | 7/30 [00:00<00:02, 8.86it/s] 23%|##3 | 7/30 [00:00<00:02, 8.86it/s] 27%|##6 | 8/30 [00:00<00:02, 8.79it/s] 27%|##6 | 8/30 [00:00<00:02, 8.79it/s] 30%|### | 9/30 [00:01<00:02, 8.82it/s] 30%|### | 9/30 [00:01<00:02, 8.82it/s] 33%|###3 | 10/30 [00:01<00:02, 8.83it/s] 33%|###3 | 10/30 [00:01<00:02, 8.83it/s] 37%|###6 | 11/30 [00:01<00:02, 8.44it/s] 37%|###6 | 11/30 [00:01<00:02, 8.44it/s] 40%|#### | 12/30 [00:01<00:02, 8.44it/s] 40%|#### | 12/30 [00:01<00:02, 8.44it/s] 43%|####3 | 13/30 [00:01<00:01, 8.53it/s] 43%|####3 | 13/30 [00:01<00:01, 8.53it/s] 47%|####6 | 14/30 [00:01<00:01, 8.61it/s] 47%|####6 | 14/30 [00:01<00:01, 8.61it/s] 53%|#####3 | 16/30 [00:01<00:01, 9.00it/s] 53%|#####3 | 16/30 [00:01<00:01, 9.00it/s] 57%|#####6 | 17/30 [00:01<00:01, 8.94it/s] 57%|#####6 | 17/30 [00:01<00:01, 8.94it/s] 60%|###### | 18/30 [00:02<00:01, 8.88it/s] 60%|###### | 18/30 [00:02<00:01, 8.88it/s] 67%|######6 | 20/30 [00:02<00:01, 9.14it/s] 67%|######6 | 20/30 [00:02<00:01, 9.14it/s] 70%|####### | 21/30 [00:02<00:00, 9.05it/s] 70%|####### | 21/30 [00:02<00:00, 9.05it/s] 73%|#######3 | 22/30 [00:02<00:00, 8.98it/s] 73%|#######3 | 22/30 [00:02<00:00, 8.98it/s] 77%|#######6 | 23/30 [00:02<00:00, 8.94it/s] 77%|#######6 | 23/30 [00:02<00:00, 8.94it/s] 80%|######## | 24/30 [00:02<00:00, 8.92it/s] 80%|######## | 24/30 [00:02<00:00, 8.92it/s] 83%|########3 | 25/30 [00:02<00:00, 8.90it/s] 83%|########3 | 25/30 [00:02<00:00, 8.90it/s] 87%|########6 | 26/30 [00:02<00:00, 8.84it/s] 87%|########6 | 26/30 [00:02<00:00, 8.84it/s] 90%|######### | 27/30 [00:03<00:00, 8.61it/s] 90%|######### | 27/30 [00:03<00:00, 8.61it/s] 93%|#########3| 28/30 [00:03<00:00, 8.61it/s] 93%|#########3| 28/30 [00:03<00:00, 8.61it/s] 97%|#########6| 29/30 [00:03<00:00, 8.65it/s] 97%|#########6| 29/30 [00:03<00:00, 8.65it/s] 100%|##########| 30/30 [00:03<00:00, 8.73it/s] 100%|##########| 30/30 [00:03<00:00, 8.73it/s] 100%|##########| 30/30 [00:03<00:00, 8.73it/s] 100%|##########| 30/30 [00:03<00:00, 8.73it/s]
- quantizing extras
Moving transformer to CPU
Text Encoder
`torch_dtype` is deprecated! Use `dtype` instead!
`torch_dtype` is deprecated! Use `dtype` instead!
Loading checkpoint shards: 0%| | 0/3 [00:00<?, ?it/s] Loading checkpoint shards: 0%| | 0/3 [00:00<?, ?it/s] Loading checkpoint shards: 67%|######6 | 2/3 [00:00<00:00, 14.49it/s] Loading checkpoint shards: 67%|######6 | 2/3 [00:00<00:00, 14.49it/s] Loading checkpoint shards: 100%|##########| 3/3 [00:00<00:00, 21.38it/s] Loading checkpoint shards: 100%|##########| 3/3 [00:00<00:00, 21.38it/s]
Quantizing Text Encoder
Loading VAE
Making pipe
Preparing Model
Model Loaded
create LoRA network. base dim (rank): 32, alpha: 32
neuron dropout: p=None, rank dropout: p=None, module dropout: p=None
apply LoRA to Conv2d with kernel size (3,3). dim (rank): 16, alpha: 16
create LoRA for Text Encoder: 0 modules.
create LoRA for U-Net: 240 modules.
enable LoRA for U-Net
#### IMPORTANT RESUMING FROM /teamspace/studios/this_studio/ai-toolkit/output/my_first_lora_v6/my_first_lora_v6_000003000.safetensors ####
Loading from /teamspace/studios/this_studio/ai-toolkit/output/my_first_lora_v6/my_first_lora_v6_000003000.safetensors
Missing keys: []
Found step 3000 in metadata, starting from there
Loading optimizer state from /teamspace/studios/this_studio/ai-toolkit/output/my_first_lora_v6/optimizer.pt
Updating optimizer LR from params
Dataset: /teamspace/studios/this_studio/ai-toolkit/datasets/nishani
- Preprocessing image dimensions
0%| | 0/8 [00:00<?, ?it/s] 0%| | 0/8 [00:00<?, ?it/s] 100%|##########| 8/8 [00:00<00:00, 17933.96it/s] 100%|##########| 8/8 [00:00<00:00, 17933.96it/s]
- Found 8 images
Bucket sizes for /teamspace/studios/this_studio/ai-toolkit/datasets/nishani:
704x704: 1 files
832x1152: 4 files
704x1248: 2 files
768x1344: 1 files
4 buckets made
Dataset: /teamspace/studios/this_studio/ai-toolkit/datasets/nishani
- Preprocessing image dimensions
0%| | 0/8 [00:00<?, ?it/s] 0%| | 0/8 [00:00<?, ?it/s] 100%|##########| 8/8 [00:00<00:00, 27391.37it/s] 100%|##########| 8/8 [00:00<00:00, 27391.37it/s]
- Found 8 images
Bucket sizes for /teamspace/studios/this_studio/ai-toolkit/datasets/nishani:
512x512: 1 files
416x576: 4 files
384x672: 3 files
3 buckets made
Dataset: /teamspace/studios/this_studio/ai-toolkit/datasets/nishani
- Preprocessing image dimensions
0%| | 0/8 [00:00<?, ?it/s] 0%| | 0/8 [00:00<?, ?it/s] 100%|##########| 8/8 [00:00<00:00, 32419.74it/s] 100%|##########| 8/8 [00:00<00:00, 32419.74it/s]
- Found 8 images
Bucket sizes for /teamspace/studios/this_studio/ai-toolkit/datasets/nishani:
704x704: 1 files
672x864: 4 files
576x992: 3 files
3 buckets made
Caching embeddings and unloading text encoder
***** UNLOADING TEXT ENCODER *****
This will train only with a blank prompt or trigger word, if set
If this is not what you want, remove the unload_text_encoder flag
***********************************
my_first_lora_v6: 50%|##### | 3000/6000 [00:00<?, ?it/s] my_first_lora_v6: 50%|##### | 3000/6000 [00:00<?, ?it/s] my_first_lora_v6: 50%|##### | 3000/6000 [00:01<?, ?it/s, lr: 1.0e-04 loss: 9.086e-02] my_first_lora_v6: 50%|##### | 3000/6000 [00:01<?, ?it/s, lr: 1.0e-04 loss: 9.086e-02] my_first_lora_v6: 50%|##### | 3000/6000 [00:01<?, ?it/s, lr: 1.0e-04 loss: 9.086e-02] my_first_lora_v6: 50%|##### | 3000/6000 [00:01<?, ?it/s, lr: 1.0e-04 loss: 9.086e-02] my_first_lora_v6: 50%|##### | 3000/6000 [00:03<?, ?it/s, lr: 1.0e-04 loss: 5.214e-01] my_first_lora_v6: 50%|##### | 3000/6000 [00:03<?, ?it/s, lr: 1.0e-04 loss: 5.214e-01] my_first_lora_v6: 50%|##### | 3001/6000 [00:04<3:20:46, 4.02s/it, lr: 1.0e-04 loss: 7.091e-01] my_first_lora_v6: 50%|##### | 3001/6000 [00:04<3:20:46, 4.02s/it, lr: 1.0e-04 loss: 7.091e-01] my_first_lora_v6: 50%|##### | 3002/6000 [00:06<2:42:58, 3.26s/it, lr: 1.0e-04 loss: 1.334e-01] my_first_lora_v6: 50%|##### | 3002/6000 [00:06<2:42:58, 3.26s/it, lr: 1.0e-04 loss: 1.334e-01] my_first_lora_v6: 50%|##### | 3003/6000 [00:07<2:11:00, 2.62s/it, lr: 1.0e-04 loss: 7.609e-01] my_first_lora_v6: 50%|##### | 3003/6000 [00:07<2:11:00, 2.62s/it, lr: 1.0e-04 loss: 7.609e-01] my_first_lora_v6: 50%|##### | 3004/6000 [00:08<1:46:50, 2.14s/it, lr: 1.0e-04 loss: 4.457e-01] my_first_lora_v6: 50%|##### | 3004/6000 [00:08<1:46:50, 2.14s/it, lr: 1.0e-04 loss: 4.457e-01] my_first_lora_v6: 50%|##### | 3005/6000 [00:09<1:32:24, 1.85s/it, lr: 1.0e-04 loss: 5.656e-01] my_first_lora_v6: 50%|##### | 3005/6000 [00:09<1:32:24, 1.85s/it, lr: 1.0e-04 loss: 5.656e-01] my_first_lora_v6: 50%|##### | 3006/6000 [00:11<1:35:19, 1.91s/it, lr: 1.0e-04 loss: 1.383e-01] my_first_lora_v6: 50%|##### | 3006/6000 [00:11<1:35:19, 1.91s/it, lr: 1.0e-04 loss: 1.383e-01] my_first_lora_v6: 50%|##### | 3007/6000 [00:13<1:38:54, 1.98s/it, lr: 1.0e-04 loss: 6.286e-01] my_first_lora_v6: 50%|##### | 3007/6000 [00:13<1:38:54, 1.98s/it, lr: 1.0e-04 loss: 6.286e-01] my_first_lora_v6: 50%|##### | 3008/6000 [00:16<1:41:50, 2.04s/it, lr: 1.0e-04 loss: 2.827e-01] my_first_lora_v6: 50%|##### | 3008/6000 [00:16<1:41:50, 2.04s/it, lr: 1.0e-04 loss: 2.827e-01] my_first_lora_v6: 50%|##### | 3009/6000 [00:17<1:34:25, 1.89s/it, lr: 1.0e-04 loss: 2.918e-01] my_first_lora_v6: 50%|##### | 3009/6000 [00:17<1:34:25, 1.89s/it, lr: 1.0e-04 loss: 2.918e-01] my_first_lora_v6: 50%|##### | 3010/6000 [00:18<1:30:48, 1.82s/it, lr: 1.0e-04 loss: 1.444e-01] my_first_lora_v6: 50%|##### | 3010/6000 [00:18<1:30:48, 1.82s/it, lr: 1.0e-04 loss: 1.444e-01] my_first_lora_v6: 50%|##### | 3011/6000 [00:20<1:32:30, 1.86s/it, lr: 1.0e-04 loss: 5.821e-01] my_first_lora_v6: 50%|##### | 3011/6000 [00:20<1:32:30, 1.86s/it, lr: 1.0e-04 loss: 5.821e-01] my_first_lora_v6: 50%|##### | 3012/6000 [00:21<1:27:45, 1.76s/it, lr: 1.0e-04 loss: 5.028e-01] my_first_lora_v6: 50%|##### | 3012/6000 [00:21<1:27:45, 1.76s/it, lr: 1.0e-04 loss: 5.028e-01] my_first_lora_v6: 50%|##### | 3013/6000 [00:22<1:26:07, 1.73s/it, lr: 1.0e-04 loss: 4.212e-02] my_first_lora_v6: 50%|##### | 3013/6000 [00:22<1:26:07, 1.73s/it, lr: 1.0e-04 loss: 4.212e-02] my_first_lora_v6: 50%|##### | 3014/6000 [00:23<1:23:25, 1.68s/it, lr: 1.0e-04 loss: 3.094e-01] my_first_lora_v6: 50%|##### | 3014/6000 [00:23<1:23:25, 1.68s/it, lr: 1.0e-04 loss: 3.094e-01] my_first_lora_v6: 50%|##### | 3015/6000 [00:24<1:22:13, 1.65s/it, lr: 1.0e-04 loss: 7.712e-01] my_first_lora_v6: 50%|##### | 3015/6000 [00:24<1:22:13, 1.65s/it, lr: 1.0e-04 loss: 7.712e-01] my_first_lora_v6: 50%|##### | 3016/6000 [00:27<1:24:36, 1.70s/it, lr: 1.0e-04 loss: 5.914e-02] my_first_lora_v6: 50%|##### | 3016/6000 [00:27<1:24:36, 1.70s/it, lr: 1.0e-04 loss: 5.914e-02] my_first_lora_v6: 50%|##### | 3017/6000 [00:29<1:27:32, 1.76s/it, lr: 1.0e-04 loss: 5.672e-01] my_first_lora_v6: 50%|##### | 3017/6000 [00:29<1:27:32, 1.76s/it, lr: 1.0e-04 loss: 5.672e-01] my_first_lora_v6: 50%|##### | 3018/6000 [00:31<1:26:20, 1.74s/it, lr: 1.0e-04 loss: 4.198e-01] my_first_lora_v6: 50%|##### | 3018/6000 [00:31<1:26:20, 1.74s/it, lr: 1.0e-04 loss: 4.198e-01] my_first_lora_v6: 50%|##### | 3019/6000 [00:32<1:24:48, 1.71s/it, lr: 1.0e-04 loss: 3.886e-01] my_first_lora_v6: 50%|##### | 3019/6000 [00:32<1:24:48, 1.71s/it, lr: 1.0e-04 loss: 3.886e-01] my_first_lora_v6: 50%|##### | 3020/6000 [00:33<1:23:53, 1.69s/it, lr: 1.0e-04 loss: 7.007e-01] my_first_lora_v6: 50%|##### | 3020/6000 [00:33<1:23:53, 1.69s/it, lr: 1.0e-04 loss: 7.007e-01] my_first_lora_v6: 50%|##### | 3021/6000 [00:34<1:21:32, 1.64s/it, lr: 1.0e-04 loss: 7.860e-01] my_first_lora_v6: 50%|##### | 3021/6000 [00:34<1:21:32, 1.64s/it, lr: 1.0e-04 loss: 7.860e-01] my_first_lora_v6: 50%|##### | 3022/6000 [00:35<1:19:22, 1.60s/it, lr: 1.0e-04 loss: 5.055e-01] my_first_lora_v6: 50%|##### | 3022/6000 [00:35<1:19:22, 1.60s/it, lr: 1.0e-04 loss: 5.055e-01] my_first_lora_v6: 50%|##### | 3023/6000 [00:36<1:17:47, 1.57s/it, lr: 1.0e-04 loss: 6.093e-01] my_first_lora_v6: 50%|##### | 3023/6000 [00:36<1:17:47, 1.57s/it, lr: 1.0e-04 loss: 6.093e-01] my_first_lora_v6: 50%|##### | 3024/6000 [00:37<1:16:56, 1.55s/it, lr: 1.0e-04 loss: 1.140e-01] my_first_lora_v6: 50%|##### | 3024/6000 [00:37<1:16:56, 1.55s/it, lr: 1.0e-04 loss: 1.140e-01] my_first_lora_v6: 50%|##### | 3025/6000 [00:38<1:16:31, 1.54s/it, lr: 1.0e-04 loss: 2.030e-01] my_first_lora_v6: 50%|##### | 3025/6000 [00:38<1:16:31, 1.54s/it, lr: 1.0e-04 loss: 2.030e-01] my_first_lora_v6: 50%|##### | 3026/6000 [00:40<1:17:45, 1.57s/it, lr: 1.0e-04 loss: 7.535e-01] my_first_lora_v6: 50%|##### | 3026/6000 [00:40<1:17:45, 1.57s/it, lr: 1.0e-04 loss: 7.535e-01] my_first_lora_v6: 50%|##### | 3027/6000 [00:41<1:16:03, 1.54s/it, lr: 1.0e-04 loss: 1.899e-01] my_first_lora_v6: 50%|##### | 3027/6000 [00:41<1:16:03, 1.54s/it, lr: 1.0e-04 loss: 1.899e-01] my_first_lora_v6: 50%|##### | 3028/6000 [00:43<1:16:19, 1.54s/it, lr: 1.0e-04 loss: 3.390e-01] my_first_lora_v6: 50%|##### | 3028/6000 [00:43<1:16:19, 1.54s/it, lr: 1.0e-04 loss: 3.390e-01] my_first_lora_v6: 50%|##### | 3029/6000 [00:45<1:17:49, 1.57s/it, lr: 1.0e-04 loss: 2.874e-01] my_first_lora_v6: 50%|##### | 3029/6000 [00:45<1:17:49, 1.57s/it, lr: 1.0e-04 loss: 2.874e-01] my_first_lora_v6: 50%|##### | 3030/6000 [00:46<1:17:08, 1.56s/it, lr: 1.0e-04 loss: 3.428e-01] my_first_lora_v6: 50%|##### | 3030/6000 [00:46<1:17:08, 1.56s/it, lr: 1.0e-04 loss: 3.428e-01] my_first_lora_v6: 51%|##### | 3031/6000 [00:48<1:16:44, 1.55s/it, lr: 1.0e-04 loss: 5.464e-02] my_first_lora_v6: 51%|##### | 3031/6000 [00:48<1:16:44, 1.55s/it, lr: 1.0e-04 loss: 5.464e-02] my_first_lora_v6: 51%|##### | 3032/6000 [00:49<1:16:24, 1.54s/it, lr: 1.0e-04 loss: 7.222e-01] my_first_lora_v6: 51%|##### | 3032/6000 [00:49<1:16:24, 1.54s/it, lr: 1.0e-04 loss: 7.222e-01] my_first_lora_v6: 51%|##### | 3033/6000 [00:50<1:16:03, 1.54s/it, lr: 1.0e-04 loss: 7.569e-01] my_first_lora_v6: 51%|##### | 3033/6000 [00:50<1:16:03, 1.54s/it, lr: 1.0e-04 loss: 7.569e-01] my_first_lora_v6: 51%|##### | 3034/6000 [00:52<1:15:45, 1.53s/it, lr: 1.0e-04 loss: 5.247e-01] my_first_lora_v6: 51%|##### | 3034/6000 [00:52<1:15:45, 1.53s/it, lr: 1.0e-04 loss: 5.247e-01] my_first_lora_v6: 51%|##### | 3035/6000 [00:54<1:16:41, 1.55s/it, lr: 1.0e-04 loss: 2.673e-01] my_first_lora_v6: 51%|##### | 3035/6000 [00:54<1:16:41, 1.55s/it, lr: 1.0e-04 loss: 2.673e-01] my_first_lora_v6: 51%|##### | 3036/6000 [00:54<1:15:28, 1.53s/it, lr: 1.0e-04 loss: 7.033e-01] my_first_lora_v6: 51%|##### | 3036/6000 [00:54<1:15:28, 1.53s/it, lr: 1.0e-04 loss: 7.033e-01] my_first_lora_v6: 51%|##### | 3037/6000 [00:57<1:16:59, 1.56s/it, lr: 1.0e-04 loss: 4.251e-01] my_first_lora_v6: 51%|##### | 3037/6000 [00:57<1:16:59, 1.56s/it, lr: 1.0e-04 loss: 4.251e-01] my_first_lora_v6: 51%|##### | 3038/6000 [00:58<1:15:50, 1.54s/it, lr: 1.0e-04 loss: 1.887e-01] my_first_lora_v6: 51%|##### | 3038/6000 [00:58<1:15:50, 1.54s/it, lr: 1.0e-04 loss: 1.887e-01] my_first_lora_v6: 51%|##### | 3039/6000 [00:59<1:14:40, 1.51s/it, lr: 1.0e-04 loss: 3.833e-01] my_first_lora_v6: 51%|##### | 3039/6000 [00:59<1:14:40, 1.51s/it, lr: 1.0e-04 loss: 3.833e-01] my_first_lora_v6: 51%|##### | 3040/6000 [01:00<1:14:26, 1.51s/it, lr: 1.0e-04 loss: 2.339e-01] my_first_lora_v6: 51%|##### | 3040/6000 [01:00<1:14:26, 1.51s/it, lr: 1.0e-04 loss: 2.339e-01] my_first_lora_v6: 51%|##### | 3041/6000 [01:01<1:13:22, 1.49s/it, lr: 1.0e-04 loss: 5.330e-02] my_first_lora_v6: 51%|##### | 3041/6000 [01:01<1:13:22, 1.49s/it, lr: 1.0e-04 loss: 5.330e-02] my_first_lora_v6: 51%|##### | 3042/6000 [01:03<1:14:40, 1.51s/it, lr: 1.0e-04 loss: 2.748e-01] my_first_lora_v6: 51%|##### | 3042/6000 [01:03<1:14:40, 1.51s/it, lr: 1.0e-04 loss: 2.748e-01] my_first_lora_v6: 51%|##### | 3043/6000 [01:06<1:15:42, 1.54s/it, lr: 1.0e-04 loss: 1.355e-02] my_first_lora_v6: 51%|##### | 3043/6000 [01:06<1:15:42, 1.54s/it, lr: 1.0e-04 loss: 1.355e-02] my_first_lora_v6: 51%|##### | 3044/6000 [01:06<1:14:41, 1.52s/it, lr: 1.0e-04 loss: 7.663e-01] my_first_lora_v6: 51%|##### | 3044/6000 [01:06<1:14:41, 1.52s/it, lr: 1.0e-04 loss: 7.663e-01] my_first_lora_v6: 51%|##### | 3045/6000 [01:07<1:13:45, 1.50s/it, lr: 1.0e-04 loss: 6.233e-01] my_first_lora_v6: 51%|##### | 3045/6000 [01:07<1:13:45, 1.50s/it, lr: 1.0e-04 loss: 6.233e-01] my_first_lora_v6: 51%|##### | 3046/6000 [01:09<1:14:43, 1.52s/it, lr: 1.0e-04 loss: 7.434e-01] my_first_lora_v6: 51%|##### | 3046/6000 [01:09<1:14:43, 1.52s/it, lr: 1.0e-04 loss: 7.434e-01] my_first_lora_v6: 51%|##### | 3047/6000 [01:10<1:14:00, 1.50s/it, lr: 1.0e-04 loss: 1.046e-01] my_first_lora_v6: 51%|##### | 3047/6000 [01:10<1:14:00, 1.50s/it, lr: 1.0e-04 loss: 1.046e-01] my_first_lora_v6: 51%|##### | 3048/6000 [01:12<1:13:49, 1.50s/it, lr: 1.0e-04 loss: 8.476e-02] my_first_lora_v6: 51%|##### | 3048/6000 [01:12<1:13:49, 1.50s/it, lr: 1.0e-04 loss: 8.476e-02] my_first_lora_v6: 51%|##### | 3049/6000 [01:13<1:13:28, 1.49s/it, lr: 1.0e-04 loss: 8.767e-01] my_first_lora_v6: 51%|##### | 3049/6000 [01:13<1:13:28, 1.49s/it, lr: 1.0e-04 loss: 8.767e-01] my_first_lora_v6: 51%|##### | 3050/6000 [01:13<1:12:39, 1.48s/it, lr: 1.0e-04 loss: 2.520e-01] my_first_lora_v6: 51%|##### | 3050/6000 [01:13<1:12:39, 1.48s/it, lr: 1.0e-04 loss: 2.520e-01] my_first_lora_v6: 51%|##### | 3051/6000 [01:16<1:13:20, 1.49s/it, lr: 1.0e-04 loss: 7.468e-01] my_first_lora_v6: 51%|##### | 3051/6000 [01:16<1:13:20, 1.49s/it, lr: 1.0e-04 loss: 7.468e-01] my_first_lora_v6: 51%|##### | 3052/6000 [01:18<1:14:12, 1.51s/it, lr: 1.0e-04 loss: 3.797e-01] my_first_lora_v6: 51%|##### | 3052/6000 [01:18<1:14:12, 1.51s/it, lr: 1.0e-04 loss: 3.797e-01] my_first_lora_v6: 51%|##### | 3053/6000 [01:19<1:14:02, 1.51s/it, lr: 1.0e-04 loss: 1.351e-01] my_first_lora_v6: 51%|##### | 3053/6000 [01:19<1:14:02, 1.51s/it, lr: 1.0e-04 loss: 1.351e-01] my_first_lora_v6: 51%|##### | 3054/6000 [01:20<1:13:16, 1.49s/it, lr: 1.0e-04 loss: 7.555e-01] my_first_lora_v6: 51%|##### | 3054/6000 [01:20<1:13:16, 1.49s/it, lr: 1.0e-04 loss: 7.555e-01] my_first_lora_v6: 51%|##### | 3055/6000 [01:21<1:13:06, 1.49s/it, lr: 1.0e-04 loss: 2.427e-01] my_first_lora_v6: 51%|##### | 3055/6000 [01:21<1:13:06, 1.49s/it, lr: 1.0e-04 loss: 2.427e-01] my_first_lora_v6: 51%|##### | 3056/6000 [01:24<1:13:55, 1.51s/it, lr: 1.0e-04 loss: 5.723e-01] my_first_lora_v6: 51%|##### | 3056/6000 [01:24<1:13:55, 1.51s/it, lr: 1.0e-04 loss: 5.723e-01] my_first_lora_v6: 51%|##### | 3057/6000 [01:26<1:14:01, 1.51s/it, lr: 1.0e-04 loss: 3.730e-01] my_first_lora_v6: 51%|##### | 3057/6000 [01:26<1:14:01, 1.51s/it, lr: 1.0e-04 loss: 3.730e-01] my_first_lora_v6: 51%|##### | 3058/6000 [01:26<1:13:18, 1.50s/it, lr: 1.0e-04 loss: 7.450e-01] my_first_lora_v6: 51%|##### | 3058/6000 [01:26<1:13:18, 1.50s/it, lr: 1.0e-04 loss: 7.450e-01] my_first_lora_v6: 51%|##### | 3059/6000 [01:27<1:13:00, 1.49s/it, lr: 1.0e-04 loss: 9.711e-02] my_first_lora_v6: 51%|##### | 3059/6000 [01:27<1:13:00, 1.49s/it, lr: 1.0e-04 loss: 9.711e-02] my_first_lora_v6: 51%|#####1 | 3060/6000 [01:29<1:12:51, 1.49s/it, lr: 1.0e-04 loss: 6.901e-01] my_first_lora_v6: 51%|#####1 | 3060/6000 [01:29<1:12:51, 1.49s/it, lr: 1.0e-04 loss: 6.901e-01] my_first_lora_v6: 51%|#####1 | 3061/6000 [01:31<1:13:24, 1.50s/it, lr: 1.0e-04 loss: 6.424e-01] my_first_lora_v6: 51%|#####1 | 3061/6000 [01:31<1:13:24, 1.50s/it, lr: 1.0e-04 loss: 6.424e-01] my_first_lora_v6: 51%|#####1 | 3062/6000 [01:32<1:13:15, 1.50s/it, lr: 1.0e-04 loss: 3.945e-01] my_first_lora_v6: 51%|#####1 | 3062/6000 [01:32<1:13:15, 1.50s/it, lr: 1.0e-04 loss: 3.945e-01] my_first_lora_v6: 51%|#####1 | 3063/6000 [01:35<1:13:58, 1.51s/it, lr: 1.0e-04 loss: 2.592e-01] my_first_lora_v6: 51%|#####1 | 3063/6000 [01:35<1:13:58, 1.51s/it, lr: 1.0e-04 loss: 2.592e-01] my_first_lora_v6: 51%|#####1 | 3064/6000 [01:37<1:14:52, 1.53s/it, lr: 1.0e-04 loss: 2.465e-01] my_first_lora_v6: 51%|#####1 | 3064/6000 [01:37<1:14:52, 1.53s/it, lr: 1.0e-04 loss: 2.465e-01] my_first_lora_v6: 51%|#####1 | 3065/6000 [01:40<1:15:32, 1.54s/it, lr: 1.0e-04 loss: 7.540e-01] my_first_lora_v6: 51%|#####1 | 3065/6000 [01:40<1:15:32, 1.54s/it, lr: 1.0e-04 loss: 7.540e-01] my_first_lora_v6: 51%|#####1 | 3066/6000 [01:41<1:14:53, 1.53s/it, lr: 1.0e-04 loss: 2.915e-01] my_first_lora_v6: 51%|#####1 | 3066/6000 [01:41<1:14:53, 1.53s/it, lr: 1.0e-04 loss: 2.915e-01] my_first_lora_v6: 51%|#####1 | 3067/6000 [01:41<1:14:14, 1.52s/it, lr: 1.0e-04 loss: 2.673e-01] my_first_lora_v6: 51%|#####1 | 3067/6000 [01:41<1:14:14, 1.52s/it, lr: 1.0e-04 loss: 2.673e-01] my_first_lora_v6: 51%|#####1 | 3068/6000 [01:43<1:14:05, 1.52s/it, lr: 1.0e-04 loss: 7.935e-01] my_first_lora_v6: 51%|#####1 | 3068/6000 [01:43<1:14:05, 1.52s/it, lr: 1.0e-04 loss: 7.935e-01] my_first_lora_v6: 51%|#####1 | 3069/6000 [01:43<1:13:28, 1.50s/it, lr: 1.0e-04 loss: 6.465e-01] my_first_lora_v6: 51%|#####1 | 3069/6000 [01:43<1:13:28, 1.50s/it, lr: 1.0e-04 loss: 6.465e-01] my_first_lora_v6: 51%|#####1 | 3070/6000 [01:44<1:12:55, 1.49s/it, lr: 1.0e-04 loss: 3.587e-01] my_first_lora_v6: 51%|#####1 | 3070/6000 [01:44<1:12:55, 1.49s/it, lr: 1.0e-04 loss: 3.587e-01] my_first_lora_v6: 51%|#####1 | 3071/6000 [01:46<1:12:56, 1.49s/it, lr: 1.0e-04 loss: 2.830e-01] my_first_lora_v6: 51%|#####1 | 3071/6000 [01:46<1:12:56, 1.49s/it, lr: 1.0e-04 loss: 2.830e-01] my_first_lora_v6: 51%|#####1 | 3072/6000 [01:47<1:12:36, 1.49s/it, lr: 1.0e-04 loss: 4.459e-01] my_first_lora_v6: 51%|#####1 | 3072/6000 [01:47<1:12:36, 1.49s/it, lr: 1.0e-04 loss: 4.459e-01] my_first_lora_v6: 51%|#####1 | 3073/6000 [01:47<1:12:02, 1.48s/it, lr: 1.0e-04 loss: 7.747e-01] my_first_lora_v6: 51%|#####1 | 3073/6000 [01:47<1:12:02, 1.48s/it, lr: 1.0e-04 loss: 7.747e-01] my_first_lora_v6: 51%|#####1 | 3074/6000 [01:50<1:12:39, 1.49s/it, lr: 1.0e-04 loss: 4.419e-01] my_first_lora_v6: 51%|#####1 | 3074/6000 [01:50<1:12:39, 1.49s/it, lr: 1.0e-04 loss: 4.419e-01] my_first_lora_v6: 51%|#####1 | 3075/6000 [01:50<1:12:06, 1.48s/it, lr: 1.0e-04 loss: 7.500e-01] my_first_lora_v6: 51%|#####1 | 3075/6000 [01:50<1:12:06, 1.48s/it, lr: 1.0e-04 loss: 7.500e-01] my_first_lora_v6: 51%|#####1 | 3076/6000 [01:52<1:12:00, 1.48s/it, lr: 1.0e-04 loss: 4.891e-01] my_first_lora_v6: 51%|#####1 | 3076/6000 [01:52<1:12:00, 1.48s/it, lr: 1.0e-04 loss: 4.891e-01] my_first_lora_v6: 51%|#####1 | 3077/6000 [01:54<1:12:26, 1.49s/it, lr: 1.0e-04 loss: 7.532e-01] my_first_lora_v6: 51%|#####1 | 3077/6000 [01:54<1:12:26, 1.49s/it, lr: 1.0e-04 loss: 7.532e-01] my_first_lora_v6: 51%|#####1 | 3078/6000 [01:56<1:12:52, 1.50s/it, lr: 1.0e-04 loss: 1.967e-01] my_first_lora_v6: 51%|#####1 | 3078/6000 [01:56<1:12:52, 1.50s/it, lr: 1.0e-04 loss: 1.967e-01] my_first_lora_v6: 51%|#####1 | 3079/6000 [01:58<1:12:45, 1.49s/it, lr: 1.0e-04 loss: 3.271e-01] my_first_lora_v6: 51%|#####1 | 3079/6000 [01:58<1:12:45, 1.49s/it, lr: 1.0e-04 loss: 3.271e-01] my_first_lora_v6: 51%|#####1 | 3080/6000 [02:00<1:13:18, 1.51s/it, lr: 1.0e-04 loss: 3.478e-01] my_first_lora_v6: 51%|#####1 | 3080/6000 [02:00<1:13:18, 1.51s/it, lr: 1.0e-04 loss: 3.478e-01] my_first_lora_v6: 51%|#####1 | 3081/6000 [02:01<1:12:46, 1.50s/it, lr: 1.0e-04 loss: 4.888e-01] my_first_lora_v6: 51%|#####1 | 3081/6000 [02:01<1:12:46, 1.50s/it, lr: 1.0e-04 loss: 4.888e-01] my_first_lora_v6: 51%|#####1 | 3082/6000 [02:02<1:12:39, 1.49s/it, lr: 1.0e-04 loss: 1.389e-01] my_first_lora_v6: 51%|#####1 | 3082/6000 [02:02<1:12:39, 1.49s/it, lr: 1.0e-04 loss: 1.389e-01] my_first_lora_v6: 51%|#####1 | 3083/6000 [02:05<1:13:20, 1.51s/it, lr: 1.0e-04 loss: 5.759e-01] my_first_lora_v6: 51%|#####1 | 3083/6000 [02:05<1:13:20, 1.51s/it, lr: 1.0e-04 loss: 5.759e-01] my_first_lora_v6: 51%|#####1 | 3084/6000 [02:06<1:13:13, 1.51s/it, lr: 1.0e-04 loss: 2.403e-01] my_first_lora_v6: 51%|#####1 | 3084/6000 [02:06<1:13:13, 1.51s/it, lr: 1.0e-04 loss: 2.403e-01] my_first_lora_v6: 51%|#####1 | 3085/6000 [02:07<1:12:43, 1.50s/it, lr: 1.0e-04 loss: 6.756e-01] my_first_lora_v6: 51%|#####1 | 3085/6000 [02:07<1:12:43, 1.50s/it, lr: 1.0e-04 loss: 6.756e-01] my_first_lora_v6: 51%|#####1 | 3086/6000 [02:08<1:12:23, 1.49s/it, lr: 1.0e-04 loss: 7.614e-01] my_first_lora_v6: 51%|#####1 | 3086/6000 [02:08<1:12:23, 1.49s/it, lr: 1.0e-04 loss: 7.614e-01] my_first_lora_v6: 51%|#####1 | 3087/6000 [02:10<1:12:53, 1.50s/it, lr: 1.0e-04 loss: 6.851e-01] my_first_lora_v6: 51%|#####1 | 3087/6000 [02:10<1:12:53, 1.50s/it, lr: 1.0e-04 loss: 6.851e-01] my_first_lora_v6: 51%|#####1 | 3088/6000 [02:11<1:12:41, 1.50s/it, lr: 1.0e-04 loss: 6.645e-01] my_first_lora_v6: 51%|#####1 | 3088/6000 [02:11<1:12:41, 1.50s/it, lr: 1.0e-04 loss: 6.645e-01] my_first_lora_v6: 51%|#####1 | 3089/6000 [02:12<1:12:13, 1.49s/it, lr: 1.0e-04 loss: 5.665e-02] my_first_lora_v6: 51%|#####1 | 3089/6000 [02:12<1:12:13, 1.49s/it, lr: 1.0e-04 loss: 5.665e-02] my_first_lora_v6: 52%|#####1 | 3090/6000 [02:14<1:12:42, 1.50s/it, lr: 1.0e-04 loss: 2.953e-01] my_first_lora_v6: 52%|#####1 | 3090/6000 [02:14<1:12:42, 1.50s/it, lr: 1.0e-04 loss: 2.953e-01] my_first_lora_v6: 52%|#####1 | 3091/6000 [02:16<1:12:36, 1.50s/it, lr: 1.0e-04 loss: 5.896e-01] my_first_lora_v6: 52%|#####1 | 3091/6000 [02:16<1:12:36, 1.50s/it, lr: 1.0e-04 loss: 5.896e-01] my_first_lora_v6: 52%|#####1 | 3092/6000 [02:17<1:12:25, 1.49s/it, lr: 1.0e-04 loss: 8.579e-01] my_first_lora_v6: 52%|#####1 | 3092/6000 [02:17<1:12:25, 1.49s/it, lr: 1.0e-04 loss: 8.579e-01] my_first_lora_v6: 52%|#####1 | 3093/6000 [02:18<1:12:19, 1.49s/it, lr: 1.0e-04 loss: 2.377e-01] my_first_lora_v6: 52%|#####1 | 3093/6000 [02:18<1:12:19, 1.49s/it, lr: 1.0e-04 loss: 2.377e-01] my_first_lora_v6: 52%|#####1 | 3094/6000 [02:19<1:11:53, 1.48s/it, lr: 1.0e-04 loss: 8.287e-01] my_first_lora_v6: 52%|#####1 | 3094/6000 [02:19<1:11:53, 1.48s/it, lr: 1.0e-04 loss: 8.287e-01] my_first_lora_v6: 52%|#####1 | 3095/6000 [02:20<1:11:32, 1.48s/it, lr: 1.0e-04 loss: 5.377e-01] my_first_lora_v6: 52%|#####1 | 3095/6000 [02:20<1:11:32, 1.48s/it, lr: 1.0e-04 loss: 5.377e-01] my_first_lora_v6: 52%|#####1 | 3096/6000 [02:21<1:11:07, 1.47s/it, lr: 1.0e-04 loss: 5.436e-01] my_first_lora_v6: 52%|#####1 | 3096/6000 [02:21<1:11:07, 1.47s/it, lr: 1.0e-04 loss: 5.436e-01] my_first_lora_v6: 52%|#####1 | 3097/6000 [02:21<1:10:41, 1.46s/it, lr: 1.0e-04 loss: 7.326e-01] my_first_lora_v6: 52%|#####1 | 3097/6000 [02:21<1:10:41, 1.46s/it, lr: 1.0e-04 loss: 7.326e-01] my_first_lora_v6: 52%|#####1 | 3098/6000 [02:22<1:10:17, 1.45s/it, lr: 1.0e-04 loss: 3.737e-01] my_first_lora_v6: 52%|#####1 | 3098/6000 [02:22<1:10:17, 1.45s/it, lr: 1.0e-04 loss: 3.737e-01] my_first_lora_v6: 52%|#####1 | 3099/6000 [02:23<1:10:13, 1.45s/it, lr: 1.0e-04 loss: 1.667e-01] my_first_lora_v6: 52%|#####1 | 3099/6000 [02:23<1:10:13, 1.45s/it, lr: 1.0e-04 loss: 1.667e-01] my_first_lora_v6: 52%|#####1 | 3100/6000 [02:26<1:10:35, 1.46s/it, lr: 1.0e-04 loss: 2.562e-01] my_first_lora_v6: 52%|#####1 | 3100/6000 [02:26<1:10:35, 1.46s/it, lr: 1.0e-04 loss: 2.562e-01] my_first_lora_v6: 52%|#####1 | 3101/6000 [02:27<1:10:35, 1.46s/it, lr: 1.0e-04 loss: 4.136e-01] my_first_lora_v6: 52%|#####1 | 3101/6000 [02:27<1:10:35, 1.46s/it, lr: 1.0e-04 loss: 4.136e-01] my_first_lora_v6: 52%|#####1 | 3102/6000 [02:28<1:10:30, 1.46s/it, lr: 1.0e-04 loss: 4.972e-01] my_first_lora_v6: 52%|#####1 | 3102/6000 [02:28<1:10:30, 1.46s/it, lr: 1.0e-04 loss: 4.972e-01] my_first_lora_v6: 52%|#####1 | 3103/6000 [02:29<1:10:07, 1.45s/it, lr: 1.0e-04 loss: 5.136e-01] my_first_lora_v6: 52%|#####1 | 3103/6000 [02:29<1:10:07, 1.45s/it, lr: 1.0e-04 loss: 5.136e-01] my_first_lora_v6: 52%|#####1 | 3104/6000 [02:30<1:09:45, 1.45s/it, lr: 1.0e-04 loss: 1.706e-02] my_first_lora_v6: 52%|#####1 | 3104/6000 [02:30<1:09:45, 1.45s/it, lr: 1.0e-04 loss: 1.706e-02] my_first_lora_v6: 52%|#####1 | 3105/6000 [02:32<1:10:04, 1.45s/it, lr: 1.0e-04 loss: 7.526e-01] my_first_lora_v6: 52%|#####1 | 3105/6000 [02:32<1:10:04, 1.45s/it, lr: 1.0e-04 loss: 7.526e-01] my_first_lora_v6: 52%|#####1 | 3106/6000 [02:33<1:10:00, 1.45s/it, lr: 1.0e-04 loss: 1.265e-01] my_first_lora_v6: 52%|#####1 | 3106/6000 [02:33<1:10:00, 1.45s/it, lr: 1.0e-04 loss: 1.265e-01] my_first_lora_v6: 52%|#####1 | 3107/6000 [02:36<1:10:26, 1.46s/it, lr: 1.0e-04 loss: 2.181e-01] my_first_lora_v6: 52%|#####1 | 3107/6000 [02:36<1:10:26, 1.46s/it, lr: 1.0e-04 loss: 2.181e-01] my_first_lora_v6: 52%|#####1 | 3108/6000 [02:37<1:10:21, 1.46s/it, lr: 1.0e-04 loss: 2.118e-01] my_first_lora_v6: 52%|#####1 | 3108/6000 [02:37<1:10:21, 1.46s/it, lr: 1.0e-04 loss: 2.118e-01] my_first_lora_v6: 52%|#####1 | 3109/6000 [02:40<1:10:53, 1.47s/it, lr: 1.0e-04 loss: 5.634e-01] my_first_lora_v6: 52%|#####1 | 3109/6000 [02:40<1:10:53, 1.47s/it, lr: 1.0e-04 loss: 5.634e-01] my_first_lora_v6: 52%|#####1 | 3110/6000 [02:42<1:11:17, 1.48s/it, lr: 1.0e-04 loss: 4.126e-01] my_first_lora_v6: 52%|#####1 | 3110/6000 [02:42<1:11:17, 1.48s/it, lr: 1.0e-04 loss: 4.126e-01] my_first_lora_v6: 52%|#####1 | 3111/6000 [02:43<1:10:55, 1.47s/it, lr: 1.0e-04 loss: 5.049e-01] my_first_lora_v6: 52%|#####1 | 3111/6000 [02:43<1:10:55, 1.47s/it, lr: 1.0e-04 loss: 5.049e-01] my_first_lora_v6: 52%|#####1 | 3112/6000 [02:44<1:10:46, 1.47s/it, lr: 1.0e-04 loss: 6.292e-01] my_first_lora_v6: 52%|#####1 | 3112/6000 [02:44<1:10:46, 1.47s/it, lr: 1.0e-04 loss: 6.292e-01] my_first_lora_v6: 52%|#####1 | 3113/6000 [02:47<1:11:10, 1.48s/it, lr: 1.0e-04 loss: 6.581e-01] my_first_lora_v6: 52%|#####1 | 3113/6000 [02:47<1:11:10, 1.48s/it, lr: 1.0e-04 loss: 6.581e-01] my_first_lora_v6: 52%|#####1 | 3114/6000 [02:47<1:10:49, 1.47s/it, lr: 1.0e-04 loss: 7.891e-01] my_first_lora_v6: 52%|#####1 | 3114/6000 [02:47<1:10:49, 1.47s/it, lr: 1.0e-04 loss: 7.891e-01] my_first_lora_v6: 52%|#####1 | 3115/6000 [02:49<1:10:51, 1.47s/it, lr: 1.0e-04 loss: 3.833e-01] my_first_lora_v6: 52%|#####1 | 3115/6000 [02:49<1:10:51, 1.47s/it, lr: 1.0e-04 loss: 3.833e-01] my_first_lora_v6: 52%|#####1 | 3116/6000 [02:51<1:11:14, 1.48s/it, lr: 1.0e-04 loss: 4.443e-01] my_first_lora_v6: 52%|#####1 | 3116/6000 [02:51<1:11:14, 1.48s/it, lr: 1.0e-04 loss: 4.443e-01] my_first_lora_v6: 52%|#####1 | 3117/6000 [02:53<1:11:10, 1.48s/it, lr: 1.0e-04 loss: 7.175e-01] my_first_lora_v6: 52%|#####1 | 3117/6000 [02:53<1:11:10, 1.48s/it, lr: 1.0e-04 loss: 7.175e-01] my_first_lora_v6: 52%|#####1 | 3118/6000 [02:54<1:11:05, 1.48s/it, lr: 1.0e-04 loss: 4.013e-01] my_first_lora_v6: 52%|#####1 | 3118/6000 [02:54<1:11:05, 1.48s/it, lr: 1.0e-04 loss: 4.013e-01] my_first_lora_v6: 52%|#####1 | 3119/6000 [02:55<1:10:50, 1.48s/it, lr: 1.0e-04 loss: 7.607e-01] my_first_lora_v6: 52%|#####1 | 3119/6000 [02:55<1:10:50, 1.48s/it, lr: 1.0e-04 loss: 7.607e-01] my_first_lora_v6: 52%|#####2 | 3120/6000 [02:56<1:10:41, 1.47s/it, lr: 1.0e-04 loss: 7.118e-01] my_first_lora_v6: 52%|#####2 | 3120/6000 [02:56<1:10:41, 1.47s/it, lr: 1.0e-04 loss: 7.118e-01] my_first_lora_v6: 52%|#####2 | 3121/6000 [02:58<1:10:58, 1.48s/it, lr: 1.0e-04 loss: 7.497e-01] my_first_lora_v6: 52%|#####2 | 3121/6000 [02:58<1:10:58, 1.48s/it, lr: 1.0e-04 loss: 7.497e-01] my_first_lora_v6: 52%|#####2 | 3122/6000 [03:00<1:10:54, 1.48s/it, lr: 1.0e-04 loss: 4.722e-01] my_first_lora_v6: 52%|#####2 | 3122/6000 [03:00<1:10:54, 1.48s/it, lr: 1.0e-04 loss: 4.722e-01] my_first_lora_v6: 52%|#####2 | 3123/6000 [03:01<1:10:50, 1.48s/it, lr: 1.0e-04 loss: 3.058e-01] my_first_lora_v6: 52%|#####2 | 3123/6000 [03:01<1:10:50, 1.48s/it, lr: 1.0e-04 loss: 3.058e-01] my_first_lora_v6: 52%|#####2 | 3124/6000 [03:03<1:10:47, 1.48s/it, lr: 1.0e-04 loss: 1.574e-02] my_first_lora_v6: 52%|#####2 | 3124/6000 [03:03<1:10:47, 1.48s/it, lr: 1.0e-04 loss: 1.574e-02] my_first_lora_v6: 52%|#####2 | 3125/6000 [03:03<1:10:28, 1.47s/it, lr: 1.0e-04 loss: 8.139e-01] my_first_lora_v6: 52%|#####2 | 3125/6000 [03:03<1:10:28, 1.47s/it, lr: 1.0e-04 loss: 8.139e-01] my_first_lora_v6: 52%|#####2 | 3126/6000 [03:05<1:10:23, 1.47s/it, lr: 1.0e-04 loss: 5.810e-01] my_first_lora_v6: 52%|#####2 | 3126/6000 [03:05<1:10:23, 1.47s/it, lr: 1.0e-04 loss: 5.810e-01] my_first_lora_v6: 52%|#####2 | 3127/6000 [03:07<1:10:45, 1.48s/it, lr: 1.0e-04 loss: 1.245e-01] my_first_lora_v6: 52%|#####2 | 3127/6000 [03:07<1:10:45, 1.48s/it, lr: 1.0e-04 loss: 1.245e-01] my_first_lora_v6: 52%|#####2 | 3128/6000 [03:10<1:11:06, 1.49s/it, lr: 1.0e-04 loss: 5.291e-01] my_first_lora_v6: 52%|#####2 | 3128/6000 [03:10<1:11:06, 1.49s/it, lr: 1.0e-04 loss: 5.291e-01] my_first_lora_v6: 52%|#####2 | 3129/6000 [03:12<1:11:33, 1.50s/it, lr: 1.0e-04 loss: 3.150e-01] my_first_lora_v6: 52%|#####2 | 3129/6000 [03:12<1:11:33, 1.50s/it, lr: 1.0e-04 loss: 3.150e-01] my_first_lora_v6: 52%|#####2 | 3130/6000 [03:15<1:11:48, 1.50s/it, lr: 1.0e-04 loss: 7.679e-01] my_first_lora_v6: 52%|#####2 | 3130/6000 [03:15<1:11:48, 1.50s/it, lr: 1.0e-04 loss: 7.679e-01] my_first_lora_v6: 52%|#####2 | 3131/6000 [03:16<1:11:44, 1.50s/it, lr: 1.0e-04 loss: 3.402e-01] my_first_lora_v6: 52%|#####2 | 3131/6000 [03:16<1:11:44, 1.50s/it, lr: 1.0e-04 loss: 3.402e-01] my_first_lora_v6: 52%|#####2 | 3132/6000 [03:17<1:11:24, 1.49s/it, lr: 1.0e-04 loss: 3.651e-01] my_first_lora_v6: 52%|#####2 | 3132/6000 [03:17<1:11:24, 1.49s/it, lr: 1.0e-04 loss: 3.651e-01] my_first_lora_v6: 52%|#####2 | 3133/6000 [03:17<1:11:06, 1.49s/it, lr: 1.0e-04 loss: 1.619e-01] my_first_lora_v6: 52%|#####2 | 3133/6000 [03:17<1:11:06, 1.49s/it, lr: 1.0e-04 loss: 1.619e-01] my_first_lora_v6: 52%|#####2 | 3134/6000 [03:18<1:10:47, 1.48s/it, lr: 1.0e-04 loss: 6.640e-01] my_first_lora_v6: 52%|#####2 | 3134/6000 [03:18<1:10:47, 1.48s/it, lr: 1.0e-04 loss: 6.640e-01] my_first_lora_v6: 52%|#####2 | 3135/6000 [03:19<1:10:39, 1.48s/it, lr: 1.0e-04 loss: 7.204e-01] my_first_lora_v6: 52%|#####2 | 3135/6000 [03:19<1:10:39, 1.48s/it, lr: 1.0e-04 loss: 7.204e-01] my_first_lora_v6: 52%|#####2 | 3136/6000 [03:22<1:11:04, 1.49s/it, lr: 1.0e-04 loss: 4.649e-01] my_first_lora_v6: 52%|#####2 | 3136/6000 [03:22<1:11:04, 1.49s/it, lr: 1.0e-04 loss: 4.649e-01] my_first_lora_v6: 52%|#####2 | 3137/6000 [03:23<1:10:59, 1.49s/it, lr: 1.0e-04 loss: 3.826e-01] my_first_lora_v6: 52%|#####2 | 3137/6000 [03:23<1:10:59, 1.49s/it, lr: 1.0e-04 loss: 3.826e-01] my_first_lora_v6: 52%|#####2 | 3138/6000 [03:24<1:10:41, 1.48s/it, lr: 1.0e-04 loss: 4.785e-01] my_first_lora_v6: 52%|#####2 | 3138/6000 [03:24<1:10:41, 1.48s/it, lr: 1.0e-04 loss: 4.785e-01] my_first_lora_v6: 52%|#####2 | 3139/6000 [03:25<1:10:37, 1.48s/it, lr: 1.0e-04 loss: 1.514e-01] my_first_lora_v6: 52%|#####2 | 3139/6000 [03:25<1:10:37, 1.48s/it, lr: 1.0e-04 loss: 1.514e-01] my_first_lora_v6: 52%|#####2 | 3140/6000 [03:28<1:10:56, 1.49s/it, lr: 1.0e-04 loss: 7.521e-01] my_first_lora_v6: 52%|#####2 | 3140/6000 [03:28<1:10:56, 1.49s/it, lr: 1.0e-04 loss: 7.521e-01] my_first_lora_v6: 52%|#####2 | 3141/6000 [03:29<1:10:38, 1.48s/it, lr: 1.0e-04 loss: 7.788e-01] my_first_lora_v6: 52%|#####2 | 3141/6000 [03:29<1:10:38, 1.48s/it, lr: 1.0e-04 loss: 7.788e-01] my_first_lora_v6: 52%|#####2 | 3142/6000 [03:29<1:10:20, 1.48s/it, lr: 1.0e-04 loss: 5.849e-01] my_first_lora_v6: 52%|#####2 | 3142/6000 [03:29<1:10:20, 1.48s/it, lr: 1.0e-04 loss: 5.849e-01] my_first_lora_v6: 52%|#####2 | 3143/6000 [03:32<1:10:42, 1.49s/it, lr: 1.0e-04 loss: 2.606e-01] my_first_lora_v6: 52%|#####2 | 3143/6000 [03:32<1:10:42, 1.49s/it, lr: 1.0e-04 loss: 2.606e-01] my_first_lora_v6: 52%|#####2 | 3144/6000 [03:33<1:10:38, 1.48s/it, lr: 1.0e-04 loss: 4.658e-01] my_first_lora_v6: 52%|#####2 | 3144/6000 [03:33<1:10:38, 1.48s/it, lr: 1.0e-04 loss: 4.658e-01] my_first_lora_v6: 52%|#####2 | 3145/6000 [03:35<1:10:34, 1.48s/it, lr: 1.0e-04 loss: 4.137e-01] my_first_lora_v6: 52%|#####2 | 3145/6000 [03:35<1:10:34, 1.48s/it, lr: 1.0e-04 loss: 4.137e-01] my_first_lora_v6: 52%|#####2 | 3146/6000 [03:36<1:10:26, 1.48s/it, lr: 1.0e-04 loss: 5.707e-01] my_first_lora_v6: 52%|#####2 | 3146/6000 [03:36<1:10:26, 1.48s/it, lr: 1.0e-04 loss: 5.707e-01] my_first_lora_v6: 52%|#####2 | 3147/6000 [03:37<1:10:22, 1.48s/it, lr: 1.0e-04 loss: 3.239e-01] my_first_lora_v6: 52%|#####2 | 3147/6000 [03:37<1:10:22, 1.48s/it, lr: 1.0e-04 loss: 3.239e-01] my_first_lora_v6: 52%|#####2 | 3148/6000 [03:38<1:10:06, 1.47s/it, lr: 1.0e-04 loss: 7.598e-01] my_first_lora_v6: 52%|#####2 | 3148/6000 [03:38<1:10:06, 1.47s/it, lr: 1.0e-04 loss: 7.598e-01] my_first_lora_v6: 52%|#####2 | 3149/6000 [03:38<1:09:50, 1.47s/it, lr: 1.0e-04 loss: 6.489e-01] my_first_lora_v6: 52%|#####2 | 3149/6000 [03:38<1:09:50, 1.47s/it, lr: 1.0e-04 loss: 6.489e-01] my_first_lora_v6: 52%|#####2 | 3150/6000 [03:39<1:09:34, 1.46s/it, lr: 1.0e-04 loss: 4.545e-01] my_first_lora_v6: 52%|#####2 | 3150/6000 [03:39<1:09:34, 1.46s/it, lr: 1.0e-04 loss: 4.545e-01] my_first_lora_v6: 53%|#####2 | 3151/6000 [03:40<1:09:18, 1.46s/it, lr: 1.0e-04 loss: 7.511e-01] my_first_lora_v6: 53%|#####2 | 3151/6000 [03:40<1:09:18, 1.46s/it, lr: 1.0e-04 loss: 7.511e-01] my_first_lora_v6: 53%|#####2 | 3152/6000 [03:43<1:09:40, 1.47s/it, lr: 1.0e-04 loss: 6.104e-01] my_first_lora_v6: 53%|#####2 | 3152/6000 [03:43<1:09:40, 1.47s/it, lr: 1.0e-04 loss: 6.104e-01] my_first_lora_v6: 53%|#####2 | 3153/6000 [03:44<1:09:36, 1.47s/it, lr: 1.0e-04 loss: 6.242e-01] my_first_lora_v6: 53%|#####2 | 3153/6000 [03:44<1:09:36, 1.47s/it, lr: 1.0e-04 loss: 6.242e-01] my_first_lora_v6: 53%|#####2 | 3154/6000 [03:45<1:09:30, 1.47s/it, lr: 1.0e-04 loss: 8.491e-01] my_first_lora_v6: 53%|#####2 | 3154/6000 [03:45<1:09:30, 1.47s/it, lr: 1.0e-04 loss: 8.491e-01] my_first_lora_v6: 53%|#####2 | 3155/6000 [03:48<1:09:47, 1.47s/it, lr: 1.0e-04 loss: 2.281e-01] my_first_lora_v6: 53%|#####2 | 3155/6000 [03:48<1:09:47, 1.47s/it, lr: 1.0e-04 loss: 2.281e-01] my_first_lora_v6: 53%|#####2 | 3156/6000 [03:49<1:09:43, 1.47s/it, lr: 1.0e-04 loss: 5.376e-01] my_first_lora_v6: 53%|#####2 | 3156/6000 [03:49<1:09:43, 1.47s/it, lr: 1.0e-04 loss: 5.376e-01] my_first_lora_v6: 53%|#####2 | 3157/6000 [03:51<1:09:55, 1.48s/it, lr: 1.0e-04 loss: 7.118e-02] my_first_lora_v6: 53%|#####2 | 3157/6000 [03:51<1:09:55, 1.48s/it, lr: 1.0e-04 loss: 7.118e-02] my_first_lora_v6: 53%|#####2 | 3158/6000 [03:54<1:10:14, 1.48s/it, lr: 1.0e-04 loss: 6.885e-01] my_first_lora_v6: 53%|#####2 | 3158/6000 [03:54<1:10:14, 1.48s/it, lr: 1.0e-04 loss: 6.885e-01] my_first_lora_v6: 53%|#####2 | 3159/6000 [03:55<1:10:10, 1.48s/it, lr: 1.0e-04 loss: 5.152e-01] my_first_lora_v6: 53%|#####2 | 3159/6000 [03:55<1:10:10, 1.48s/it, lr: 1.0e-04 loss: 5.152e-01] my_first_lora_v6: 53%|#####2 | 3160/6000 [03:56<1:09:54, 1.48s/it, lr: 1.0e-04 loss: 4.234e-01] my_first_lora_v6: 53%|#####2 | 3160/6000 [03:56<1:09:54, 1.48s/it, lr: 1.0e-04 loss: 4.234e-01] my_first_lora_v6: 53%|#####2 | 3161/6000 [03:58<1:10:10, 1.48s/it, lr: 1.0e-04 loss: 2.625e-01] my_first_lora_v6: 53%|#####2 | 3161/6000 [03:58<1:10:10, 1.48s/it, lr: 1.0e-04 loss: 2.625e-01] my_first_lora_v6: 53%|#####2 | 3162/6000 [04:00<1:10:06, 1.48s/it, lr: 1.0e-04 loss: 3.299e-01] my_first_lora_v6: 53%|#####2 | 3162/6000 [04:00<1:10:06, 1.48s/it, lr: 1.0e-04 loss: 3.299e-01] my_first_lora_v6: 53%|#####2 | 3163/6000 [04:02<1:10:22, 1.49s/it, lr: 1.0e-04 loss: 3.242e-01] my_first_lora_v6: 53%|#####2 | 3163/6000 [04:02<1:10:22, 1.49s/it, lr: 1.0e-04 loss: 3.242e-01] my_first_lora_v6: 53%|#####2 | 3164/6000 [04:03<1:10:07, 1.48s/it, lr: 1.0e-04 loss: 7.717e-01] my_first_lora_v6: 53%|#####2 | 3164/6000 [04:03<1:10:07, 1.48s/it, lr: 1.0e-04 loss: 7.717e-01] my_first_lora_v6: 53%|#####2 | 3165/6000 [04:03<1:09:52, 1.48s/it, lr: 1.0e-04 loss: 5.707e-01] my_first_lora_v6: 53%|#####2 | 3165/6000 [04:03<1:09:52, 1.48s/it, lr: 1.0e-04 loss: 5.707e-01] my_first_lora_v6: 53%|#####2 | 3166/6000 [04:04<1:09:36, 1.47s/it, lr: 1.0e-04 loss: 7.031e-01] my_first_lora_v6: 53%|#####2 | 3166/6000 [04:04<1:09:36, 1.47s/it, lr: 1.0e-04 loss: 7.031e-01] my_first_lora_v6: 53%|#####2 | 3167/6000 [04:05<1:09:25, 1.47s/it, lr: 1.0e-04 loss: 6.947e-01] my_first_lora_v6: 53%|#####2 | 3167/6000 [04:05<1:09:25, 1.47s/it, lr: 1.0e-04 loss: 6.947e-01] my_first_lora_v6: 53%|#####2 | 3168/6000 [04:06<1:09:11, 1.47s/it, lr: 1.0e-04 loss: 2.362e-01] my_first_lora_v6: 53%|#####2 | 3168/6000 [04:06<1:09:11, 1.47s/it, lr: 1.0e-04 loss: 2.362e-01] my_first_lora_v6: 53%|#####2 | 3169/6000 [04:07<1:09:07, 1.47s/it, lr: 1.0e-04 loss: 5.887e-01] my_first_lora_v6: 53%|#####2 | 3169/6000 [04:07<1:09:07, 1.47s/it, lr: 1.0e-04 loss: 5.887e-01] my_first_lora_v6: 53%|#####2 | 3170/6000 [04:08<1:09:04, 1.46s/it, lr: 1.0e-04 loss: 5.464e-01] my_first_lora_v6: 53%|#####2 | 3170/6000 [04:08<1:09:04, 1.46s/it, lr: 1.0e-04 loss: 5.464e-01] my_first_lora_v6: 53%|#####2 | 3171/6000 [04:10<1:09:01, 1.46s/it, lr: 1.0e-04 loss: 3.081e-01] my_first_lora_v6: 53%|#####2 | 3171/6000 [04:10<1:09:01, 1.46s/it, lr: 1.0e-04 loss: 3.081e-01] my_first_lora_v6: 53%|#####2 | 3172/6000 [04:11<1:08:52, 1.46s/it, lr: 1.0e-04 loss: 7.353e-01] my_first_lora_v6: 53%|#####2 | 3172/6000 [04:11<1:08:52, 1.46s/it, lr: 1.0e-04 loss: 7.353e-01] my_first_lora_v6: 53%|#####2 | 3173/6000 [04:14<1:09:11, 1.47s/it, lr: 1.0e-04 loss: 7.221e-01] my_first_lora_v6: 53%|#####2 | 3173/6000 [04:14<1:09:11, 1.47s/it, lr: 1.0e-04 loss: 7.221e-01] my_first_lora_v6: 53%|#####2 | 3174/6000 [04:15<1:09:08, 1.47s/it, lr: 1.0e-04 loss: 4.874e-01] my_first_lora_v6: 53%|#####2 | 3174/6000 [04:15<1:09:08, 1.47s/it, lr: 1.0e-04 loss: 4.874e-01] my_first_lora_v6: 53%|#####2 | 3175/6000 [04:17<1:09:22, 1.47s/it, lr: 1.0e-04 loss: 7.159e-01] my_first_lora_v6: 53%|#####2 | 3175/6000 [04:17<1:09:22, 1.47s/it, lr: 1.0e-04 loss: 7.159e-01] my_first_lora_v6: 53%|#####2 | 3176/6000 [04:19<1:09:16, 1.47s/it, lr: 1.0e-04 loss: 8.423e-01] my_first_lora_v6: 53%|#####2 | 3176/6000 [04:19<1:09:16, 1.47s/it, lr: 1.0e-04 loss: 8.423e-01] my_first_lora_v6: 53%|#####2 | 3177/6000 [04:21<1:09:27, 1.48s/it, lr: 1.0e-04 loss: 1.731e-01] my_first_lora_v6: 53%|#####2 | 3177/6000 [04:21<1:09:27, 1.48s/it, lr: 1.0e-04 loss: 1.731e-01] my_first_lora_v6: 53%|#####2 | 3178/6000 [04:23<1:09:37, 1.48s/it, lr: 1.0e-04 loss: 5.858e-01] my_first_lora_v6: 53%|#####2 | 3178/6000 [04:23<1:09:37, 1.48s/it, lr: 1.0e-04 loss: 5.858e-01] my_first_lora_v6: 53%|#####2 | 3179/6000 [04:24<1:09:24, 1.48s/it, lr: 1.0e-04 loss: 5.792e-01] my_first_lora_v6: 53%|#####2 | 3179/6000 [04:24<1:09:24, 1.48s/it, lr: 1.0e-04 loss: 5.792e-01] my_first_lora_v6: 53%|#####3 | 3180/6000 [04:24<1:09:09, 1.47s/it, lr: 1.0e-04 loss: 4.418e-01] my_first_lora_v6: 53%|#####3 | 3180/6000 [04:24<1:09:09, 1.47s/it, lr: 1.0e-04 loss: 4.418e-01] my_first_lora_v6: 53%|#####3 | 3181/6000 [04:25<1:08:56, 1.47s/it, lr: 1.0e-04 loss: 7.207e-01] my_first_lora_v6: 53%|#####3 | 3181/6000 [04:25<1:08:56, 1.47s/it, lr: 1.0e-04 loss: 7.207e-01] my_first_lora_v6: 53%|#####3 | 3182/6000 [04:28<1:09:09, 1.47s/it, lr: 1.0e-04 loss: 7.089e-01] my_first_lora_v6: 53%|#####3 | 3182/6000 [04:28<1:09:09, 1.47s/it, lr: 1.0e-04 loss: 7.089e-01] my_first_lora_v6: 53%|#####3 | 3183/6000 [04:28<1:08:56, 1.47s/it, lr: 1.0e-04 loss: 4.548e-01] my_first_lora_v6: 53%|#####3 | 3183/6000 [04:28<1:08:56, 1.47s/it, lr: 1.0e-04 loss: 4.548e-01] my_first_lora_v6: 53%|#####3 | 3184/6000 [04:30<1:08:53, 1.47s/it, lr: 1.0e-04 loss: 3.791e-01] my_first_lora_v6: 53%|#####3 | 3184/6000 [04:30<1:08:53, 1.47s/it, lr: 1.0e-04 loss: 3.791e-01] my_first_lora_v6: 53%|#####3 | 3185/6000 [04:32<1:09:07, 1.47s/it, lr: 1.0e-04 loss: 7.384e-01] my_first_lora_v6: 53%|#####3 | 3185/6000 [04:32<1:09:07, 1.47s/it, lr: 1.0e-04 loss: 7.384e-01] my_first_lora_v6: 53%|#####3 | 3186/6000 [04:34<1:09:20, 1.48s/it, lr: 1.0e-04 loss: 7.251e-01] my_first_lora_v6: 53%|#####3 | 3186/6000 [04:34<1:09:20, 1.48s/it, lr: 1.0e-04 loss: 7.251e-01] my_first_lora_v6: 53%|#####3 | 3187/6000 [04:36<1:09:20, 1.48s/it, lr: 1.0e-04 loss: 2.794e-01] my_first_lora_v6: 53%|#####3 | 3187/6000 [04:36<1:09:20, 1.48s/it, lr: 1.0e-04 loss: 2.794e-01] my_first_lora_v6: 53%|#####3 | 3188/6000 [04:37<1:09:17, 1.48s/it, lr: 1.0e-04 loss: 3.256e-01] my_first_lora_v6: 53%|#####3 | 3188/6000 [04:37<1:09:17, 1.48s/it, lr: 1.0e-04 loss: 3.256e-01] my_first_lora_v6: 53%|#####3 | 3189/6000 [04:39<1:09:11, 1.48s/it, lr: 1.0e-04 loss: 8.382e-01] my_first_lora_v6: 53%|#####3 | 3189/6000 [04:39<1:09:11, 1.48s/it, lr: 1.0e-04 loss: 8.382e-01] my_first_lora_v6: 53%|#####3 | 3190/6000 [04:39<1:08:59, 1.47s/it, lr: 1.0e-04 loss: 1.280e-01] my_first_lora_v6: 53%|#####3 | 3190/6000 [04:39<1:08:59, 1.47s/it, lr: 1.0e-04 loss: 1.280e-01] my_first_lora_v6: 53%|#####3 | 3191/6000 [04:42<1:09:11, 1.48s/it, lr: 1.0e-04 loss: 5.410e-01] my_first_lora_v6: 53%|#####3 | 3191/6000 [04:42<1:09:11, 1.48s/it, lr: 1.0e-04 loss: 5.410e-01] my_first_lora_v6: 53%|#####3 | 3192/6000 [04:42<1:08:58, 1.47s/it, lr: 1.0e-04 loss: 4.390e-02] my_first_lora_v6: 53%|#####3 | 3192/6000 [04:42<1:08:58, 1.47s/it, lr: 1.0e-04 loss: 4.390e-02] my_first_lora_v6: 53%|#####3 | 3193/6000 [04:44<1:08:55, 1.47s/it, lr: 1.0e-04 loss: 6.464e-01] my_first_lora_v6: 53%|#####3 | 3193/6000 [04:44<1:08:55, 1.47s/it, lr: 1.0e-04 loss: 6.464e-01] my_first_lora_v6: 53%|#####3 | 3194/6000 [04:46<1:09:07, 1.48s/it, lr: 1.0e-04 loss: 1.899e-01] my_first_lora_v6: 53%|#####3 | 3194/6000 [04:46<1:09:07, 1.48s/it, lr: 1.0e-04 loss: 1.899e-01] my_first_lora_v6: 53%|#####3 | 3195/6000 [04:47<1:08:54, 1.47s/it, lr: 1.0e-04 loss: 3.211e-01] my_first_lora_v6: 53%|#####3 | 3195/6000 [04:47<1:08:54, 1.47s/it, lr: 1.0e-04 loss: 3.211e-01] my_first_lora_v6: 53%|#####3 | 3196/6000 [04:48<1:08:42, 1.47s/it, lr: 1.0e-04 loss: 3.828e-01] my_first_lora_v6: 53%|#####3 | 3196/6000 [04:48<1:08:42, 1.47s/it, lr: 1.0e-04 loss: 3.828e-01] my_first_lora_v6: 53%|#####3 | 3197/6000 [04:49<1:08:36, 1.47s/it, lr: 1.0e-04 loss: 6.878e-01] my_first_lora_v6: 53%|#####3 | 3197/6000 [04:49<1:08:36, 1.47s/it, lr: 1.0e-04 loss: 6.878e-01] my_first_lora_v6: 53%|#####3 | 3198/6000 [04:50<1:08:33, 1.47s/it, lr: 1.0e-04 loss: 4.752e-01] my_first_lora_v6: 53%|#####3 | 3198/6000 [04:50<1:08:33, 1.47s/it, lr: 1.0e-04 loss: 4.752e-01] my_first_lora_v6: 53%|#####3 | 3199/6000 [04:51<1:08:28, 1.47s/it, lr: 1.0e-04 loss: 8.529e-01] my_first_lora_v6: 53%|#####3 | 3199/6000 [04:51<1:08:28, 1.47s/it, lr: 1.0e-04 loss: 8.529e-01] my_first_lora_v6: 53%|#####3 | 3200/6000 [04:52<1:08:16, 1.46s/it, lr: 1.0e-04 loss: 4.904e-01] my_first_lora_v6: 53%|#####3 | 3200/6000 [04:52<1:08:16, 1.46s/it, lr: 1.0e-04 loss: 4.904e-01] my_first_lora_v6: 53%|#####3 | 3201/6000 [04:54<1:08:16, 1.46s/it, lr: 1.0e-04 loss: 5.963e-01] my_first_lora_v6: 53%|#####3 | 3201/6000 [04:54<1:08:16, 1.46s/it, lr: 1.0e-04 loss: 5.963e-01] my_first_lora_v6: 53%|#####3 | 3202/6000 [04:54<1:08:05, 1.46s/it, lr: 1.0e-04 loss: 1.486e-01] my_first_lora_v6: 53%|#####3 | 3202/6000 [04:54<1:08:05, 1.46s/it, lr: 1.0e-04 loss: 1.486e-01] my_first_lora_v6: 53%|#####3 | 3203/6000 [04:56<1:08:02, 1.46s/it, lr: 1.0e-04 loss: 6.515e-01] my_first_lora_v6: 53%|#####3 | 3203/6000 [04:56<1:08:02, 1.46s/it, lr: 1.0e-04 loss: 6.515e-01] my_first_lora_v6: 53%|#####3 | 3204/6000 [04:57<1:07:59, 1.46s/it, lr: 1.0e-04 loss: 1.018e-01] my_first_lora_v6: 53%|#####3 | 3204/6000 [04:57<1:07:59, 1.46s/it, lr: 1.0e-04 loss: 1.018e-01] my_first_lora_v6: 53%|#####3 | 3205/6000 [04:58<1:07:47, 1.46s/it, lr: 1.0e-04 loss: 7.099e-01] my_first_lora_v6: 53%|#####3 | 3205/6000 [04:58<1:07:47, 1.46s/it, lr: 1.0e-04 loss: 7.099e-01] my_first_lora_v6: 53%|#####3 | 3206/6000 [05:01<1:08:02, 1.46s/it, lr: 1.0e-04 loss: 5.071e-01] my_first_lora_v6: 53%|#####3 | 3206/6000 [05:01<1:08:02, 1.46s/it, lr: 1.0e-04 loss: 5.071e-01] my_first_lora_v6: 53%|#####3 | 3207/6000 [05:01<1:07:51, 1.46s/it, lr: 1.0e-04 loss: 5.401e-01] my_first_lora_v6: 53%|#####3 | 3207/6000 [05:01<1:07:51, 1.46s/it, lr: 1.0e-04 loss: 5.401e-01] my_first_lora_v6: 53%|#####3 | 3208/6000 [05:04<1:08:00, 1.46s/it, lr: 1.0e-04 loss: 8.447e-02] my_first_lora_v6: 53%|#####3 | 3208/6000 [05:04<1:08:00, 1.46s/it, lr: 1.0e-04 loss: 8.447e-02] my_first_lora_v6: 53%|#####3 | 3209/6000 [05:06<1:08:12, 1.47s/it, lr: 1.0e-04 loss: 3.611e-01] my_first_lora_v6: 53%|#####3 | 3209/6000 [05:06<1:08:12, 1.47s/it, lr: 1.0e-04 loss: 3.611e-01] my_first_lora_v6: 54%|#####3 | 3210/6000 [05:08<1:08:24, 1.47s/it, lr: 1.0e-04 loss: 1.574e-01] my_first_lora_v6: 54%|#####3 | 3210/6000 [05:08<1:08:24, 1.47s/it, lr: 1.0e-04 loss: 1.574e-01] my_first_lora_v6: 54%|#####3 | 3211/6000 [05:10<1:08:21, 1.47s/it, lr: 1.0e-04 loss: 4.074e-02] my_first_lora_v6: 54%|#####3 | 3211/6000 [05:10<1:08:21, 1.47s/it, lr: 1.0e-04 loss: 4.074e-02] my_first_lora_v6: 54%|#####3 | 3212/6000 [05:11<1:08:18, 1.47s/it, lr: 1.0e-04 loss: 5.416e-01] my_first_lora_v6: 54%|#####3 | 3212/6000 [05:11<1:08:18, 1.47s/it, lr: 1.0e-04 loss: 5.416e-01] my_first_lora_v6: 54%|#####3 | 3213/6000 [05:12<1:08:06, 1.47s/it, lr: 1.0e-04 loss: 7.544e-01] my_first_lora_v6: 54%|#####3 | 3213/6000 [05:12<1:08:06, 1.47s/it, lr: 1.0e-04 loss: 7.544e-01] my_first_lora_v6: 54%|#####3 | 3214/6000 [05:14<1:08:17, 1.47s/it, lr: 1.0e-04 loss: 5.605e-01] my_first_lora_v6: 54%|#####3 | 3214/6000 [05:14<1:08:17, 1.47s/it, lr: 1.0e-04 loss: 5.605e-01] my_first_lora_v6: 54%|#####3 | 3215/6000 [05:16<1:08:14, 1.47s/it, lr: 1.0e-04 loss: 7.618e-01] my_first_lora_v6: 54%|#####3 | 3215/6000 [05:16<1:08:14, 1.47s/it, lr: 1.0e-04 loss: 7.618e-01] my_first_lora_v6: 54%|#####3 | 3216/6000 [05:18<1:08:25, 1.47s/it, lr: 1.0e-04 loss: 6.515e-01] my_first_lora_v6: 54%|#####3 | 3216/6000 [05:18<1:08:25, 1.47s/it, lr: 1.0e-04 loss: 6.515e-01] my_first_lora_v6: 54%|#####3 | 3217/6000 [05:19<1:08:13, 1.47s/it, lr: 1.0e-04 loss: 2.409e-01] my_first_lora_v6: 54%|#####3 | 3217/6000 [05:19<1:08:13, 1.47s/it, lr: 1.0e-04 loss: 2.409e-01] my_first_lora_v6: 54%|#####3 | 3218/6000 [05:19<1:08:02, 1.47s/it, lr: 1.0e-04 loss: 5.209e-01] my_first_lora_v6: 54%|#####3 | 3218/6000 [05:19<1:08:02, 1.47s/it, lr: 1.0e-04 loss: 5.209e-01] my_first_lora_v6: 54%|#####3 | 3219/6000 [05:21<1:07:59, 1.47s/it, lr: 1.0e-04 loss: 2.938e-01] my_first_lora_v6: 54%|#####3 | 3219/6000 [05:21<1:07:59, 1.47s/it, lr: 1.0e-04 loss: 2.938e-01] my_first_lora_v6: 54%|#####3 | 3220/6000 [05:22<1:07:54, 1.47s/it, lr: 1.0e-04 loss: 5.944e-01] my_first_lora_v6: 54%|#####3 | 3220/6000 [05:22<1:07:54, 1.47s/it, lr: 1.0e-04 loss: 5.944e-01] my_first_lora_v6: 54%|#####3 | 3221/6000 [05:23<1:07:49, 1.46s/it, lr: 1.0e-04 loss: 7.504e-01] my_first_lora_v6: 54%|#####3 | 3221/6000 [05:23<1:07:49, 1.46s/it, lr: 1.0e-04 loss: 7.504e-01] my_first_lora_v6: 54%|#####3 | 3222/6000 [05:24<1:07:46, 1.46s/it, lr: 1.0e-04 loss: 5.518e-01] my_first_lora_v6: 54%|#####3 | 3222/6000 [05:24<1:07:46, 1.46s/it, lr: 1.0e-04 loss: 5.518e-01] my_first_lora_v6: 54%|#####3 | 3223/6000 [05:27<1:07:54, 1.47s/it, lr: 1.0e-04 loss: 5.312e-02] my_first_lora_v6: 54%|#####3 | 3223/6000 [05:27<1:07:54, 1.47s/it, lr: 1.0e-04 loss: 5.312e-02] my_first_lora_v6: 54%|#####3 | 3224/6000 [05:29<1:08:02, 1.47s/it, lr: 1.0e-04 loss: 4.408e-01] my_first_lora_v6: 54%|#####3 | 3224/6000 [05:29<1:08:02, 1.47s/it, lr: 1.0e-04 loss: 4.408e-01] my_first_lora_v6: 54%|#####3 | 3225/6000 [05:30<1:07:52, 1.47s/it, lr: 1.0e-04 loss: 1.478e-01] my_first_lora_v6: 54%|#####3 | 3225/6000 [05:30<1:07:52, 1.47s/it, lr: 1.0e-04 loss: 1.478e-01] my_first_lora_v6: 54%|#####3 | 3226/6000 [05:32<1:08:06, 1.47s/it, lr: 1.0e-04 loss: 6.308e-01] my_first_lora_v6: 54%|#####3 | 3226/6000 [05:32<1:08:06, 1.47s/it, lr: 1.0e-04 loss: 6.308e-01] my_first_lora_v6: 54%|#####3 | 3227/6000 [05:33<1:07:55, 1.47s/it, lr: 1.0e-04 loss: 7.804e-01] my_first_lora_v6: 54%|#####3 | 3227/6000 [05:33<1:07:55, 1.47s/it, lr: 1.0e-04 loss: 7.804e-01] my_first_lora_v6: 54%|#####3 | 3228/6000 [05:34<1:07:44, 1.47s/it, lr: 1.0e-04 loss: 3.649e-01] my_first_lora_v6: 54%|#####3 | 3228/6000 [05:34<1:07:44, 1.47s/it, lr: 1.0e-04 loss: 3.649e-01] my_first_lora_v6: 54%|#####3 | 3229/6000 [05:36<1:07:56, 1.47s/it, lr: 1.0e-04 loss: 1.049e-01] my_first_lora_v6: 54%|#####3 | 3229/6000 [05:36<1:07:56, 1.47s/it, lr: 1.0e-04 loss: 1.049e-01] my_first_lora_v6: 54%|#####3 | 3230/6000 [05:38<1:07:53, 1.47s/it, lr: 1.0e-04 loss: 7.166e-01] my_first_lora_v6: 54%|#####3 | 3230/6000 [05:38<1:07:53, 1.47s/it, lr: 1.0e-04 loss: 7.166e-01] my_first_lora_v6: 54%|#####3 | 3231/6000 [05:39<1:07:51, 1.47s/it, lr: 1.0e-04 loss: 3.220e-01] my_first_lora_v6: 54%|#####3 | 3231/6000 [05:39<1:07:51, 1.47s/it, lr: 1.0e-04 loss: 3.220e-01] my_first_lora_v6: 54%|#####3 | 3232/6000 [05:40<1:07:40, 1.47s/it, lr: 1.0e-04 loss: 9.828e-02] my_first_lora_v6: 54%|#####3 | 3232/6000 [05:40<1:07:40, 1.47s/it, lr: 1.0e-04 loss: 9.828e-02] my_first_lora_v6: 54%|#####3 | 3233/6000 [05:41<1:07:38, 1.47s/it, lr: 1.0e-04 loss: 6.423e-01] my_first_lora_v6: 54%|#####3 | 3233/6000 [05:41<1:07:38, 1.47s/it, lr: 1.0e-04 loss: 6.423e-01] my_first_lora_v6: 54%|#####3 | 3234/6000 [05:42<1:07:27, 1.46s/it, lr: 1.0e-04 loss: 7.839e-01] my_first_lora_v6: 54%|#####3 | 3234/6000 [05:42<1:07:27, 1.46s/it, lr: 1.0e-04 loss: 7.839e-01] my_first_lora_v6: 54%|#####3 | 3235/6000 [05:43<1:07:25, 1.46s/it, lr: 1.0e-04 loss: 1.063e-01] my_first_lora_v6: 54%|#####3 | 3235/6000 [05:43<1:07:25, 1.46s/it, lr: 1.0e-04 loss: 1.063e-01] my_first_lora_v6: 54%|#####3 | 3236/6000 [05:46<1:07:35, 1.47s/it, lr: 1.0e-04 loss: 5.809e-01] my_first_lora_v6: 54%|#####3 | 3236/6000 [05:46<1:07:35, 1.47s/it, lr: 1.0e-04 loss: 5.809e-01] my_first_lora_v6: 54%|#####3 | 3237/6000 [05:48<1:07:45, 1.47s/it, lr: 1.0e-04 loss: 2.373e-01] my_first_lora_v6: 54%|#####3 | 3237/6000 [05:48<1:07:45, 1.47s/it, lr: 1.0e-04 loss: 2.373e-01] my_first_lora_v6: 54%|#####3 | 3238/6000 [05:50<1:07:43, 1.47s/it, lr: 1.0e-04 loss: 7.868e-01] my_first_lora_v6: 54%|#####3 | 3238/6000 [05:50<1:07:43, 1.47s/it, lr: 1.0e-04 loss: 7.868e-01] my_first_lora_v6: 54%|#####3 | 3239/6000 [05:51<1:07:42, 1.47s/it, lr: 1.0e-04 loss: 4.116e-01] my_first_lora_v6: 54%|#####3 | 3239/6000 [05:51<1:07:42, 1.47s/it, lr: 1.0e-04 loss: 4.116e-01] my_first_lora_v6: 54%|#####4 | 3240/6000 [05:54<1:07:55, 1.48s/it, lr: 1.0e-04 loss: 6.988e-01] my_first_lora_v6: 54%|#####4 | 3240/6000 [05:54<1:07:55, 1.48s/it, lr: 1.0e-04 loss: 6.988e-01] my_first_lora_v6: 54%|#####4 | 3241/6000 [05:55<1:07:45, 1.47s/it, lr: 1.0e-04 loss: 3.902e-01] my_first_lora_v6: 54%|#####4 | 3241/6000 [05:55<1:07:45, 1.47s/it, lr: 1.0e-04 loss: 3.902e-01] my_first_lora_v6: 54%|#####4 | 3242/6000 [05:57<1:07:52, 1.48s/it, lr: 1.0e-04 loss: 4.973e-01] my_first_lora_v6: 54%|#####4 | 3242/6000 [05:57<1:07:52, 1.48s/it, lr: 1.0e-04 loss: 4.973e-01] my_first_lora_v6: 54%|#####4 | 3243/6000 [05:59<1:08:02, 1.48s/it, lr: 1.0e-04 loss: 5.535e-01] my_first_lora_v6: 54%|#####4 | 3243/6000 [05:59<1:08:02, 1.48s/it, lr: 1.0e-04 loss: 5.535e-01] my_first_lora_v6: 54%|#####4 | 3244/6000 [06:00<1:07:56, 1.48s/it, lr: 1.0e-04 loss: 3.146e-01] my_first_lora_v6: 54%|#####4 | 3244/6000 [06:00<1:07:56, 1.48s/it, lr: 1.0e-04 loss: 3.146e-01] my_first_lora_v6: 54%|#####4 | 3245/6000 [06:02<1:07:53, 1.48s/it, lr: 1.0e-04 loss: 4.553e-01] my_first_lora_v6: 54%|#####4 | 3245/6000 [06:02<1:07:53, 1.48s/it, lr: 1.0e-04 loss: 4.553e-01] my_first_lora_v6: 54%|#####4 | 3246/6000 [06:02<1:07:43, 1.48s/it, lr: 1.0e-04 loss: 9.520e-02] my_first_lora_v6: 54%|#####4 | 3246/6000 [06:02<1:07:43, 1.48s/it, lr: 1.0e-04 loss: 9.520e-02] my_first_lora_v6: 54%|#####4 | 3247/6000 [06:04<1:07:41, 1.48s/it, lr: 1.0e-04 loss: 3.137e-01] my_first_lora_v6: 54%|#####4 | 3247/6000 [06:04<1:07:41, 1.48s/it, lr: 1.0e-04 loss: 3.137e-01] my_first_lora_v6: 54%|#####4 | 3248/6000 [06:05<1:07:30, 1.47s/it, lr: 1.0e-04 loss: 6.591e-01] my_first_lora_v6: 54%|#####4 | 3248/6000 [06:05<1:07:30, 1.47s/it, lr: 1.0e-04 loss: 6.591e-01] my_first_lora_v6: 54%|#####4 | 3249/6000 [06:06<1:07:28, 1.47s/it, lr: 1.0e-04 loss: 8.874e-02] my_first_lora_v6: 54%|#####4 | 3249/6000 [06:06<1:07:28, 1.47s/it, lr: 1.0e-04 loss: 8.874e-02]Unloading assistant lora
Generating Images: 0%| | 0/5 [00:00<?, ?it/s] Generating Images: 0%| | 0/5 [00:00<?, ?it/s]
Generating Images: 20%|## | 1/5 [00:07<00:31, 7.90s/it] Generating Images: 20%|## | 1/5 [00:07<00:31, 7.90s/it]
Generating Images: 40%|#### | 2/5 [00:15<00:23, 7.82s/it] Generating Images: 40%|#### | 2/5 [00:15<00:23, 7.82s/it]
Generating Images: 60%|###### | 3/5 [00:23<00:15, 7.80s/it] Generating Images: 60%|###### | 3/5 [00:23<00:15, 7.80s/it]
Generating Images: 80%|######## | 4/5 [00:31<00:07, 7.78s/it] Generating Images: 80%|######## | 4/5 [00:31<00:07, 7.78s/it]
Generating Images: 100%|##########| 5/5 [00:38<00:00, 7.74s/it] Generating Images: 100%|##########| 5/5 [00:38<00:00, 7.74s/it]
Loading assistant lora
my_first_lora_v6: 54%|#####4 | 3250/6000 [06:08<1:07:37, 1.48s/it, lr: 1.0e-04 loss: 6.195e-01] my_first_lora_v6: 54%|#####4 | 3250/6000 [06:08<1:07:37, 1.48s/it, lr: 1.0e-04 loss: 6.195e-01] my_first_lora_v6: 54%|#####4 | 3251/6000 [06:09<1:07:27, 1.47s/it, lr: 1.0e-04 loss: 5.248e-01] my_first_lora_v6: 54%|#####4 | 3251/6000 [06:09<1:07:27, 1.47s/it, lr: 1.0e-04 loss: 5.248e-01] my_first_lora_v6: 54%|#####4 | 3252/6000 [06:10<1:07:24, 1.47s/it, lr: 1.0e-04 loss: 2.263e-01] my_first_lora_v6: 54%|#####4 | 3252/6000 [06:10<1:07:24, 1.47s/it, lr: 1.0e-04 loss: 2.263e-01] my_first_lora_v6: 54%|#####4 | 3253/6000 [06:13<1:07:34, 1.48s/it, lr: 1.0e-04 loss: 7.448e-01] my_first_lora_v6: 54%|#####4 | 3253/6000 [06:13<1:07:34, 1.48s/it, lr: 1.0e-04 loss: 7.448e-01] my_first_lora_v6: 54%|#####4 | 3254/6000 [06:14<1:07:31, 1.48s/it, lr: 1.0e-04 loss: 7.282e-01] my_first_lora_v6: 54%|#####4 | 3254/6000 [06:14<1:07:31, 1.48s/it, lr: 1.0e-04 loss: 7.282e-01] my_first_lora_v6: 54%|#####4 | 3255/6000 [06:16<1:07:38, 1.48s/it, lr: 1.0e-04 loss: 3.846e-02] my_first_lora_v6: 54%|#####4 | 3255/6000 [06:16<1:07:38, 1.48s/it, lr: 1.0e-04 loss: 3.846e-02] my_first_lora_v6: 54%|#####4 | 3256/6000 [06:18<1:07:33, 1.48s/it, lr: 1.0e-04 loss: 6.324e-01] my_first_lora_v6: 54%|#####4 | 3256/6000 [06:18<1:07:33, 1.48s/it, lr: 1.0e-04 loss: 6.324e-01] my_first_lora_v6: 54%|#####4 | 3257/6000 [06:18<1:07:23, 1.47s/it, lr: 1.0e-04 loss: 5.317e-01] my_first_lora_v6: 54%|#####4 | 3257/6000 [06:18<1:07:23, 1.47s/it, lr: 1.0e-04 loss: 5.317e-01] my_first_lora_v6: 54%|#####4 | 3258/6000 [06:19<1:07:18, 1.47s/it, lr: 1.0e-04 loss: 8.411e-01] my_first_lora_v6: 54%|#####4 | 3258/6000 [06:19<1:07:18, 1.47s/it, lr: 1.0e-04 loss: 8.411e-01] my_first_lora_v6: 54%|#####4 | 3259/6000 [06:20<1:07:08, 1.47s/it, lr: 1.0e-04 loss: 7.845e-01] my_first_lora_v6: 54%|#####4 | 3259/6000 [06:20<1:07:08, 1.47s/it, lr: 1.0e-04 loss: 7.845e-01] my_first_lora_v6: 54%|#####4 | 3260/6000 [06:23<1:07:17, 1.47s/it, lr: 1.0e-04 loss: 6.734e-01] my_first_lora_v6: 54%|#####4 | 3260/6000 [06:23<1:07:17, 1.47s/it, lr: 1.0e-04 loss: 6.734e-01] my_first_lora_v6: 54%|#####4 | 3261/6000 [06:24<1:07:14, 1.47s/it, lr: 1.0e-04 loss: 3.788e-01] my_first_lora_v6: 54%|#####4 | 3261/6000 [06:24<1:07:14, 1.47s/it, lr: 1.0e-04 loss: 3.788e-01] my_first_lora_v6: 54%|#####4 | 3262/6000 [06:25<1:07:05, 1.47s/it, lr: 1.0e-04 loss: 2.001e-01] my_first_lora_v6: 54%|#####4 | 3262/6000 [06:25<1:07:05, 1.47s/it, lr: 1.0e-04 loss: 2.001e-01] my_first_lora_v6: 54%|#####4 | 3263/6000 [06:26<1:06:59, 1.47s/it, lr: 1.0e-04 loss: 2.656e-01] my_first_lora_v6: 54%|#####4 | 3263/6000 [06:26<1:06:59, 1.47s/it, lr: 1.0e-04 loss: 2.656e-01] my_first_lora_v6: 54%|#####4 | 3264/6000 [06:27<1:07:00, 1.47s/it, lr: 1.0e-04 loss: 2.172e-01] my_first_lora_v6: 54%|#####4 | 3264/6000 [06:27<1:07:00, 1.47s/it, lr: 1.0e-04 loss: 2.172e-01] my_first_lora_v6: 54%|#####4 | 3265/6000 [06:29<1:06:57, 1.47s/it, lr: 1.0e-04 loss: 2.083e-01] my_first_lora_v6: 54%|#####4 | 3265/6000 [06:29<1:06:57, 1.47s/it, lr: 1.0e-04 loss: 2.083e-01] my_first_lora_v6: 54%|#####4 | 3266/6000 [06:30<1:06:48, 1.47s/it, lr: 1.0e-04 loss: 3.683e-01] my_first_lora_v6: 54%|#####4 | 3266/6000 [06:30<1:06:48, 1.47s/it, lr: 1.0e-04 loss: 3.683e-01] my_first_lora_v6: 54%|#####4 | 3267/6000 [06:31<1:06:46, 1.47s/it, lr: 1.0e-04 loss: 3.004e-01] my_first_lora_v6: 54%|#####4 | 3267/6000 [06:31<1:06:46, 1.47s/it, lr: 1.0e-04 loss: 3.004e-01] my_first_lora_v6: 54%|#####4 | 3268/6000 [06:33<1:06:55, 1.47s/it, lr: 1.0e-04 loss: 1.183e-01] my_first_lora_v6: 54%|#####4 | 3268/6000 [06:33<1:06:55, 1.47s/it, lr: 1.0e-04 loss: 1.183e-01] my_first_lora_v6: 54%|#####4 | 3269/6000 [06:36<1:07:01, 1.47s/it, lr: 1.0e-04 loss: 6.541e-01] my_first_lora_v6: 54%|#####4 | 3269/6000 [06:36<1:07:01, 1.47s/it, lr: 1.0e-04 loss: 6.541e-01] my_first_lora_v6: 55%|#####4 | 3270/6000 [06:37<1:06:58, 1.47s/it, lr: 1.0e-04 loss: 7.537e-01] my_first_lora_v6: 55%|#####4 | 3270/6000 [06:37<1:06:58, 1.47s/it, lr: 1.0e-04 loss: 7.537e-01] my_first_lora_v6: 55%|#####4 | 3271/6000 [06:38<1:06:49, 1.47s/it, lr: 1.0e-04 loss: 3.572e-01] my_first_lora_v6: 55%|#####4 | 3271/6000 [06:38<1:06:49, 1.47s/it, lr: 1.0e-04 loss: 3.572e-01] my_first_lora_v6: 55%|#####4 | 3272/6000 [06:38<1:06:40, 1.47s/it, lr: 1.0e-04 loss: 7.445e-01] my_first_lora_v6: 55%|#####4 | 3272/6000 [06:38<1:06:40, 1.47s/it, lr: 1.0e-04 loss: 7.445e-01] my_first_lora_v6: 55%|#####4 | 3273/6000 [06:40<1:06:37, 1.47s/it, lr: 1.0e-04 loss: 1.092e-01] my_first_lora_v6: 55%|#####4 | 3273/6000 [06:40<1:06:37, 1.47s/it, lr: 1.0e-04 loss: 1.092e-01] my_first_lora_v6: 55%|#####4 | 3274/6000 [06:42<1:06:45, 1.47s/it, lr: 1.0e-04 loss: 1.804e-02] my_first_lora_v6: 55%|#####4 | 3274/6000 [06:42<1:06:45, 1.47s/it, lr: 1.0e-04 loss: 1.804e-02] my_first_lora_v6: 55%|#####4 | 3275/6000 [06:43<1:06:36, 1.47s/it, lr: 1.0e-04 loss: 1.709e-01] my_first_lora_v6: 55%|#####4 | 3275/6000 [06:43<1:06:36, 1.47s/it, lr: 1.0e-04 loss: 1.709e-01] my_first_lora_v6: 55%|#####4 | 3276/6000 [06:45<1:06:42, 1.47s/it, lr: 1.0e-04 loss: 1.871e-01] my_first_lora_v6: 55%|#####4 | 3276/6000 [06:45<1:06:42, 1.47s/it, lr: 1.0e-04 loss: 1.871e-01] my_first_lora_v6: 55%|#####4 | 3277/6000 [06:46<1:06:33, 1.47s/it, lr: 1.0e-04 loss: 1.528e-01] my_first_lora_v6: 55%|#####4 | 3277/6000 [06:46<1:06:33, 1.47s/it, lr: 1.0e-04 loss: 1.528e-01] my_first_lora_v6: 55%|#####4 | 3278/6000 [06:48<1:06:44, 1.47s/it, lr: 1.0e-04 loss: 3.576e-01] my_first_lora_v6: 55%|#####4 | 3278/6000 [06:48<1:06:44, 1.47s/it, lr: 1.0e-04 loss: 3.576e-01] my_first_lora_v6: 55%|#####4 | 3279/6000 [06:50<1:06:40, 1.47s/it, lr: 1.0e-04 loss: 3.951e-01] my_first_lora_v6: 55%|#####4 | 3279/6000 [06:50<1:06:40, 1.47s/it, lr: 1.0e-04 loss: 3.951e-01] my_first_lora_v6: 55%|#####4 | 3280/6000 [06:50<1:06:30, 1.47s/it, lr: 1.0e-04 loss: 2.183e-01] my_first_lora_v6: 55%|#####4 | 3280/6000 [06:50<1:06:30, 1.47s/it, lr: 1.0e-04 loss: 2.183e-01] my_first_lora_v6: 55%|#####4 | 3281/6000 [06:52<1:06:28, 1.47s/it, lr: 1.0e-04 loss: 7.397e-01] my_first_lora_v6: 55%|#####4 | 3281/6000 [06:52<1:06:28, 1.47s/it, lr: 1.0e-04 loss: 7.397e-01] my_first_lora_v6: 55%|#####4 | 3282/6000 [06:54<1:06:36, 1.47s/it, lr: 1.0e-04 loss: 7.517e-01] my_first_lora_v6: 55%|#####4 | 3282/6000 [06:54<1:06:36, 1.47s/it, lr: 1.0e-04 loss: 7.517e-01] my_first_lora_v6: 55%|#####4 | 3283/6000 [06:55<1:06:32, 1.47s/it, lr: 1.0e-04 loss: 6.334e-01] my_first_lora_v6: 55%|#####4 | 3283/6000 [06:55<1:06:32, 1.47s/it, lr: 1.0e-04 loss: 6.334e-01] my_first_lora_v6: 55%|#####4 | 3284/6000 [06:58<1:06:42, 1.47s/it, lr: 1.0e-04 loss: 3.023e-01] my_first_lora_v6: 55%|#####4 | 3284/6000 [06:58<1:06:42, 1.47s/it, lr: 1.0e-04 loss: 3.023e-01] my_first_lora_v6: 55%|#####4 | 3285/6000 [06:59<1:06:40, 1.47s/it, lr: 1.0e-04 loss: 7.408e-01] my_first_lora_v6: 55%|#####4 | 3285/6000 [06:59<1:06:40, 1.47s/it, lr: 1.0e-04 loss: 7.408e-01] my_first_lora_v6: 55%|#####4 | 3286/6000 [07:00<1:06:31, 1.47s/it, lr: 1.0e-04 loss: 3.267e-01] my_first_lora_v6: 55%|#####4 | 3286/6000 [07:00<1:06:31, 1.47s/it, lr: 1.0e-04 loss: 3.267e-01] my_first_lora_v6: 55%|#####4 | 3287/6000 [07:02<1:06:31, 1.47s/it, lr: 1.0e-04 loss: 1.272e-01] my_first_lora_v6: 55%|#####4 | 3287/6000 [07:02<1:06:31, 1.47s/it, lr: 1.0e-04 loss: 1.272e-01] my_first_lora_v6: 55%|#####4 | 3288/6000 [07:02<1:06:22, 1.47s/it, lr: 1.0e-04 loss: 4.570e-01] my_first_lora_v6: 55%|#####4 | 3288/6000 [07:02<1:06:22, 1.47s/it, lr: 1.0e-04 loss: 4.570e-01] my_first_lora_v6: 55%|#####4 | 3289/6000 [07:03<1:06:14, 1.47s/it, lr: 1.0e-04 loss: 5.341e-01] my_first_lora_v6: 55%|#####4 | 3289/6000 [07:03<1:06:14, 1.47s/it, lr: 1.0e-04 loss: 5.341e-01] my_first_lora_v6: 55%|#####4 | 3290/6000 [07:04<1:06:10, 1.46s/it, lr: 1.0e-04 loss: 1.968e-01] my_first_lora_v6: 55%|#####4 | 3290/6000 [07:04<1:06:10, 1.46s/it, lr: 1.0e-04 loss: 1.968e-01] my_first_lora_v6: 55%|#####4 | 3291/6000 [07:07<1:06:18, 1.47s/it, lr: 1.0e-04 loss: 1.640e-01] my_first_lora_v6: 55%|#####4 | 3291/6000 [07:07<1:06:18, 1.47s/it, lr: 1.0e-04 loss: 1.640e-01] my_first_lora_v6: 55%|#####4 | 3292/6000 [07:08<1:06:13, 1.47s/it, lr: 1.0e-04 loss: 6.878e-01] my_first_lora_v6: 55%|#####4 | 3292/6000 [07:08<1:06:13, 1.47s/it, lr: 1.0e-04 loss: 6.878e-01] my_first_lora_v6: 55%|#####4 | 3293/6000 [07:10<1:06:21, 1.47s/it, lr: 1.0e-04 loss: 2.532e-01] my_first_lora_v6: 55%|#####4 | 3293/6000 [07:10<1:06:21, 1.47s/it, lr: 1.0e-04 loss: 2.532e-01] my_first_lora_v6: 55%|#####4 | 3294/6000 [07:12<1:06:18, 1.47s/it, lr: 1.0e-04 loss: 1.553e-01] my_first_lora_v6: 55%|#####4 | 3294/6000 [07:12<1:06:18, 1.47s/it, lr: 1.0e-04 loss: 1.553e-01] my_first_lora_v6: 55%|#####4 | 3295/6000 [07:14<1:06:26, 1.47s/it, lr: 1.0e-04 loss: 6.602e-01] my_first_lora_v6: 55%|#####4 | 3295/6000 [07:14<1:06:26, 1.47s/it, lr: 1.0e-04 loss: 6.602e-01] my_first_lora_v6: 55%|#####4 | 3296/6000 [07:16<1:06:23, 1.47s/it, lr: 1.0e-04 loss: 6.113e-01] my_first_lora_v6: 55%|#####4 | 3296/6000 [07:16<1:06:23, 1.47s/it, lr: 1.0e-04 loss: 6.113e-01] my_first_lora_v6: 55%|#####4 | 3297/6000 [07:18<1:06:33, 1.48s/it, lr: 1.0e-04 loss: 2.853e-01] my_first_lora_v6: 55%|#####4 | 3297/6000 [07:18<1:06:33, 1.48s/it, lr: 1.0e-04 loss: 2.853e-01] my_first_lora_v6: 55%|#####4 | 3298/6000 [07:19<1:06:25, 1.47s/it, lr: 1.0e-04 loss: 3.435e-01] my_first_lora_v6: 55%|#####4 | 3298/6000 [07:19<1:06:25, 1.47s/it, lr: 1.0e-04 loss: 3.435e-01] my_first_lora_v6: 55%|#####4 | 3299/6000 [07:20<1:06:22, 1.47s/it, lr: 1.0e-04 loss: 2.034e-01] my_first_lora_v6: 55%|#####4 | 3299/6000 [07:20<1:06:22, 1.47s/it, lr: 1.0e-04 loss: 2.034e-01] my_first_lora_v6: 55%|#####5 | 3300/6000 [07:22<1:06:20, 1.47s/it, lr: 1.0e-04 loss: 7.343e-01] my_first_lora_v6: 55%|#####5 | 3300/6000 [07:22<1:06:20, 1.47s/it, lr: 1.0e-04 loss: 7.343e-01] my_first_lora_v6: 55%|#####5 | 3301/6000 [07:22<1:06:11, 1.47s/it, lr: 1.0e-04 loss: 6.067e-01] my_first_lora_v6: 55%|#####5 | 3301/6000 [07:22<1:06:11, 1.47s/it, lr: 1.0e-04 loss: 6.067e-01] my_first_lora_v6: 55%|#####5 | 3302/6000 [07:24<1:06:07, 1.47s/it, lr: 1.0e-04 loss: 4.280e-01] my_first_lora_v6: 55%|#####5 | 3302/6000 [07:24<1:06:07, 1.47s/it, lr: 1.0e-04 loss: 4.280e-01] my_first_lora_v6: 55%|#####5 | 3303/6000 [07:26<1:06:13, 1.47s/it, lr: 1.0e-04 loss: 2.074e-01] my_first_lora_v6: 55%|#####5 | 3303/6000 [07:26<1:06:13, 1.47s/it, lr: 1.0e-04 loss: 2.074e-01] my_first_lora_v6: 55%|#####5 | 3304/6000 [07:28<1:06:18, 1.48s/it, lr: 1.0e-04 loss: 7.244e-01] my_first_lora_v6: 55%|#####5 | 3304/6000 [07:28<1:06:18, 1.48s/it, lr: 1.0e-04 loss: 7.244e-01] my_first_lora_v6: 55%|#####5 | 3305/6000 [07:29<1:06:15, 1.48s/it, lr: 1.0e-04 loss: 1.664e-01] my_first_lora_v6: 55%|#####5 | 3305/6000 [07:29<1:06:15, 1.48s/it, lr: 1.0e-04 loss: 1.664e-01] my_first_lora_v6: 55%|#####5 | 3306/6000 [07:30<1:06:07, 1.47s/it, lr: 1.0e-04 loss: 6.346e-01] my_first_lora_v6: 55%|#####5 | 3306/6000 [07:30<1:06:07, 1.47s/it, lr: 1.0e-04 loss: 6.346e-01] my_first_lora_v6: 55%|#####5 | 3307/6000 [07:33<1:06:16, 1.48s/it, lr: 1.0e-04 loss: 3.120e-01] my_first_lora_v6: 55%|#####5 | 3307/6000 [07:33<1:06:16, 1.48s/it, lr: 1.0e-04 loss: 3.120e-01] my_first_lora_v6: 55%|#####5 | 3308/6000 [07:34<1:06:08, 1.47s/it, lr: 1.0e-04 loss: 1.306e-01] my_first_lora_v6: 55%|#####5 | 3308/6000 [07:34<1:06:08, 1.47s/it, lr: 1.0e-04 loss: 1.306e-01] my_first_lora_v6: 55%|#####5 | 3309/6000 [07:34<1:06:00, 1.47s/it, lr: 1.0e-04 loss: 7.620e-01] my_first_lora_v6: 55%|#####5 | 3309/6000 [07:34<1:06:00, 1.47s/it, lr: 1.0e-04 loss: 7.620e-01] my_first_lora_v6: 55%|#####5 | 3310/6000 [07:36<1:05:57, 1.47s/it, lr: 1.0e-04 loss: 1.225e-01] my_first_lora_v6: 55%|#####5 | 3310/6000 [07:36<1:05:57, 1.47s/it, lr: 1.0e-04 loss: 1.225e-01] my_first_lora_v6: 55%|#####5 | 3311/6000 [07:37<1:05:55, 1.47s/it, lr: 1.0e-04 loss: 2.244e-01] my_first_lora_v6: 55%|#####5 | 3311/6000 [07:37<1:05:55, 1.47s/it, lr: 1.0e-04 loss: 2.244e-01] my_first_lora_v6: 55%|#####5 | 3312/6000 [07:38<1:05:52, 1.47s/it, lr: 1.0e-04 loss: 6.139e-01] my_first_lora_v6: 55%|#####5 | 3312/6000 [07:38<1:05:52, 1.47s/it, lr: 1.0e-04 loss: 6.139e-01] my_first_lora_v6: 55%|#####5 | 3313/6000 [07:40<1:05:50, 1.47s/it, lr: 1.0e-04 loss: 6.684e-01] my_first_lora_v6: 55%|#####5 | 3313/6000 [07:40<1:05:50, 1.47s/it, lr: 1.0e-04 loss: 6.684e-01] my_first_lora_v6: 55%|#####5 | 3314/6000 [07:42<1:05:59, 1.47s/it, lr: 1.0e-04 loss: 1.088e-01] my_first_lora_v6: 55%|#####5 | 3314/6000 [07:42<1:05:59, 1.47s/it, lr: 1.0e-04 loss: 1.088e-01] my_first_lora_v6: 55%|#####5 | 3315/6000 [07:43<1:05:52, 1.47s/it, lr: 1.0e-04 loss: 5.675e-01] my_first_lora_v6: 55%|#####5 | 3315/6000 [07:43<1:05:52, 1.47s/it, lr: 1.0e-04 loss: 5.675e-01] my_first_lora_v6: 55%|#####5 | 3316/6000 [07:45<1:05:57, 1.47s/it, lr: 1.0e-04 loss: 2.157e-01] my_first_lora_v6: 55%|#####5 | 3316/6000 [07:45<1:05:57, 1.47s/it, lr: 1.0e-04 loss: 2.157e-01] my_first_lora_v6: 55%|#####5 | 3317/6000 [07:46<1:05:49, 1.47s/it, lr: 1.0e-04 loss: 4.984e-01] my_first_lora_v6: 55%|#####5 | 3317/6000 [07:46<1:05:49, 1.47s/it, lr: 1.0e-04 loss: 4.984e-01] my_first_lora_v6: 55%|#####5 | 3318/6000 [07:47<1:05:46, 1.47s/it, lr: 1.0e-04 loss: 4.159e-01] my_first_lora_v6: 55%|#####5 | 3318/6000 [07:47<1:05:46, 1.47s/it, lr: 1.0e-04 loss: 4.159e-01] my_first_lora_v6: 55%|#####5 | 3319/6000 [07:48<1:05:38, 1.47s/it, lr: 1.0e-04 loss: 4.639e-02] my_first_lora_v6: 55%|#####5 | 3319/6000 [07:48<1:05:38, 1.47s/it, lr: 1.0e-04 loss: 4.639e-02] my_first_lora_v6: 55%|#####5 | 3320/6000 [07:49<1:05:31, 1.47s/it, lr: 1.0e-04 loss: 3.846e-01] my_first_lora_v6: 55%|#####5 | 3320/6000 [07:49<1:05:31, 1.47s/it, lr: 1.0e-04 loss: 3.846e-01] my_first_lora_v6: 55%|#####5 | 3321/6000 [07:50<1:05:28, 1.47s/it, lr: 1.0e-04 loss: 2.205e-01] my_first_lora_v6: 55%|#####5 | 3321/6000 [07:50<1:05:28, 1.47s/it, lr: 1.0e-04 loss: 2.205e-01] my_first_lora_v6: 55%|#####5 | 3322/6000 [07:51<1:05:24, 1.47s/it, lr: 1.0e-04 loss: 2.617e-01] my_first_lora_v6: 55%|#####5 | 3322/6000 [07:51<1:05:24, 1.47s/it, lr: 1.0e-04 loss: 2.617e-01] my_first_lora_v6: 55%|#####5 | 3323/6000 [07:52<1:05:16, 1.46s/it, lr: 1.0e-04 loss: 6.831e-01] my_first_lora_v6: 55%|#####5 | 3323/6000 [07:52<1:05:16, 1.46s/it, lr: 1.0e-04 loss: 6.831e-01] my_first_lora_v6: 55%|#####5 | 3324/6000 [07:53<1:05:14, 1.46s/it, lr: 1.0e-04 loss: 2.771e-01] my_first_lora_v6: 55%|#####5 | 3324/6000 [07:53<1:05:14, 1.46s/it, lr: 1.0e-04 loss: 2.771e-01] my_first_lora_v6: 55%|#####5 | 3325/6000 [07:55<1:05:11, 1.46s/it, lr: 1.0e-04 loss: 6.610e-01] my_first_lora_v6: 55%|#####5 | 3325/6000 [07:55<1:05:11, 1.46s/it, lr: 1.0e-04 loss: 6.610e-01] my_first_lora_v6: 55%|#####5 | 3326/6000 [07:57<1:05:18, 1.47s/it, lr: 1.0e-04 loss: 7.358e-01] my_first_lora_v6: 55%|#####5 | 3326/6000 [07:57<1:05:18, 1.47s/it, lr: 1.0e-04 loss: 7.358e-01] my_first_lora_v6: 55%|#####5 | 3327/6000 [07:58<1:05:11, 1.46s/it, lr: 1.0e-04 loss: 2.949e-01] my_first_lora_v6: 55%|#####5 | 3327/6000 [07:58<1:05:11, 1.46s/it, lr: 1.0e-04 loss: 2.949e-01] my_first_lora_v6: 55%|#####5 | 3328/6000 [08:00<1:05:16, 1.47s/it, lr: 1.0e-04 loss: 5.671e-01] my_first_lora_v6: 55%|#####5 | 3328/6000 [08:00<1:05:16, 1.47s/it, lr: 1.0e-04 loss: 5.671e-01] my_first_lora_v6: 55%|#####5 | 3329/6000 [08:01<1:05:12, 1.46s/it, lr: 1.0e-04 loss: 2.174e-01] my_first_lora_v6: 55%|#####5 | 3329/6000 [08:01<1:05:12, 1.46s/it, lr: 1.0e-04 loss: 2.174e-01] my_first_lora_v6: 56%|#####5 | 3330/6000 [08:04<1:05:19, 1.47s/it, lr: 1.0e-04 loss: 5.532e-01] my_first_lora_v6: 56%|#####5 | 3330/6000 [08:04<1:05:19, 1.47s/it, lr: 1.0e-04 loss: 5.532e-01] my_first_lora_v6: 56%|#####5 | 3331/6000 [08:06<1:05:25, 1.47s/it, lr: 1.0e-04 loss: 3.642e-01] my_first_lora_v6: 56%|#####5 | 3331/6000 [08:06<1:05:25, 1.47s/it, lr: 1.0e-04 loss: 3.642e-01] my_first_lora_v6: 56%|#####5 | 3332/6000 [08:09<1:05:32, 1.47s/it, lr: 1.0e-04 loss: 6.621e-01] my_first_lora_v6: 56%|#####5 | 3332/6000 [08:09<1:05:32, 1.47s/it, lr: 1.0e-04 loss: 6.621e-01] my_first_lora_v6: 56%|#####5 | 3333/6000 [08:10<1:05:30, 1.47s/it, lr: 1.0e-04 loss: 3.127e-01] my_first_lora_v6: 56%|#####5 | 3333/6000 [08:10<1:05:30, 1.47s/it, lr: 1.0e-04 loss: 3.127e-01] my_first_lora_v6: 56%|#####5 | 3334/6000 [08:11<1:05:22, 1.47s/it, lr: 1.0e-04 loss: 3.300e-01] my_first_lora_v6: 56%|#####5 | 3334/6000 [08:11<1:05:22, 1.47s/it, lr: 1.0e-04 loss: 3.300e-01] my_first_lora_v6: 56%|#####5 | 3335/6000 [08:12<1:05:21, 1.47s/it, lr: 1.0e-04 loss: 2.077e-01] my_first_lora_v6: 56%|#####5 | 3335/6000 [08:12<1:05:21, 1.47s/it, lr: 1.0e-04 loss: 2.077e-01] my_first_lora_v6: 56%|#####5 | 3336/6000 [08:15<1:05:30, 1.48s/it, lr: 1.0e-04 loss: 6.986e-01] my_first_lora_v6: 56%|#####5 | 3336/6000 [08:15<1:05:30, 1.48s/it, lr: 1.0e-04 loss: 6.986e-01] my_first_lora_v6: 56%|#####5 | 3337/6000 [08:16<1:05:22, 1.47s/it, lr: 1.0e-04 loss: 4.274e-01] my_first_lora_v6: 56%|#####5 | 3337/6000 [08:16<1:05:22, 1.47s/it, lr: 1.0e-04 loss: 4.274e-01] my_first_lora_v6: 56%|#####5 | 3338/6000 [08:17<1:05:19, 1.47s/it, lr: 1.0e-04 loss: 3.130e-01] my_first_lora_v6: 56%|#####5 | 3338/6000 [08:17<1:05:19, 1.47s/it, lr: 1.0e-04 loss: 3.130e-01] my_first_lora_v6: 56%|#####5 | 3339/6000 [08:18<1:05:12, 1.47s/it, lr: 1.0e-04 loss: 7.366e-01] my_first_lora_v6: 56%|#####5 | 3339/6000 [08:18<1:05:12, 1.47s/it, lr: 1.0e-04 loss: 7.366e-01] my_first_lora_v6: 56%|#####5 | 3340/6000 [08:20<1:05:18, 1.47s/it, lr: 1.0e-04 loss: 6.324e-01] my_first_lora_v6: 56%|#####5 | 3340/6000 [08:20<1:05:18, 1.47s/it, lr: 1.0e-04 loss: 6.324e-01] my_first_lora_v6: 56%|#####5 | 3341/6000 [08:23<1:05:27, 1.48s/it, lr: 1.0e-04 loss: 5.562e-01] my_first_lora_v6: 56%|#####5 | 3341/6000 [08:23<1:05:27, 1.48s/it, lr: 1.0e-04 loss: 5.562e-01] my_first_lora_v6: 56%|#####5 | 3342/6000 [08:24<1:05:19, 1.47s/it, lr: 1.0e-04 loss: 2.769e-01] my_first_lora_v6: 56%|#####5 | 3342/6000 [08:24<1:05:19, 1.47s/it, lr: 1.0e-04 loss: 2.769e-01] my_first_lora_v6: 56%|#####5 | 3343/6000 [08:25<1:05:17, 1.47s/it, lr: 1.0e-04 loss: 7.362e-01] my_first_lora_v6: 56%|#####5 | 3343/6000 [08:25<1:05:17, 1.47s/it, lr: 1.0e-04 loss: 7.362e-01] my_first_lora_v6: 56%|#####5 | 3344/6000 [08:27<1:05:21, 1.48s/it, lr: 1.0e-04 loss: 4.603e-01] my_first_lora_v6: 56%|#####5 | 3344/6000 [08:27<1:05:21, 1.48s/it, lr: 1.0e-04 loss: 4.603e-01] my_first_lora_v6: 56%|#####5 | 3345/6000 [08:28<1:05:13, 1.47s/it, lr: 1.0e-04 loss: 1.536e-01] my_first_lora_v6: 56%|#####5 | 3345/6000 [08:28<1:05:13, 1.47s/it, lr: 1.0e-04 loss: 1.536e-01] my_first_lora_v6: 56%|#####5 | 3346/6000 [08:29<1:05:09, 1.47s/it, lr: 1.0e-04 loss: 7.935e-01] my_first_lora_v6: 56%|#####5 | 3346/6000 [08:29<1:05:09, 1.47s/it, lr: 1.0e-04 loss: 7.935e-01] my_first_lora_v6: 56%|#####5 | 3347/6000 [08:30<1:05:02, 1.47s/it, lr: 1.0e-04 loss: 5.964e-01] my_first_lora_v6: 56%|#####5 | 3347/6000 [08:30<1:05:02, 1.47s/it, lr: 1.0e-04 loss: 5.964e-01] my_first_lora_v6: 56%|#####5 | 3348/6000 [08:31<1:04:55, 1.47s/it, lr: 1.0e-04 loss: 4.089e-01] my_first_lora_v6: 56%|#####5 | 3348/6000 [08:31<1:04:55, 1.47s/it, lr: 1.0e-04 loss: 4.089e-01] my_first_lora_v6: 56%|#####5 | 3349/6000 [08:33<1:05:01, 1.47s/it, lr: 1.0e-04 loss: 4.278e-01] my_first_lora_v6: 56%|#####5 | 3349/6000 [08:33<1:05:01, 1.47s/it, lr: 1.0e-04 loss: 4.278e-01] my_first_lora_v6: 56%|#####5 | 3350/6000 [08:35<1:04:59, 1.47s/it, lr: 1.0e-04 loss: 8.049e-02] my_first_lora_v6: 56%|#####5 | 3350/6000 [08:35<1:04:59, 1.47s/it, lr: 1.0e-04 loss: 8.049e-02] my_first_lora_v6: 56%|#####5 | 3351/6000 [08:35<1:04:54, 1.47s/it, lr: 1.0e-04 loss: 5.613e-01] my_first_lora_v6: 56%|#####5 | 3351/6000 [08:35<1:04:54, 1.47s/it, lr: 1.0e-04 loss: 5.613e-01] my_first_lora_v6: 56%|#####5 | 3352/6000 [08:37<1:04:51, 1.47s/it, lr: 1.0e-04 loss: 3.877e-01] my_first_lora_v6: 56%|#####5 | 3352/6000 [08:37<1:04:51, 1.47s/it, lr: 1.0e-04 loss: 3.877e-01] my_first_lora_v6: 56%|#####5 | 3353/6000 [08:38<1:04:49, 1.47s/it, lr: 1.0e-04 loss: 6.690e-01] my_first_lora_v6: 56%|#####5 | 3353/6000 [08:38<1:04:49, 1.47s/it, lr: 1.0e-04 loss: 6.690e-01] my_first_lora_v6: 56%|#####5 | 3354/6000 [08:39<1:04:45, 1.47s/it, lr: 1.0e-04 loss: 2.214e-01] my_first_lora_v6: 56%|#####5 | 3354/6000 [08:39<1:04:45, 1.47s/it, lr: 1.0e-04 loss: 2.214e-01] my_first_lora_v6: 56%|#####5 | 3355/6000 [08:41<1:04:43, 1.47s/it, lr: 1.0e-04 loss: 5.005e-01] my_first_lora_v6: 56%|#####5 | 3355/6000 [08:41<1:04:43, 1.47s/it, lr: 1.0e-04 loss: 5.005e-01] my_first_lora_v6: 56%|#####5 | 3356/6000 [08:41<1:04:36, 1.47s/it, lr: 1.0e-04 loss: 7.220e-01] my_first_lora_v6: 56%|#####5 | 3356/6000 [08:41<1:04:36, 1.47s/it, lr: 1.0e-04 loss: 7.220e-01] my_first_lora_v6: 56%|#####5 | 3357/6000 [08:44<1:04:40, 1.47s/it, lr: 1.0e-04 loss: 3.373e-01] my_first_lora_v6: 56%|#####5 | 3357/6000 [08:44<1:04:40, 1.47s/it, lr: 1.0e-04 loss: 3.373e-01] my_first_lora_v6: 56%|#####5 | 3358/6000 [08:46<1:04:46, 1.47s/it, lr: 1.0e-04 loss: 1.554e-01] my_first_lora_v6: 56%|#####5 | 3358/6000 [08:46<1:04:46, 1.47s/it, lr: 1.0e-04 loss: 1.554e-01] my_first_lora_v6: 56%|#####5 | 3359/6000 [08:48<1:04:46, 1.47s/it, lr: 1.0e-04 loss: 7.491e-01] my_first_lora_v6: 56%|#####5 | 3359/6000 [08:48<1:04:46, 1.47s/it, lr: 1.0e-04 loss: 7.491e-01] my_first_lora_v6: 56%|#####6 | 3360/6000 [08:50<1:04:51, 1.47s/it, lr: 1.0e-04 loss: 7.236e-01] my_first_lora_v6: 56%|#####6 | 3360/6000 [08:50<1:04:51, 1.47s/it, lr: 1.0e-04 loss: 7.236e-01] my_first_lora_v6: 56%|#####6 | 3361/6000 [08:51<1:04:44, 1.47s/it, lr: 1.0e-04 loss: 2.419e-01] my_first_lora_v6: 56%|#####6 | 3361/6000 [08:51<1:04:44, 1.47s/it, lr: 1.0e-04 loss: 2.419e-01] my_first_lora_v6: 56%|#####6 | 3362/6000 [08:53<1:04:48, 1.47s/it, lr: 1.0e-04 loss: 7.536e-01] my_first_lora_v6: 56%|#####6 | 3362/6000 [08:53<1:04:48, 1.47s/it, lr: 1.0e-04 loss: 7.536e-01] my_first_lora_v6: 56%|#####6 | 3363/6000 [08:55<1:04:46, 1.47s/it, lr: 1.0e-04 loss: 6.536e-01] my_first_lora_v6: 56%|#####6 | 3363/6000 [08:55<1:04:46, 1.47s/it, lr: 1.0e-04 loss: 6.536e-01] my_first_lora_v6: 56%|#####6 | 3364/6000 [08:56<1:04:44, 1.47s/it, lr: 1.0e-04 loss: 3.535e-01] my_first_lora_v6: 56%|#####6 | 3364/6000 [08:56<1:04:44, 1.47s/it, lr: 1.0e-04 loss: 3.535e-01] my_first_lora_v6: 56%|#####6 | 3365/6000 [08:59<1:04:51, 1.48s/it, lr: 1.0e-04 loss: 3.082e-01] my_first_lora_v6: 56%|#####6 | 3365/6000 [08:59<1:04:51, 1.48s/it, lr: 1.0e-04 loss: 3.082e-01] my_first_lora_v6: 56%|#####6 | 3366/6000 [09:01<1:04:56, 1.48s/it, lr: 1.0e-04 loss: 3.326e-01] my_first_lora_v6: 56%|#####6 | 3366/6000 [09:01<1:04:56, 1.48s/it, lr: 1.0e-04 loss: 3.326e-01] my_first_lora_v6: 56%|#####6 | 3367/6000 [09:03<1:05:01, 1.48s/it, lr: 1.0e-04 loss: 5.585e-01] my_first_lora_v6: 56%|#####6 | 3367/6000 [09:03<1:05:01, 1.48s/it, lr: 1.0e-04 loss: 5.585e-01] my_first_lora_v6: 56%|#####6 | 3368/6000 [09:05<1:04:59, 1.48s/it, lr: 1.0e-04 loss: 4.320e-01] my_first_lora_v6: 56%|#####6 | 3368/6000 [09:05<1:04:59, 1.48s/it, lr: 1.0e-04 loss: 4.320e-01] my_first_lora_v6: 56%|#####6 | 3369/6000 [09:06<1:04:57, 1.48s/it, lr: 1.0e-04 loss: 2.923e-01] my_first_lora_v6: 56%|#####6 | 3369/6000 [09:06<1:04:57, 1.48s/it, lr: 1.0e-04 loss: 2.923e-01] my_first_lora_v6: 56%|#####6 | 3370/6000 [09:07<1:04:50, 1.48s/it, lr: 1.0e-04 loss: 1.648e-01] my_first_lora_v6: 56%|#####6 | 3370/6000 [09:07<1:04:50, 1.48s/it, lr: 1.0e-04 loss: 1.648e-01] my_first_lora_v6: 56%|#####6 | 3371/6000 [09:07<1:04:42, 1.48s/it, lr: 1.0e-04 loss: 2.392e-01] my_first_lora_v6: 56%|#####6 | 3371/6000 [09:07<1:04:42, 1.48s/it, lr: 1.0e-04 loss: 2.392e-01] my_first_lora_v6: 56%|#####6 | 3372/6000 [09:10<1:04:48, 1.48s/it, lr: 1.0e-04 loss: 3.590e-01] my_first_lora_v6: 56%|#####6 | 3372/6000 [09:10<1:04:48, 1.48s/it, lr: 1.0e-04 loss: 3.590e-01] my_first_lora_v6: 56%|#####6 | 3373/6000 [09:11<1:04:44, 1.48s/it, lr: 1.0e-04 loss: 6.154e-01] my_first_lora_v6: 56%|#####6 | 3373/6000 [09:11<1:04:44, 1.48s/it, lr: 1.0e-04 loss: 6.154e-01] my_first_lora_v6: 56%|#####6 | 3374/6000 [09:12<1:04:42, 1.48s/it, lr: 1.0e-04 loss: 6.716e-01] my_first_lora_v6: 56%|#####6 | 3374/6000 [09:12<1:04:42, 1.48s/it, lr: 1.0e-04 loss: 6.716e-01] my_first_lora_v6: 56%|#####6 | 3375/6000 [09:13<1:04:35, 1.48s/it, lr: 1.0e-04 loss: 4.798e-01] my_first_lora_v6: 56%|#####6 | 3375/6000 [09:13<1:04:35, 1.48s/it, lr: 1.0e-04 loss: 4.798e-01] my_first_lora_v6: 56%|#####6 | 3376/6000 [09:14<1:04:33, 1.48s/it, lr: 1.0e-04 loss: 3.241e-01] my_first_lora_v6: 56%|#####6 | 3376/6000 [09:14<1:04:33, 1.48s/it, lr: 1.0e-04 loss: 3.241e-01] my_first_lora_v6: 56%|#####6 | 3377/6000 [09:17<1:04:40, 1.48s/it, lr: 1.0e-04 loss: 5.830e-01] my_first_lora_v6: 56%|#####6 | 3377/6000 [09:17<1:04:40, 1.48s/it, lr: 1.0e-04 loss: 5.830e-01] my_first_lora_v6: 56%|#####6 | 3378/6000 [09:18<1:04:36, 1.48s/it, lr: 1.0e-04 loss: 1.949e-01] my_first_lora_v6: 56%|#####6 | 3378/6000 [09:18<1:04:36, 1.48s/it, lr: 1.0e-04 loss: 1.949e-01] my_first_lora_v6: 56%|#####6 | 3379/6000 [09:19<1:04:31, 1.48s/it, lr: 1.0e-04 loss: 3.910e-02] my_first_lora_v6: 56%|#####6 | 3379/6000 [09:19<1:04:31, 1.48s/it, lr: 1.0e-04 loss: 3.910e-02] my_first_lora_v6: 56%|#####6 | 3380/6000 [09:20<1:04:24, 1.48s/it, lr: 1.0e-04 loss: 3.540e-01] my_first_lora_v6: 56%|#####6 | 3380/6000 [09:20<1:04:24, 1.48s/it, lr: 1.0e-04 loss: 3.540e-01] my_first_lora_v6: 56%|#####6 | 3381/6000 [09:21<1:04:17, 1.47s/it, lr: 1.0e-04 loss: 7.152e-01] my_first_lora_v6: 56%|#####6 | 3381/6000 [09:21<1:04:17, 1.47s/it, lr: 1.0e-04 loss: 7.152e-01] my_first_lora_v6: 56%|#####6 | 3382/6000 [09:21<1:04:10, 1.47s/it, lr: 1.0e-04 loss: 5.783e-01] my_first_lora_v6: 56%|#####6 | 3382/6000 [09:21<1:04:10, 1.47s/it, lr: 1.0e-04 loss: 5.783e-01] my_first_lora_v6: 56%|#####6 | 3383/6000 [09:24<1:04:17, 1.47s/it, lr: 1.0e-04 loss: 7.240e-01] my_first_lora_v6: 56%|#####6 | 3383/6000 [09:24<1:04:17, 1.47s/it, lr: 1.0e-04 loss: 7.240e-01] my_first_lora_v6: 56%|#####6 | 3384/6000 [09:25<1:04:15, 1.47s/it, lr: 1.0e-04 loss: 3.795e-02] my_first_lora_v6: 56%|#####6 | 3384/6000 [09:25<1:04:15, 1.47s/it, lr: 1.0e-04 loss: 3.795e-02] my_first_lora_v6: 56%|#####6 | 3385/6000 [09:26<1:04:08, 1.47s/it, lr: 1.0e-04 loss: 3.965e-02] my_first_lora_v6: 56%|#####6 | 3385/6000 [09:26<1:04:08, 1.47s/it, lr: 1.0e-04 loss: 3.965e-02] my_first_lora_v6: 56%|#####6 | 3386/6000 [09:28<1:04:06, 1.47s/it, lr: 1.0e-04 loss: 2.293e-01] my_first_lora_v6: 56%|#####6 | 3386/6000 [09:28<1:04:06, 1.47s/it, lr: 1.0e-04 loss: 2.293e-01] my_first_lora_v6: 56%|#####6 | 3387/6000 [09:29<1:04:03, 1.47s/it, lr: 1.0e-04 loss: 5.984e-01] my_first_lora_v6: 56%|#####6 | 3387/6000 [09:29<1:04:03, 1.47s/it, lr: 1.0e-04 loss: 5.984e-01] my_first_lora_v6: 56%|#####6 | 3388/6000 [09:29<1:03:56, 1.47s/it, lr: 1.0e-04 loss: 3.144e-01] my_first_lora_v6: 56%|#####6 | 3388/6000 [09:29<1:03:56, 1.47s/it, lr: 1.0e-04 loss: 3.144e-01] my_first_lora_v6: 56%|#####6 | 3389/6000 [09:30<1:03:49, 1.47s/it, lr: 1.0e-04 loss: 6.880e-01] my_first_lora_v6: 56%|#####6 | 3389/6000 [09:30<1:03:49, 1.47s/it, lr: 1.0e-04 loss: 6.880e-01] my_first_lora_v6: 56%|#####6 | 3390/6000 [09:31<1:03:47, 1.47s/it, lr: 1.0e-04 loss: 8.440e-02] my_first_lora_v6: 56%|#####6 | 3390/6000 [09:31<1:03:47, 1.47s/it, lr: 1.0e-04 loss: 8.440e-02] my_first_lora_v6: 57%|#####6 | 3391/6000 [09:33<1:03:45, 1.47s/it, lr: 1.0e-04 loss: 6.328e-01] my_first_lora_v6: 57%|#####6 | 3391/6000 [09:33<1:03:45, 1.47s/it, lr: 1.0e-04 loss: 6.328e-01] my_first_lora_v6: 57%|#####6 | 3392/6000 [09:34<1:03:43, 1.47s/it, lr: 1.0e-04 loss: 5.303e-01] my_first_lora_v6: 57%|#####6 | 3392/6000 [09:34<1:03:43, 1.47s/it, lr: 1.0e-04 loss: 5.303e-01] my_first_lora_v6: 57%|#####6 | 3393/6000 [09:36<1:03:42, 1.47s/it, lr: 1.0e-04 loss: 3.699e-01] my_first_lora_v6: 57%|#####6 | 3393/6000 [09:36<1:03:42, 1.47s/it, lr: 1.0e-04 loss: 3.699e-01] my_first_lora_v6: 57%|#####6 | 3394/6000 [09:36<1:03:35, 1.46s/it, lr: 1.0e-04 loss: 6.046e-01] my_first_lora_v6: 57%|#####6 | 3394/6000 [09:36<1:03:35, 1.46s/it, lr: 1.0e-04 loss: 6.046e-01] my_first_lora_v6: 57%|#####6 | 3395/6000 [09:39<1:03:41, 1.47s/it, lr: 1.0e-04 loss: 5.240e-01] my_first_lora_v6: 57%|#####6 | 3395/6000 [09:39<1:03:41, 1.47s/it, lr: 1.0e-04 loss: 5.240e-01] my_first_lora_v6: 57%|#####6 | 3396/6000 [09:40<1:03:34, 1.46s/it, lr: 1.0e-04 loss: 7.741e-01] my_first_lora_v6: 57%|#####6 | 3396/6000 [09:40<1:03:34, 1.46s/it, lr: 1.0e-04 loss: 7.741e-01] my_first_lora_v6: 57%|#####6 | 3397/6000 [09:41<1:03:32, 1.46s/it, lr: 1.0e-04 loss: 7.068e-02] my_first_lora_v6: 57%|#####6 | 3397/6000 [09:41<1:03:32, 1.46s/it, lr: 1.0e-04 loss: 7.068e-02] my_first_lora_v6: 57%|#####6 | 3398/6000 [09:43<1:03:37, 1.47s/it, lr: 1.0e-04 loss: 3.492e-01] my_first_lora_v6: 57%|#####6 | 3398/6000 [09:43<1:03:37, 1.47s/it, lr: 1.0e-04 loss: 3.492e-01] my_first_lora_v6: 57%|#####6 | 3399/6000 [09:46<1:03:44, 1.47s/it, lr: 1.0e-04 loss: 4.706e-02] my_first_lora_v6: 57%|#####6 | 3399/6000 [09:46<1:03:44, 1.47s/it, lr: 1.0e-04 loss: 4.706e-02] my_first_lora_v6: 57%|#####6 | 3400/6000 [09:47<1:03:37, 1.47s/it, lr: 1.0e-04 loss: 3.447e-01] my_first_lora_v6: 57%|#####6 | 3400/6000 [09:47<1:03:37, 1.47s/it, lr: 1.0e-04 loss: 3.447e-01] my_first_lora_v6: 57%|#####6 | 3401/6000 [09:49<1:03:41, 1.47s/it, lr: 1.0e-04 loss: 3.653e-01] my_first_lora_v6: 57%|#####6 | 3401/6000 [09:49<1:03:41, 1.47s/it, lr: 1.0e-04 loss: 3.653e-01] my_first_lora_v6: 57%|#####6 | 3402/6000 [09:51<1:03:44, 1.47s/it, lr: 1.0e-04 loss: 3.128e-01] my_first_lora_v6: 57%|#####6 | 3402/6000 [09:51<1:03:44, 1.47s/it, lr: 1.0e-04 loss: 3.128e-01] my_first_lora_v6: 57%|#####6 | 3403/6000 [09:54<1:03:49, 1.47s/it, lr: 1.0e-04 loss: 3.824e-01] my_first_lora_v6: 57%|#####6 | 3403/6000 [09:54<1:03:49, 1.47s/it, lr: 1.0e-04 loss: 3.824e-01] my_first_lora_v6: 57%|#####6 | 3404/6000 [09:55<1:03:43, 1.47s/it, lr: 1.0e-04 loss: 5.301e-01] my_first_lora_v6: 57%|#####6 | 3404/6000 [09:55<1:03:43, 1.47s/it, lr: 1.0e-04 loss: 5.301e-01] my_first_lora_v6: 57%|#####6 | 3405/6000 [09:55<1:03:36, 1.47s/it, lr: 1.0e-04 loss: 4.774e-01] my_first_lora_v6: 57%|#####6 | 3405/6000 [09:55<1:03:36, 1.47s/it, lr: 1.0e-04 loss: 4.774e-01] my_first_lora_v6: 57%|#####6 | 3406/6000 [09:57<1:03:34, 1.47s/it, lr: 1.0e-04 loss: 7.809e-01] my_first_lora_v6: 57%|#####6 | 3406/6000 [09:57<1:03:34, 1.47s/it, lr: 1.0e-04 loss: 7.809e-01] my_first_lora_v6: 57%|#####6 | 3407/6000 [09:58<1:03:33, 1.47s/it, lr: 1.0e-04 loss: 7.664e-02] my_first_lora_v6: 57%|#####6 | 3407/6000 [09:58<1:03:33, 1.47s/it, lr: 1.0e-04 loss: 7.664e-02] my_first_lora_v6: 57%|#####6 | 3408/6000 [10:01<1:03:40, 1.47s/it, lr: 1.0e-04 loss: 4.126e-01] my_first_lora_v6: 57%|#####6 | 3408/6000 [10:01<1:03:40, 1.47s/it, lr: 1.0e-04 loss: 4.126e-01] my_first_lora_v6: 57%|#####6 | 3409/6000 [10:02<1:03:33, 1.47s/it, lr: 1.0e-04 loss: 6.188e-01] my_first_lora_v6: 57%|#####6 | 3409/6000 [10:02<1:03:33, 1.47s/it, lr: 1.0e-04 loss: 6.188e-01] my_first_lora_v6: 57%|#####6 | 3410/6000 [10:02<1:03:27, 1.47s/it, lr: 1.0e-04 loss: 1.671e-01] my_first_lora_v6: 57%|#####6 | 3410/6000 [10:02<1:03:27, 1.47s/it, lr: 1.0e-04 loss: 1.671e-01] my_first_lora_v6: 57%|#####6 | 3411/6000 [10:04<1:03:25, 1.47s/it, lr: 1.0e-04 loss: 2.566e-01] my_first_lora_v6: 57%|#####6 | 3411/6000 [10:04<1:03:25, 1.47s/it, lr: 1.0e-04 loss: 2.566e-01] my_first_lora_v6: 57%|#####6 | 3412/6000 [10:04<1:03:19, 1.47s/it, lr: 1.0e-04 loss: 7.495e-01] my_first_lora_v6: 57%|#####6 | 3412/6000 [10:04<1:03:19, 1.47s/it, lr: 1.0e-04 loss: 7.495e-01] my_first_lora_v6: 57%|#####6 | 3413/6000 [10:05<1:03:12, 1.47s/it, lr: 1.0e-04 loss: 1.969e-01] my_first_lora_v6: 57%|#####6 | 3413/6000 [10:05<1:03:12, 1.47s/it, lr: 1.0e-04 loss: 1.969e-01] my_first_lora_v6: 57%|#####6 | 3414/6000 [10:08<1:03:17, 1.47s/it, lr: 1.0e-04 loss: 2.025e-01] my_first_lora_v6: 57%|#####6 | 3414/6000 [10:08<1:03:17, 1.47s/it, lr: 1.0e-04 loss: 2.025e-01] my_first_lora_v6: 57%|#####6 | 3415/6000 [10:08<1:03:11, 1.47s/it, lr: 1.0e-04 loss: 1.425e-01] my_first_lora_v6: 57%|#####6 | 3415/6000 [10:08<1:03:11, 1.47s/it, lr: 1.0e-04 loss: 1.425e-01] my_first_lora_v6: 57%|#####6 | 3416/6000 [10:10<1:03:09, 1.47s/it, lr: 1.0e-04 loss: 4.117e-01] my_first_lora_v6: 57%|#####6 | 3416/6000 [10:10<1:03:09, 1.47s/it, lr: 1.0e-04 loss: 4.117e-01] my_first_lora_v6: 57%|#####6 | 3417/6000 [10:11<1:03:07, 1.47s/it, lr: 1.0e-04 loss: 5.443e-01] my_first_lora_v6: 57%|#####6 | 3417/6000 [10:11<1:03:07, 1.47s/it, lr: 1.0e-04 loss: 5.443e-01] my_first_lora_v6: 57%|#####6 | 3418/6000 [10:12<1:03:01, 1.46s/it, lr: 1.0e-04 loss: 6.270e-01] my_first_lora_v6: 57%|#####6 | 3418/6000 [10:12<1:03:01, 1.46s/it, lr: 1.0e-04 loss: 6.270e-01] my_first_lora_v6: 57%|#####6 | 3419/6000 [10:13<1:02:59, 1.46s/it, lr: 1.0e-04 loss: 5.678e-01] my_first_lora_v6: 57%|#####6 | 3419/6000 [10:13<1:02:59, 1.46s/it, lr: 1.0e-04 loss: 5.678e-01] my_first_lora_v6: 57%|#####6 | 3420/6000 [10:14<1:02:57, 1.46s/it, lr: 1.0e-04 loss: 7.900e-01] my_first_lora_v6: 57%|#####6 | 3420/6000 [10:14<1:02:57, 1.46s/it, lr: 1.0e-04 loss: 7.900e-01] my_first_lora_v6: 57%|#####7 | 3421/6000 [10:17<1:03:03, 1.47s/it, lr: 1.0e-04 loss: 5.254e-01] my_first_lora_v6: 57%|#####7 | 3421/6000 [10:17<1:03:03, 1.47s/it, lr: 1.0e-04 loss: 5.254e-01] my_first_lora_v6: 57%|#####7 | 3422/6000 [10:20<1:03:07, 1.47s/it, lr: 1.0e-04 loss: 6.415e-01] my_first_lora_v6: 57%|#####7 | 3422/6000 [10:20<1:03:07, 1.47s/it, lr: 1.0e-04 loss: 6.415e-01] my_first_lora_v6: 57%|#####7 | 3423/6000 [10:21<1:03:04, 1.47s/it, lr: 1.0e-04 loss: 1.389e-01] my_first_lora_v6: 57%|#####7 | 3423/6000 [10:21<1:03:04, 1.47s/it, lr: 1.0e-04 loss: 1.389e-01] my_first_lora_v6: 57%|#####7 | 3424/6000 [10:21<1:02:58, 1.47s/it, lr: 1.0e-04 loss: 7.777e-02] my_first_lora_v6: 57%|#####7 | 3424/6000 [10:21<1:02:58, 1.47s/it, lr: 1.0e-04 loss: 7.777e-02] my_first_lora_v6: 57%|#####7 | 3425/6000 [10:23<1:02:56, 1.47s/it, lr: 1.0e-04 loss: 6.126e-01] my_first_lora_v6: 57%|#####7 | 3425/6000 [10:23<1:02:56, 1.47s/it, lr: 1.0e-04 loss: 6.126e-01] my_first_lora_v6: 57%|#####7 | 3426/6000 [10:25<1:03:01, 1.47s/it, lr: 1.0e-04 loss: 2.621e-01] my_first_lora_v6: 57%|#####7 | 3426/6000 [10:25<1:03:01, 1.47s/it, lr: 1.0e-04 loss: 2.621e-01] my_first_lora_v6: 57%|#####7 | 3427/6000 [10:26<1:02:57, 1.47s/it, lr: 1.0e-04 loss: 7.197e-01] my_first_lora_v6: 57%|#####7 | 3427/6000 [10:26<1:02:57, 1.47s/it, lr: 1.0e-04 loss: 7.197e-01] my_first_lora_v6: 57%|#####7 | 3428/6000 [10:27<1:02:51, 1.47s/it, lr: 1.0e-04 loss: 4.120e-01] my_first_lora_v6: 57%|#####7 | 3428/6000 [10:27<1:02:51, 1.47s/it, lr: 1.0e-04 loss: 4.120e-01] my_first_lora_v6: 57%|#####7 | 3429/6000 [10:30<1:02:56, 1.47s/it, lr: 1.0e-04 loss: 2.170e-01] my_first_lora_v6: 57%|#####7 | 3429/6000 [10:30<1:02:56, 1.47s/it, lr: 1.0e-04 loss: 2.170e-01] my_first_lora_v6: 57%|#####7 | 3430/6000 [10:32<1:02:59, 1.47s/it, lr: 1.0e-04 loss: 6.600e-01] my_first_lora_v6: 57%|#####7 | 3430/6000 [10:32<1:02:59, 1.47s/it, lr: 1.0e-04 loss: 6.600e-01] my_first_lora_v6: 57%|#####7 | 3431/6000 [10:33<1:02:55, 1.47s/it, lr: 1.0e-04 loss: 1.065e-01] my_first_lora_v6: 57%|#####7 | 3431/6000 [10:33<1:02:55, 1.47s/it, lr: 1.0e-04 loss: 1.065e-01] my_first_lora_v6: 57%|#####7 | 3432/6000 [10:34<1:02:53, 1.47s/it, lr: 1.0e-04 loss: 5.411e-01] my_first_lora_v6: 57%|#####7 | 3432/6000 [10:34<1:02:53, 1.47s/it, lr: 1.0e-04 loss: 5.411e-01] my_first_lora_v6: 57%|#####7 | 3433/6000 [10:35<1:02:46, 1.47s/it, lr: 1.0e-04 loss: 5.806e-01] my_first_lora_v6: 57%|#####7 | 3433/6000 [10:35<1:02:46, 1.47s/it, lr: 1.0e-04 loss: 5.806e-01] my_first_lora_v6: 57%|#####7 | 3434/6000 [10:36<1:02:43, 1.47s/it, lr: 1.0e-04 loss: 7.291e-01] my_first_lora_v6: 57%|#####7 | 3434/6000 [10:36<1:02:43, 1.47s/it, lr: 1.0e-04 loss: 7.291e-01] my_first_lora_v6: 57%|#####7 | 3435/6000 [10:37<1:02:37, 1.46s/it, lr: 1.0e-04 loss: 3.710e-01] my_first_lora_v6: 57%|#####7 | 3435/6000 [10:37<1:02:37, 1.46s/it, lr: 1.0e-04 loss: 3.710e-01] my_first_lora_v6: 57%|#####7 | 3436/6000 [10:39<1:02:42, 1.47s/it, lr: 1.0e-04 loss: 6.059e-02] my_first_lora_v6: 57%|#####7 | 3436/6000 [10:39<1:02:42, 1.47s/it, lr: 1.0e-04 loss: 6.059e-02] my_first_lora_v6: 57%|#####7 | 3437/6000 [10:41<1:02:42, 1.47s/it, lr: 1.0e-04 loss: 7.390e-01] my_first_lora_v6: 57%|#####7 | 3437/6000 [10:41<1:02:42, 1.47s/it, lr: 1.0e-04 loss: 7.390e-01] my_first_lora_v6: 57%|#####7 | 3438/6000 [10:42<1:02:39, 1.47s/it, lr: 1.0e-04 loss: 2.069e-02] my_first_lora_v6: 57%|#####7 | 3438/6000 [10:42<1:02:39, 1.47s/it, lr: 1.0e-04 loss: 2.069e-02] my_first_lora_v6: 57%|#####7 | 3439/6000 [10:44<1:02:37, 1.47s/it, lr: 1.0e-04 loss: 7.776e-01] my_first_lora_v6: 57%|#####7 | 3439/6000 [10:44<1:02:37, 1.47s/it, lr: 1.0e-04 loss: 7.776e-01] my_first_lora_v6: 57%|#####7 | 3440/6000 [10:45<1:02:35, 1.47s/it, lr: 1.0e-04 loss: 7.199e-01] my_first_lora_v6: 57%|#####7 | 3440/6000 [10:45<1:02:35, 1.47s/it, lr: 1.0e-04 loss: 7.199e-01] my_first_lora_v6: 57%|#####7 | 3441/6000 [10:48<1:02:41, 1.47s/it, lr: 1.0e-04 loss: 1.680e-01] my_first_lora_v6: 57%|#####7 | 3441/6000 [10:48<1:02:41, 1.47s/it, lr: 1.0e-04 loss: 1.680e-01] my_first_lora_v6: 57%|#####7 | 3442/6000 [10:48<1:02:35, 1.47s/it, lr: 1.0e-04 loss: 3.061e-01] my_first_lora_v6: 57%|#####7 | 3442/6000 [10:48<1:02:35, 1.47s/it, lr: 1.0e-04 loss: 3.061e-01] my_first_lora_v6: 57%|#####7 | 3443/6000 [10:51<1:02:40, 1.47s/it, lr: 1.0e-04 loss: 7.486e-01] my_first_lora_v6: 57%|#####7 | 3443/6000 [10:51<1:02:40, 1.47s/it, lr: 1.0e-04 loss: 7.486e-01] my_first_lora_v6: 57%|#####7 | 3444/6000 [10:52<1:02:34, 1.47s/it, lr: 1.0e-04 loss: 7.400e-01] my_first_lora_v6: 57%|#####7 | 3444/6000 [10:52<1:02:34, 1.47s/it, lr: 1.0e-04 loss: 7.400e-01] my_first_lora_v6: 57%|#####7 | 3445/6000 [10:53<1:02:31, 1.47s/it, lr: 1.0e-04 loss: 5.853e-01] my_first_lora_v6: 57%|#####7 | 3445/6000 [10:53<1:02:31, 1.47s/it, lr: 1.0e-04 loss: 5.853e-01] my_first_lora_v6: 57%|#####7 | 3446/6000 [10:53<1:02:25, 1.47s/it, lr: 1.0e-04 loss: 7.730e-01] my_first_lora_v6: 57%|#####7 | 3446/6000 [10:53<1:02:25, 1.47s/it, lr: 1.0e-04 loss: 7.730e-01] my_first_lora_v6: 57%|#####7 | 3447/6000 [10:56<1:02:29, 1.47s/it, lr: 1.0e-04 loss: 4.749e-02] my_first_lora_v6: 57%|#####7 | 3447/6000 [10:56<1:02:29, 1.47s/it, lr: 1.0e-04 loss: 4.749e-02] my_first_lora_v6: 57%|#####7 | 3448/6000 [10:58<1:02:32, 1.47s/it, lr: 1.0e-04 loss: 7.881e-01] my_first_lora_v6: 57%|#####7 | 3448/6000 [10:58<1:02:32, 1.47s/it, lr: 1.0e-04 loss: 7.881e-01] my_first_lora_v6: 57%|#####7 | 3449/6000 [11:00<1:02:35, 1.47s/it, lr: 1.0e-04 loss: 8.661e-02] my_first_lora_v6: 57%|#####7 | 3449/6000 [11:00<1:02:35, 1.47s/it, lr: 1.0e-04 loss: 8.661e-02] my_first_lora_v6: 57%|#####7 | 3450/6000 [11:02<1:02:33, 1.47s/it, lr: 1.0e-04 loss: 7.345e-01] my_first_lora_v6: 57%|#####7 | 3450/6000 [11:02<1:02:33, 1.47s/it, lr: 1.0e-04 loss: 7.345e-01] my_first_lora_v6: 58%|#####7 | 3451/6000 [11:03<1:02:29, 1.47s/it, lr: 1.0e-04 loss: 6.763e-01] my_first_lora_v6: 58%|#####7 | 3451/6000 [11:03<1:02:29, 1.47s/it, lr: 1.0e-04 loss: 6.763e-01] my_first_lora_v6: 58%|#####7 | 3452/6000 [11:05<1:02:33, 1.47s/it, lr: 1.0e-04 loss: 2.170e-01] my_first_lora_v6: 58%|#####7 | 3452/6000 [11:05<1:02:33, 1.47s/it, lr: 1.0e-04 loss: 2.170e-01] my_first_lora_v6: 58%|#####7 | 3453/6000 [11:07<1:02:31, 1.47s/it, lr: 1.0e-04 loss: 1.515e-01] my_first_lora_v6: 58%|#####7 | 3453/6000 [11:07<1:02:31, 1.47s/it, lr: 1.0e-04 loss: 1.515e-01] my_first_lora_v6: 58%|#####7 | 3454/6000 [11:07<1:02:25, 1.47s/it, lr: 1.0e-04 loss: 3.796e-01] my_first_lora_v6: 58%|#####7 | 3454/6000 [11:07<1:02:25, 1.47s/it, lr: 1.0e-04 loss: 3.796e-01] my_first_lora_v6: 58%|#####7 | 3455/6000 [11:10<1:02:30, 1.47s/it, lr: 1.0e-04 loss: 7.539e-01] my_first_lora_v6: 58%|#####7 | 3455/6000 [11:10<1:02:30, 1.47s/it, lr: 1.0e-04 loss: 7.539e-01] my_first_lora_v6: 58%|#####7 | 3456/6000 [11:11<1:02:28, 1.47s/it, lr: 1.0e-04 loss: 1.298e-01] my_first_lora_v6: 58%|#####7 | 3456/6000 [11:11<1:02:28, 1.47s/it, lr: 1.0e-04 loss: 1.298e-01] my_first_lora_v6: 58%|#####7 | 3457/6000 [11:12<1:02:22, 1.47s/it, lr: 1.0e-04 loss: 1.979e-01] my_first_lora_v6: 58%|#####7 | 3457/6000 [11:12<1:02:22, 1.47s/it, lr: 1.0e-04 loss: 1.979e-01] my_first_lora_v6: 58%|#####7 | 3458/6000 [11:13<1:02:20, 1.47s/it, lr: 1.0e-04 loss: 7.304e-01] my_first_lora_v6: 58%|#####7 | 3458/6000 [11:13<1:02:20, 1.47s/it, lr: 1.0e-04 loss: 7.304e-01] my_first_lora_v6: 58%|#####7 | 3459/6000 [11:15<1:02:18, 1.47s/it, lr: 1.0e-04 loss: 6.414e-01] my_first_lora_v6: 58%|#####7 | 3459/6000 [11:15<1:02:18, 1.47s/it, lr: 1.0e-04 loss: 6.414e-01] my_first_lora_v6: 58%|#####7 | 3460/6000 [11:15<1:02:12, 1.47s/it, lr: 1.0e-04 loss: 2.060e-01] my_first_lora_v6: 58%|#####7 | 3460/6000 [11:15<1:02:12, 1.47s/it, lr: 1.0e-04 loss: 2.060e-01] my_first_lora_v6: 58%|#####7 | 3461/6000 [11:17<1:02:10, 1.47s/it, lr: 1.0e-04 loss: 4.620e-01] my_first_lora_v6: 58%|#####7 | 3461/6000 [11:17<1:02:10, 1.47s/it, lr: 1.0e-04 loss: 4.620e-01] my_first_lora_v6: 58%|#####7 | 3462/6000 [11:19<1:02:14, 1.47s/it, lr: 1.0e-04 loss: 3.649e-01] my_first_lora_v6: 58%|#####7 | 3462/6000 [11:19<1:02:14, 1.47s/it, lr: 1.0e-04 loss: 3.649e-01] my_first_lora_v6: 58%|#####7 | 3463/6000 [11:21<1:02:12, 1.47s/it, lr: 1.0e-04 loss: 1.633e-01] my_first_lora_v6: 58%|#####7 | 3463/6000 [11:21<1:02:12, 1.47s/it, lr: 1.0e-04 loss: 1.633e-01] my_first_lora_v6: 58%|#####7 | 3464/6000 [11:23<1:02:16, 1.47s/it, lr: 1.0e-04 loss: 7.361e-01] my_first_lora_v6: 58%|#####7 | 3464/6000 [11:23<1:02:16, 1.47s/it, lr: 1.0e-04 loss: 7.361e-01] my_first_lora_v6: 58%|#####7 | 3465/6000 [11:26<1:02:20, 1.48s/it, lr: 1.0e-04 loss: 4.412e-01] my_first_lora_v6: 58%|#####7 | 3465/6000 [11:26<1:02:20, 1.48s/it, lr: 1.0e-04 loss: 4.412e-01] my_first_lora_v6: 58%|#####7 | 3466/6000 [11:26<1:02:15, 1.47s/it, lr: 1.0e-04 loss: 7.480e-01] my_first_lora_v6: 58%|#####7 | 3466/6000 [11:26<1:02:15, 1.47s/it, lr: 1.0e-04 loss: 7.480e-01] my_first_lora_v6: 58%|#####7 | 3467/6000 [11:27<1:02:09, 1.47s/it, lr: 1.0e-04 loss: 7.095e-02] my_first_lora_v6: 58%|#####7 | 3467/6000 [11:27<1:02:09, 1.47s/it, lr: 1.0e-04 loss: 7.095e-02] my_first_lora_v6: 58%|#####7 | 3468/6000 [11:29<1:02:12, 1.47s/it, lr: 1.0e-04 loss: 4.971e-01] my_first_lora_v6: 58%|#####7 | 3468/6000 [11:29<1:02:12, 1.47s/it, lr: 1.0e-04 loss: 4.971e-01] my_first_lora_v6: 58%|#####7 | 3469/6000 [11:31<1:02:09, 1.47s/it, lr: 1.0e-04 loss: 2.675e-01] my_first_lora_v6: 58%|#####7 | 3469/6000 [11:31<1:02:09, 1.47s/it, lr: 1.0e-04 loss: 2.675e-01] my_first_lora_v6: 58%|#####7 | 3470/6000 [11:32<1:02:06, 1.47s/it, lr: 1.0e-04 loss: 8.513e-01] my_first_lora_v6: 58%|#####7 | 3470/6000 [11:32<1:02:06, 1.47s/it, lr: 1.0e-04 loss: 8.513e-01] my_first_lora_v6: 58%|#####7 | 3471/6000 [11:34<1:02:11, 1.48s/it, lr: 1.0e-04 loss: 3.844e-01] my_first_lora_v6: 58%|#####7 | 3471/6000 [11:34<1:02:11, 1.48s/it, lr: 1.0e-04 loss: 3.844e-01] my_first_lora_v6: 58%|#####7 | 3472/6000 [11:35<1:02:05, 1.47s/it, lr: 1.0e-04 loss: 7.038e-01] my_first_lora_v6: 58%|#####7 | 3472/6000 [11:35<1:02:05, 1.47s/it, lr: 1.0e-04 loss: 7.038e-01] my_first_lora_v6: 58%|#####7 | 3473/6000 [11:36<1:02:03, 1.47s/it, lr: 1.0e-04 loss: 7.304e-01] my_first_lora_v6: 58%|#####7 | 3473/6000 [11:36<1:02:03, 1.47s/it, lr: 1.0e-04 loss: 7.304e-01] my_first_lora_v6: 58%|#####7 | 3474/6000 [11:37<1:01:57, 1.47s/it, lr: 1.0e-04 loss: 4.134e-01] my_first_lora_v6: 58%|#####7 | 3474/6000 [11:37<1:01:57, 1.47s/it, lr: 1.0e-04 loss: 4.134e-01] my_first_lora_v6: 58%|#####7 | 3475/6000 [11:38<1:01:52, 1.47s/it, lr: 1.0e-04 loss: 1.951e-01] my_first_lora_v6: 58%|#####7 | 3475/6000 [11:38<1:01:52, 1.47s/it, lr: 1.0e-04 loss: 1.951e-01] my_first_lora_v6: 58%|#####7 | 3476/6000 [11:40<1:01:56, 1.47s/it, lr: 1.0e-04 loss: 6.991e-01] my_first_lora_v6: 58%|#####7 | 3476/6000 [11:40<1:01:56, 1.47s/it, lr: 1.0e-04 loss: 6.991e-01] my_first_lora_v6: 58%|#####7 | 3477/6000 [11:42<1:01:54, 1.47s/it, lr: 1.0e-04 loss: 7.287e-01] my_first_lora_v6: 58%|#####7 | 3477/6000 [11:42<1:01:54, 1.47s/it, lr: 1.0e-04 loss: 7.287e-01] my_first_lora_v6: 58%|#####7 | 3478/6000 [11:42<1:01:48, 1.47s/it, lr: 1.0e-04 loss: 8.189e-01] my_first_lora_v6: 58%|#####7 | 3478/6000 [11:42<1:01:48, 1.47s/it, lr: 1.0e-04 loss: 8.189e-01] my_first_lora_v6: 58%|#####7 | 3479/6000 [11:45<1:01:54, 1.47s/it, lr: 1.0e-04 loss: 1.837e-01] my_first_lora_v6: 58%|#####7 | 3479/6000 [11:45<1:01:54, 1.47s/it, lr: 1.0e-04 loss: 1.837e-01] my_first_lora_v6: 58%|#####8 | 3480/6000 [11:47<1:01:54, 1.47s/it, lr: 1.0e-04 loss: 6.140e-01] my_first_lora_v6: 58%|#####8 | 3480/6000 [11:47<1:01:54, 1.47s/it, lr: 1.0e-04 loss: 6.140e-01] my_first_lora_v6: 58%|#####8 | 3481/6000 [11:48<1:01:48, 1.47s/it, lr: 1.0e-04 loss: 6.047e-01] my_first_lora_v6: 58%|#####8 | 3481/6000 [11:48<1:01:48, 1.47s/it, lr: 1.0e-04 loss: 6.047e-01] my_first_lora_v6: 58%|#####8 | 3482/6000 [11:50<1:01:51, 1.47s/it, lr: 1.0e-04 loss: 7.800e-01] my_first_lora_v6: 58%|#####8 | 3482/6000 [11:50<1:01:51, 1.47s/it, lr: 1.0e-04 loss: 7.800e-01] my_first_lora_v6: 58%|#####8 | 3483/6000 [11:51<1:01:45, 1.47s/it, lr: 1.0e-04 loss: 3.083e-02] my_first_lora_v6: 58%|#####8 | 3483/6000 [11:51<1:01:45, 1.47s/it, lr: 1.0e-04 loss: 3.083e-02] my_first_lora_v6: 58%|#####8 | 3484/6000 [11:51<1:01:40, 1.47s/it, lr: 1.0e-04 loss: 7.070e-01] my_first_lora_v6: 58%|#####8 | 3484/6000 [11:51<1:01:40, 1.47s/it, lr: 1.0e-04 loss: 7.070e-01] my_first_lora_v6: 58%|#####8 | 3485/6000 [11:52<1:01:34, 1.47s/it, lr: 1.0e-04 loss: 7.373e-01] my_first_lora_v6: 58%|#####8 | 3485/6000 [11:52<1:01:34, 1.47s/it, lr: 1.0e-04 loss: 7.373e-01] my_first_lora_v6: 58%|#####8 | 3486/6000 [11:53<1:01:32, 1.47s/it, lr: 1.0e-04 loss: 7.773e-01] my_first_lora_v6: 58%|#####8 | 3486/6000 [11:53<1:01:32, 1.47s/it, lr: 1.0e-04 loss: 7.773e-01] my_first_lora_v6: 58%|#####8 | 3487/6000 [11:55<1:01:29, 1.47s/it, lr: 1.0e-04 loss: 2.200e-01] my_first_lora_v6: 58%|#####8 | 3487/6000 [11:55<1:01:29, 1.47s/it, lr: 1.0e-04 loss: 2.200e-01] my_first_lora_v6: 58%|#####8 | 3488/6000 [11:57<1:01:33, 1.47s/it, lr: 1.0e-04 loss: 2.973e-01] my_first_lora_v6: 58%|#####8 | 3488/6000 [11:57<1:01:33, 1.47s/it, lr: 1.0e-04 loss: 2.973e-01] my_first_lora_v6: 58%|#####8 | 3489/6000 [11:58<1:01:31, 1.47s/it, lr: 1.0e-04 loss: 4.745e-01] my_first_lora_v6: 58%|#####8 | 3489/6000 [11:58<1:01:31, 1.47s/it, lr: 1.0e-04 loss: 4.745e-01] my_first_lora_v6: 58%|#####8 | 3490/6000 [11:59<1:01:26, 1.47s/it, lr: 1.0e-04 loss: 2.466e-01] my_first_lora_v6: 58%|#####8 | 3490/6000 [11:59<1:01:26, 1.47s/it, lr: 1.0e-04 loss: 2.466e-01] my_first_lora_v6: 58%|#####8 | 3491/6000 [12:00<1:01:24, 1.47s/it, lr: 1.0e-04 loss: 7.376e-01] my_first_lora_v6: 58%|#####8 | 3491/6000 [12:00<1:01:24, 1.47s/it, lr: 1.0e-04 loss: 7.376e-01] my_first_lora_v6: 58%|#####8 | 3492/6000 [12:01<1:01:18, 1.47s/it, lr: 1.0e-04 loss: 8.902e-02] my_first_lora_v6: 58%|#####8 | 3492/6000 [12:01<1:01:18, 1.47s/it, lr: 1.0e-04 loss: 8.902e-02] my_first_lora_v6: 58%|#####8 | 3493/6000 [12:02<1:01:13, 1.47s/it, lr: 1.0e-04 loss: 3.505e-01] my_first_lora_v6: 58%|#####8 | 3493/6000 [12:02<1:01:13, 1.47s/it, lr: 1.0e-04 loss: 3.505e-01] my_first_lora_v6: 58%|#####8 | 3494/6000 [12:03<1:01:10, 1.46s/it, lr: 1.0e-04 loss: 8.062e-01] my_first_lora_v6: 58%|#####8 | 3494/6000 [12:03<1:01:10, 1.46s/it, lr: 1.0e-04 loss: 8.062e-01] my_first_lora_v6: 58%|#####8 | 3495/6000 [12:06<1:01:15, 1.47s/it, lr: 1.0e-04 loss: 1.369e-01] my_first_lora_v6: 58%|#####8 | 3495/6000 [12:06<1:01:15, 1.47s/it, lr: 1.0e-04 loss: 1.369e-01] my_first_lora_v6: 58%|#####8 | 3496/6000 [12:08<1:01:19, 1.47s/it, lr: 1.0e-04 loss: 3.166e-01] my_first_lora_v6: 58%|#####8 | 3496/6000 [12:08<1:01:19, 1.47s/it, lr: 1.0e-04 loss: 3.166e-01] my_first_lora_v6: 58%|#####8 | 3497/6000 [12:11<1:01:21, 1.47s/it, lr: 1.0e-04 loss: 1.633e-01] my_first_lora_v6: 58%|#####8 | 3497/6000 [12:11<1:01:21, 1.47s/it, lr: 1.0e-04 loss: 1.633e-01] my_first_lora_v6: 58%|#####8 | 3498/6000 [12:13<1:01:25, 1.47s/it, lr: 1.0e-04 loss: 3.157e-01] my_first_lora_v6: 58%|#####8 | 3498/6000 [12:13<1:01:25, 1.47s/it, lr: 1.0e-04 loss: 3.157e-01] my_first_lora_v6: 58%|#####8 | 3499/6000 [12:14<1:01:19, 1.47s/it, lr: 1.0e-04 loss: 2.942e-01] my_first_lora_v6: 58%|#####8 | 3499/6000 [12:14<1:01:19, 1.47s/it, lr: 1.0e-04 loss: 2.942e-01]
Saving at step 3500
Saved checkpoint to /teamspace/studios/this_studio/ai-toolkit/output/my_first_lora_v6/my_first_lora_v6_000003500.safetensors
Saved optimizer to /teamspace/studios/this_studio/ai-toolkit/output/my_first_lora_v6/optimizer.pt
Unloading assistant lora
Generating Images: 0%| | 0/5 [00:00<?, ?it/s] Generating Images: 0%| | 0/5 [00:00<?, ?it/s]
Generating Images: 20%|## | 1/5 [00:08<00:32, 8.00s/it] Generating Images: 20%|## | 1/5 [00:08<00:32, 8.00s/it]
Generating Images: 40%|#### | 2/5 [00:15<00:23, 7.91s/it] Generating Images: 40%|#### | 2/5 [00:15<00:23, 7.91s/it]
Generating Images: 60%|###### | 3/5 [00:23<00:15, 7.87s/it] Generating Images: 60%|###### | 3/5 [00:23<00:15, 7.87s/it]
Generating Images: 80%|######## | 4/5 [00:31<00:07, 7.83s/it] Generating Images: 80%|######## | 4/5 [00:31<00:07, 7.83s/it]
Generating Images: 100%|##########| 5/5 [00:39<00:00, 7.79s/it] Generating Images: 100%|##########| 5/5 [00:39<00:00, 7.79s/it]
Loading assistant lora
my_first_lora_v6: 58%|#####8 | 3500/6000 [12:15<1:01:19, 1.47s/it, lr: 1.0e-04 loss: 7.247e-01] my_first_lora_v6: 58%|#####8 | 3500/6000 [12:15<1:01:19, 1.47s/it, lr: 1.0e-04 loss: 7.247e-01] my_first_lora_v6: 58%|#####8 | 3501/6000 [12:17<1:01:17, 1.47s/it, lr: 1.0e-04 loss: 1.477e-01] my_first_lora_v6: 58%|#####8 | 3501/6000 [12:17<1:01:17, 1.47s/it, lr: 1.0e-04 loss: 1.477e-01] my_first_lora_v6: 58%|#####8 | 3502/6000 [12:18<1:01:15, 1.47s/it, lr: 1.0e-04 loss: 6.666e-01] my_first_lora_v6: 58%|#####8 | 3502/6000 [12:18<1:01:15, 1.47s/it, lr: 1.0e-04 loss: 6.666e-01] my_first_lora_v6: 58%|#####8 | 3503/6000 [12:21<1:01:20, 1.47s/it, lr: 1.0e-04 loss: 5.058e-02] my_first_lora_v6: 58%|#####8 | 3503/6000 [12:21<1:01:20, 1.47s/it, lr: 1.0e-04 loss: 5.058e-02] my_first_lora_v6: 58%|#####8 | 3504/6000 [12:23<1:01:24, 1.48s/it, lr: 1.0e-04 loss: 3.062e-03] my_first_lora_v6: 58%|#####8 | 3504/6000 [12:23<1:01:24, 1.48s/it, lr: 1.0e-04 loss: 3.062e-03] my_first_lora_v6: 58%|#####8 | 3505/6000 [12:25<1:01:22, 1.48s/it, lr: 1.0e-04 loss: 1.916e-01] my_first_lora_v6: 58%|#####8 | 3505/6000 [12:25<1:01:22, 1.48s/it, lr: 1.0e-04 loss: 1.916e-01] my_first_lora_v6: 58%|#####8 | 3506/6000 [12:25<1:01:16, 1.47s/it, lr: 1.0e-04 loss: 1.683e-01] my_first_lora_v6: 58%|#####8 | 3506/6000 [12:25<1:01:16, 1.47s/it, lr: 1.0e-04 loss: 1.683e-01] my_first_lora_v6: 58%|#####8 | 3507/6000 [12:26<1:01:11, 1.47s/it, lr: 1.0e-04 loss: 1.092e-02] my_first_lora_v6: 58%|#####8 | 3507/6000 [12:26<1:01:11, 1.47s/it, lr: 1.0e-04 loss: 1.092e-02] my_first_lora_v6: 58%|#####8 | 3508/6000 [12:28<1:01:09, 1.47s/it, lr: 1.0e-04 loss: 7.350e-01] my_first_lora_v6: 58%|#####8 | 3508/6000 [12:28<1:01:09, 1.47s/it, lr: 1.0e-04 loss: 7.350e-01] my_first_lora_v6: 58%|#####8 | 3509/6000 [12:29<1:01:07, 1.47s/it, lr: 1.0e-04 loss: 7.089e-01] my_first_lora_v6: 58%|#####8 | 3509/6000 [12:29<1:01:07, 1.47s/it, lr: 1.0e-04 loss: 7.089e-01] my_first_lora_v6: 58%|#####8 | 3510/6000 [12:31<1:01:09, 1.47s/it, lr: 1.0e-04 loss: 7.477e-01] my_first_lora_v6: 58%|#####8 | 3510/6000 [12:31<1:01:09, 1.47s/it, lr: 1.0e-04 loss: 7.477e-01] my_first_lora_v6: 59%|#####8 | 3511/6000 [12:32<1:01:07, 1.47s/it, lr: 1.0e-04 loss: 8.135e-01] my_first_lora_v6: 59%|#####8 | 3511/6000 [12:32<1:01:07, 1.47s/it, lr: 1.0e-04 loss: 8.135e-01] my_first_lora_v6: 59%|#####8 | 3512/6000 [12:34<1:01:04, 1.47s/it, lr: 1.0e-04 loss: 5.903e-01] my_first_lora_v6: 59%|#####8 | 3512/6000 [12:34<1:01:04, 1.47s/it, lr: 1.0e-04 loss: 5.903e-01] my_first_lora_v6: 59%|#####8 | 3513/6000 [12:35<1:01:02, 1.47s/it, lr: 1.0e-04 loss: 6.046e-01] my_first_lora_v6: 59%|#####8 | 3513/6000 [12:35<1:01:02, 1.47s/it, lr: 1.0e-04 loss: 6.046e-01] my_first_lora_v6: 59%|#####8 | 3514/6000 [12:36<1:00:59, 1.47s/it, lr: 1.0e-04 loss: 6.892e-01] my_first_lora_v6: 59%|#####8 | 3514/6000 [12:36<1:00:59, 1.47s/it, lr: 1.0e-04 loss: 6.892e-01] my_first_lora_v6: 59%|#####8 | 3515/6000 [12:37<1:00:54, 1.47s/it, lr: 1.0e-04 loss: 5.616e-01] my_first_lora_v6: 59%|#####8 | 3515/6000 [12:37<1:00:54, 1.47s/it, lr: 1.0e-04 loss: 5.616e-01] my_first_lora_v6: 59%|#####8 | 3516/6000 [12:38<1:00:52, 1.47s/it, lr: 1.0e-04 loss: 6.178e-01] my_first_lora_v6: 59%|#####8 | 3516/6000 [12:38<1:00:52, 1.47s/it, lr: 1.0e-04 loss: 6.178e-01] my_first_lora_v6: 59%|#####8 | 3517/6000 [12:40<1:00:50, 1.47s/it, lr: 1.0e-04 loss: 2.657e-01] my_first_lora_v6: 59%|#####8 | 3517/6000 [12:40<1:00:50, 1.47s/it, lr: 1.0e-04 loss: 2.657e-01] my_first_lora_v6: 59%|#####8 | 3518/6000 [12:40<1:00:45, 1.47s/it, lr: 1.0e-04 loss: 7.031e-01] my_first_lora_v6: 59%|#####8 | 3518/6000 [12:40<1:00:45, 1.47s/it, lr: 1.0e-04 loss: 7.031e-01] my_first_lora_v6: 59%|#####8 | 3519/6000 [12:43<1:00:48, 1.47s/it, lr: 1.0e-04 loss: 2.264e-02] my_first_lora_v6: 59%|#####8 | 3519/6000 [12:43<1:00:48, 1.47s/it, lr: 1.0e-04 loss: 2.264e-02] my_first_lora_v6: 59%|#####8 | 3520/6000 [12:45<1:00:51, 1.47s/it, lr: 1.0e-04 loss: 3.555e-02] my_first_lora_v6: 59%|#####8 | 3520/6000 [12:45<1:00:51, 1.47s/it, lr: 1.0e-04 loss: 3.555e-02] my_first_lora_v6: 59%|#####8 | 3521/6000 [12:46<1:00:48, 1.47s/it, lr: 1.0e-04 loss: 3.333e-01] my_first_lora_v6: 59%|#####8 | 3521/6000 [12:46<1:00:48, 1.47s/it, lr: 1.0e-04 loss: 3.333e-01] my_first_lora_v6: 59%|#####8 | 3522/6000 [12:49<1:00:53, 1.47s/it, lr: 1.0e-04 loss: 3.871e-01] my_first_lora_v6: 59%|#####8 | 3522/6000 [12:49<1:00:53, 1.47s/it, lr: 1.0e-04 loss: 3.871e-01] my_first_lora_v6: 59%|#####8 | 3523/6000 [12:50<1:00:48, 1.47s/it, lr: 1.0e-04 loss: 2.474e-01] my_first_lora_v6: 59%|#####8 | 3523/6000 [12:50<1:00:48, 1.47s/it, lr: 1.0e-04 loss: 2.474e-01] my_first_lora_v6: 59%|#####8 | 3524/6000 [12:50<1:00:42, 1.47s/it, lr: 1.0e-04 loss: 8.016e-01] my_first_lora_v6: 59%|#####8 | 3524/6000 [12:50<1:00:42, 1.47s/it, lr: 1.0e-04 loss: 8.016e-01] my_first_lora_v6: 59%|#####8 | 3525/6000 [12:51<1:00:37, 1.47s/it, lr: 1.0e-04 loss: 3.817e-01] my_first_lora_v6: 59%|#####8 | 3525/6000 [12:51<1:00:37, 1.47s/it, lr: 1.0e-04 loss: 3.817e-01] my_first_lora_v6: 59%|#####8 | 3526/6000 [12:53<1:00:39, 1.47s/it, lr: 1.0e-04 loss: 1.294e-01] my_first_lora_v6: 59%|#####8 | 3526/6000 [12:53<1:00:39, 1.47s/it, lr: 1.0e-04 loss: 1.294e-01] my_first_lora_v6: 59%|#####8 | 3527/6000 [12:56<1:00:43, 1.47s/it, lr: 1.0e-04 loss: 6.957e-01] my_first_lora_v6: 59%|#####8 | 3527/6000 [12:56<1:00:43, 1.47s/it, lr: 1.0e-04 loss: 6.957e-01] my_first_lora_v6: 59%|#####8 | 3528/6000 [12:58<1:00:43, 1.47s/it, lr: 1.0e-04 loss: 6.211e-01] my_first_lora_v6: 59%|#####8 | 3528/6000 [12:58<1:00:43, 1.47s/it, lr: 1.0e-04 loss: 6.211e-01] my_first_lora_v6: 59%|#####8 | 3529/6000 [13:00<1:00:47, 1.48s/it, lr: 1.0e-04 loss: 9.403e-02] my_first_lora_v6: 59%|#####8 | 3529/6000 [13:00<1:00:47, 1.48s/it, lr: 1.0e-04 loss: 9.403e-02] my_first_lora_v6: 59%|#####8 | 3530/6000 [13:02<1:00:45, 1.48s/it, lr: 1.0e-04 loss: 5.548e-01] my_first_lora_v6: 59%|#####8 | 3530/6000 [13:02<1:00:45, 1.48s/it, lr: 1.0e-04 loss: 5.548e-01] my_first_lora_v6: 59%|#####8 | 3531/6000 [13:03<1:00:40, 1.47s/it, lr: 1.0e-04 loss: 5.027e-01] my_first_lora_v6: 59%|#####8 | 3531/6000 [13:03<1:00:40, 1.47s/it, lr: 1.0e-04 loss: 5.027e-01] my_first_lora_v6: 59%|#####8 | 3532/6000 [13:03<1:00:35, 1.47s/it, lr: 1.0e-04 loss: 5.629e-01] my_first_lora_v6: 59%|#####8 | 3532/6000 [13:03<1:00:35, 1.47s/it, lr: 1.0e-04 loss: 5.629e-01] my_first_lora_v6: 59%|#####8 | 3533/6000 [13:05<1:00:33, 1.47s/it, lr: 1.0e-04 loss: 7.349e-01] my_first_lora_v6: 59%|#####8 | 3533/6000 [13:05<1:00:33, 1.47s/it, lr: 1.0e-04 loss: 7.349e-01] my_first_lora_v6: 59%|#####8 | 3534/6000 [13:05<1:00:28, 1.47s/it, lr: 1.0e-04 loss: 7.113e-01] my_first_lora_v6: 59%|#####8 | 3534/6000 [13:05<1:00:28, 1.47s/it, lr: 1.0e-04 loss: 7.113e-01] my_first_lora_v6: 59%|#####8 | 3535/6000 [13:08<1:00:31, 1.47s/it, lr: 1.0e-04 loss: 1.792e-01] my_first_lora_v6: 59%|#####8 | 3535/6000 [13:08<1:00:31, 1.47s/it, lr: 1.0e-04 loss: 1.792e-01] my_first_lora_v6: 59%|#####8 | 3536/6000 [13:10<1:00:33, 1.47s/it, lr: 1.0e-04 loss: 4.750e-01] my_first_lora_v6: 59%|#####8 | 3536/6000 [13:10<1:00:33, 1.47s/it, lr: 1.0e-04 loss: 4.750e-01] my_first_lora_v6: 59%|#####8 | 3537/6000 [13:11<1:00:28, 1.47s/it, lr: 1.0e-04 loss: 6.528e-01] my_first_lora_v6: 59%|#####8 | 3537/6000 [13:11<1:00:28, 1.47s/it, lr: 1.0e-04 loss: 6.528e-01] my_first_lora_v6: 59%|#####8 | 3538/6000 [13:13<1:00:31, 1.48s/it, lr: 1.0e-04 loss: 6.157e-01] my_first_lora_v6: 59%|#####8 | 3538/6000 [13:13<1:00:31, 1.48s/it, lr: 1.0e-04 loss: 6.157e-01] my_first_lora_v6: 59%|#####8 | 3539/6000 [13:14<1:00:29, 1.47s/it, lr: 1.0e-04 loss: 4.934e-01] my_first_lora_v6: 59%|#####8 | 3539/6000 [13:14<1:00:29, 1.47s/it, lr: 1.0e-04 loss: 4.934e-01] my_first_lora_v6: 59%|#####8 | 3540/6000 [13:16<1:00:26, 1.47s/it, lr: 1.0e-04 loss: 4.718e-01] my_first_lora_v6: 59%|#####8 | 3540/6000 [13:16<1:00:26, 1.47s/it, lr: 1.0e-04 loss: 4.718e-01] my_first_lora_v6: 59%|#####9 | 3541/6000 [13:17<1:00:23, 1.47s/it, lr: 1.0e-04 loss: 3.532e-02] my_first_lora_v6: 59%|#####9 | 3541/6000 [13:17<1:00:23, 1.47s/it, lr: 1.0e-04 loss: 3.532e-02] my_first_lora_v6: 59%|#####9 | 3542/6000 [13:19<1:00:27, 1.48s/it, lr: 1.0e-04 loss: 3.563e-01] my_first_lora_v6: 59%|#####9 | 3542/6000 [13:19<1:00:27, 1.48s/it, lr: 1.0e-04 loss: 3.563e-01] my_first_lora_v6: 59%|#####9 | 3543/6000 [13:20<1:00:22, 1.47s/it, lr: 1.0e-04 loss: 3.937e-01] my_first_lora_v6: 59%|#####9 | 3543/6000 [13:20<1:00:22, 1.47s/it, lr: 1.0e-04 loss: 3.937e-01] my_first_lora_v6: 59%|#####9 | 3544/6000 [13:21<1:00:20, 1.47s/it, lr: 1.0e-04 loss: 4.065e-01] my_first_lora_v6: 59%|#####9 | 3544/6000 [13:21<1:00:20, 1.47s/it, lr: 1.0e-04 loss: 4.065e-01] my_first_lora_v6: 59%|#####9 | 3545/6000 [13:24<1:00:22, 1.48s/it, lr: 1.0e-04 loss: 1.725e-01] my_first_lora_v6: 59%|#####9 | 3545/6000 [13:24<1:00:22, 1.48s/it, lr: 1.0e-04 loss: 1.725e-01] my_first_lora_v6: 59%|#####9 | 3546/6000 [13:24<1:00:17, 1.47s/it, lr: 1.0e-04 loss: 1.790e-01] my_first_lora_v6: 59%|#####9 | 3546/6000 [13:24<1:00:17, 1.47s/it, lr: 1.0e-04 loss: 1.790e-01]Error running job: Job stopped
========================================
Result:
- 0 completed jobs
- 1 failure
========================================
Traceback (most recent call last):
Traceback (most recent call last):
File "/teamspace/studios/this_studio/ai-toolkit/run.py", line 120, in <module>
File "/teamspace/studios/this_studio/ai-toolkit/run.py", line 120, in <module>
main()main()
File "/teamspace/studios/this_studio/ai-toolkit/run.py", line 108, in main
File "/teamspace/studios/this_studio/ai-toolkit/run.py", line 108, in main
raise eraise e
File "/teamspace/studios/this_studio/ai-toolkit/run.py", line 96, in main
File "/teamspace/studios/this_studio/ai-toolkit/run.py", line 96, in main
job.run()job.run()
File "/teamspace/studios/this_studio/ai-toolkit/jobs/ExtensionJob.py", line 22, in run
File "/teamspace/studios/this_studio/ai-toolkit/jobs/ExtensionJob.py", line 22, in run
process.run()process.run()
File "/teamspace/studios/this_studio/ai-toolkit/jobs/process/BaseSDTrainProcess.py", line 2353, in run
File "/teamspace/studios/this_studio/ai-toolkit/jobs/process/BaseSDTrainProcess.py", line 2353, in run
self.end_step_hook()self.end_step_hook()
File "/teamspace/studios/this_studio/ai-toolkit/extensions_built_in/sd_trainer/DiffusionTrainer.py", line 264, in end_step_hook
File "/teamspace/studios/this_studio/ai-toolkit/extensions_built_in/sd_trainer/DiffusionTrainer.py", line 264, in end_step_hook
self.maybe_stop()self.maybe_stop()
File "/teamspace/studios/this_studio/ai-toolkit/extensions_built_in/sd_trainer/DiffusionTrainer.py", line 147, in maybe_stop
File "/teamspace/studios/this_studio/ai-toolkit/extensions_built_in/sd_trainer/DiffusionTrainer.py", line 147, in maybe_stop
raise Exception("Job stopped")raise Exception("Job stopped")
ExceptionException: : Job stoppedJob stopped
my_first_lora_v6: 59%|#####9 | 3547/6000 [13:26<1:00:16, 1.47s/it, lr: 1.0e-04 loss: 1.790e-01] my_first_lora_v6: 59%|#####9 | 3547/6000 [13:26<1:00:16, 1.47s/it, lr: 1.0e-04 loss: 1.790e-01]