purplesquirrelnetworks
/

purple-squirrel-r1-multichain-lora

Text Generation

purple-squirrel

local-inference

Model card Files Files and versions

purplesquirrelnetworks committed on Feb 22

Commit

d7c09a2

·

verified ·

1 Parent(s): 6a0c1ac

Upload adapter_config.json with huggingface_hub

Files changed (1) hide show

adapter_config.json +40 -0

adapter_config.json ADDED Viewed

	@@ -0,0 +1,40 @@

+{
+    "adapter_path": "/Volumes/Virtual Server/projects/psm-ops/multichain-day-model/model-output/mlx-adapters",
+    "batch_size": 1,
+    "config": null,
+    "data": "/Volumes/Virtual Server/projects/psm-ops/multichain-day-model/model-output/mlx-training-data",
+    "fine_tune_type": "lora",
+    "grad_accumulation_steps": 1,
+    "grad_checkpoint": true,
+    "iters": 200,
+    "learning_rate": 1e-05,
+    "lora_parameters": {
+        "rank": 8,
+        "dropout": 0.0,
+        "scale": 20.0
+    },
+    "lr_schedule": null,
+    "mask_prompt": false,
+    "max_seq_length": 1024,
+    "model": "mlx-community/DeepSeek-R1-Distill-Llama-8B-4bit",
+    "num_layers": 4,
+    "optimizer": "adam",
+    "optimizer_config": {
+        "adam": {},
+        "adamw": {},
+        "muon": {},
+        "sgd": {},
+        "adafactor": {}
+    },
+    "project_name": null,
+    "report_to": null,
+    "resume_adapter_file": null,
+    "save_every": 100,
+    "seed": 42,
+    "steps_per_eval": 50,
+    "steps_per_report": 10,
+    "test": false,
+    "test_batches": 500,
+    "train": true,
+    "val_batches": 25
+}