bbkdevops/unicosys-hypergraph-bucket / tinymind-native-8b-remote-handoff /native_axiom_regenesis_8b_remote_train_from_hf_bucket.ipynb
bbkdevops's picture
download
raw
3.39 kB
{
"cells": [
{
"cell_type": "markdown",
"metadata": {},
"source": [
"# TinyMind AxiomReGenesis 8B Target Remote Training\n",
"This notebook trains the 8.22B-class native target. It does not claim quality until probes pass.\n"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"!pip -q install -U 'huggingface_hub[hf_transfer]'\n",
"!rm -rf /content/tinymind_remote && mkdir -p /content/tinymind_remote\n",
"!hf sync hf://buckets/bbkdevops/unicosys-hypergraph-bucket/tinymind-native-8b-remote-handoff /content/tinymind_remote/handoff\n",
"!unzip -q /content/tinymind_remote/handoff/tinymind_native_8b_remote_bundle.zip -d /content/tinymind_remote\n",
"%cd /content/tinymind_remote/bundle\n"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"!pip -q install -r requirements.txt || true\n",
"import torch, sys\n",
"print('python', sys.version)\n",
"print('cuda available', torch.cuda.is_available())\n",
"print('gpu', torch.cuda.get_device_name(0) if torch.cuda.is_available() else 'cpu')\n"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"python -m train.cli native-axiom-regenesis-train --dataset /content/tinymind_remote/bundle/data/omni_round_curriculum.jsonl --out-dir /content/tinymind_axiom_regenesis_8b_target --max-steps 50000 --eval-records 256 --limit-records 10000 --dim 2816 --layers 48 --lanes 64 --seq-len 1024 --vocab-size 4096 --tokenizer-mode char_v1 --virtual-dim 1048576 --basis-rank 256 --facets 64 --learning-rate 1.2e-05 --train-batch-size 1 --device cuda\n"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"python -m train.cli native-baseline-probe --out-dir /content/tinymind_axiom_regenesis_8b_probe --native-checkpoint /content/tinymind_axiom_regenesis_8b_target/checkpoint.pt --baseline-report /content/tinymind_remote/bundle/baseline/deep_core_probe_report.json --max-new-tokens 160 --device cuda\n"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"python -m train.cli native-broad-probe --out-dir /content/tinymind_axiom_regenesis_8b_broad_probe --native-checkpoint /content/tinymind_axiom_regenesis_8b_target/checkpoint.pt --max-new-tokens 192 --device cuda\n"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": [
"!zip -qr /content/tinymind_axiom_regenesis_8b_results.zip /content/tinymind_axiom_regenesis_8b_target /content/tinymind_axiom_regenesis_8b_probe /content/tinymind_axiom_regenesis_8b_broad_probe\n",
"files.download('/content/tinymind_axiom_regenesis_8b_results.zip')\n"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
}
},
"nbformat": 4,
"nbformat_minor": 5
}

Xet Storage Details

Size:
3.39 kB
·
Xet hash:
dd427cee20f97380af58c11c4d3e04d2eaa820c5967b8613b794677a4a00909e

Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.