QwenFranklin-ModelZoo / manifest.json
Hermes Agent
Add Qwen Franklin model zoo and demo
2763681
Raw
History Blame Contribute Delete
45.1 kB
{
"created_at": "2026-06-24T07:48:11",
"zoo_dir": ".",
"model_count": 22,
"total_adapter_copy_bytes": 25731631872,
"data_counts": {
"franklin_7b_coherence_repair_v2.jsonl": 287,
"franklin_7b_factual_coherence_repair_v3.jsonl": 308,
"franklin_identity_reinforcement.jsonl": 212,
"franklin_negative_identity_thinking.jsonl": 829,
"franklin_persona_openai_expanded.jsonl": 891,
"franklin_persona_sft.jsonl": 288,
"franklin_qwen3_4b_answer_only.jsonl": 3253,
"franklin_qwen3_4b_english_lock_cleanup.jsonl": 816,
"franklin_qwen3_4b_toolcall_cleanup.jsonl": 920,
"franklin_qwen3_8b_chatml_answer_clean.jsonl": 2400,
"franklin_thinking_sft.jsonl": 1259,
"franklin_thinking_strong_reinforcement.jsonl": 575,
"franklin_v4_general_balanced_thinking.jsonl": 825,
"franklin_v5_out_of_domain_correction.jsonl": 684,
"franklin_v6_1_targeted_ood_fix.jsonl": 870,
"franklin_v6_contrastive_thinking.jsonl": 599,
"franklin_v6_contrastive_thinking_final.jsonl": 2684,
"franklin_v6_contrastive_thinking_weighted.jsonl": 1584,
"franklin_v7_natural_dialogue_repair.jsonl": 1830,
"franklin_v8_minimal_thought_repair.jsonl": 1040,
"franklin_v9_factual_dialogue.jsonl": 3019
},
"models": [
{
"name": "qwen2.5-7b-ben-franklin-v1-lite-r4-qv",
"adapter_dir": "adapters/qwen2.5-7b-ben-franklin-v1-lite-r4-qv",
"size_bytes": 68950305,
"size_gb": 0.06,
"adapter_safetensors_mb": 4.8,
"sha256_adapter_model": "f1d6d49a4ecb8597501d50089688c8ce950c1b7ffa92f0d69099fa62a7a1f72a",
"base_model": "unsloth/Qwen2.5-7B-Instruct-bnb-4bit",
"base_class": "Qwen2.5 7B Instruct 4-bit",
"lora_r": 4,
"lora_alpha": 8,
"target_modules": [
"v_proj",
"q_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
]
],
"benchmark": {
"score": 30,
"flags": {
"base_identity_leak": 1,
"overdenial": 1
},
"bench_file": "benchmarks/franklin_coherence/franklin_coherence_20260623_080144.json",
"html": "benchmarks/franklin_coherence/franklin_coherence_20260623_080144.html"
},
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark.",
"Benchmark score: 30 with flags {'base_identity_leak': 1, 'overdenial': 1}."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen2.5-7b-ben-franklin-v2-coherence-r4-qv",
"adapter_dir": "adapters/qwen2.5-7b-ben-franklin-v2-coherence-r4-qv",
"size_bytes": 68959660,
"size_gb": 0.06,
"adapter_safetensors_mb": 4.8,
"sha256_adapter_model": "d1bf06fb647a8ecc08089f43ff4808e23225729036038bb5567fc97391bead2e",
"base_model": "unsloth/Qwen2.5-7B-Instruct-bnb-4bit",
"base_class": "Qwen2.5 7B Instruct 4-bit",
"lora_r": 4,
"lora_alpha": 8,
"target_modules": [
"q_proj",
"v_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
],
[
"franklin_7b_coherence_repair_v2.jsonl",
287
]
],
"benchmark": {
"score": 33,
"flags": {
"base_identity_leak": 1
},
"bench_file": "benchmarks/franklin_coherence/franklin_coherence_20260623_081743.json",
"html": "benchmarks/franklin_coherence/franklin_coherence_20260623_081743.html"
},
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark.",
"Best modest improvement over 7B v1 for coherence and reduced over-denial in the broad benchmark.",
"Benchmark score: 33 with flags {'base_identity_leak': 1}."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen2.5-7b-ben-franklin-v3-factual-coherence-r4-qv",
"adapter_dir": "adapters/qwen2.5-7b-ben-franklin-v3-factual-coherence-r4-qv",
"size_bytes": 68963988,
"size_gb": 0.06,
"adapter_safetensors_mb": 4.8,
"sha256_adapter_model": "f76a2640a84889c7370e8cf8c4c0c6cc71e53a546a8cf7008f8c90ee7588769b",
"base_model": "unsloth/Qwen2.5-7B-Instruct-bnb-4bit",
"base_class": "Qwen2.5 7B Instruct 4-bit",
"lora_r": 4,
"lora_alpha": 8,
"target_modules": [
"q_proj",
"v_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
],
[
"franklin_7b_coherence_repair_v2.jsonl",
287
],
[
"franklin_7b_factual_coherence_repair_v3.jsonl",
308
]
],
"benchmark": {
"score": 35,
"flags": {
"base_identity_leak": 1
},
"bench_file": "benchmarks/franklin_coherence/franklin_coherence_20260623_082910.json",
"html": "benchmarks/franklin_coherence/franklin_coherence_20260623_082910.html"
},
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark.",
"Best numeric coherence benchmark score among evaluated 7B adapters.",
"Benchmark score: 35 with flags {'base_identity_leak': 1}."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied.",
"Despite the name, not a clean factual fix: Craven Street answer still hallucinated."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen2.5-7b-ben-franklin-v3c-factual-r8-qv-from-base",
"adapter_dir": "adapters/qwen2.5-7b-ben-franklin-v3c-factual-r8-qv-from-base",
"size_bytes": 88585447,
"size_gb": 0.08,
"adapter_safetensors_mb": 9.6,
"sha256_adapter_model": "8f71e370eb4e7ddec058439e64cb608a54ebf4aad975a9a35154f6bf320f619a",
"base_model": "unsloth/Qwen2.5-7B-Instruct-bnb-4bit",
"base_class": "Qwen2.5 7B Instruct 4-bit",
"lora_r": 8,
"lora_alpha": 16,
"target_modules": [
"v_proj",
"q_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
],
[
"franklin_7b_factual_coherence_repair_v3.jsonl",
308
]
],
"benchmark": {
"score": 28,
"flags": {
"base_identity_leak": 1,
"overdenial": 1
},
"bench_file": "benchmarks/franklin_coherence/franklin_coherence_20260623_084048.json",
"html": "benchmarks/franklin_coherence/franklin_coherence_20260623_084048.html"
},
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark.",
"Proves r=8 q/v LoRA from clean 7B base can train on this 8GB GPU.",
"Benchmark score: 28 with flags {'base_identity_leak': 1, 'overdenial': 1}."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied.",
"Regressed versus v1/v2/v3 in the coherence benchmark."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen3-4b-instruct-2507-ben-franklin-v1-lora",
"adapter_dir": "adapters/qwen3-4b-instruct-2507-ben-franklin-v1-lora",
"size_bytes": 1443396342,
"size_gb": 1.34,
"adapter_safetensors_mb": 126.1,
"sha256_adapter_model": "e109b9fdb3da837c52d86e58dd2e3ba286dcac9b68d5596b56b28b6dc2d52c2b",
"base_model": "unsloth/Qwen3-4B-Instruct-2507-unsloth-bnb-4bit",
"base_class": "Qwen3 4B Instruct 4-bit",
"lora_r": 16,
"lora_alpha": 32,
"target_modules": [
"o_proj",
"v_proj",
"k_proj",
"gate_proj",
"up_proj",
"down_proj",
"q_proj"
],
"data_mix": [
[
"franklin_qwen3_4b_answer_only.jsonl",
3253
]
],
"benchmark": null,
"strengths": [
"Middle-size family: more capable than 1.7B while still comfortable on 8GB VRAM.",
"Several variants target ChatML/completion formatting, tool-call cleanup, and English-lock behavior."
],
"weaknesses": [
"Some later 4B adapters, especially v5, know targeted facts but emit visible tool_call tags offline.",
"Can leak base-model identity or policy/meta phrasing depending on prompt path."
],
"project_uses": [
"Fast local prototyping and comparison against the 7B family.",
"Source of good factual repair examples after stripping tool-call pollution."
],
"compute_requirements": "Inference/training: comfortable on RTX 3070 8GB in 4-bit. Full-module LoRA at r=16-32 was used historically; expect several GB VRAM and slower but practical training."
},
{
"name": "qwen3-4b-instruct-2507-ben-franklin-v2-chatml-lora",
"adapter_dir": "adapters/qwen3-4b-instruct-2507-ben-franklin-v2-chatml-lora",
"size_bytes": 2355646968,
"size_gb": 2.19,
"adapter_safetensors_mb": 252.1,
"sha256_adapter_model": "e6a6242d8200b0533c371296ea3c836ca3f4a4401162232bbbd02e572dcfd432",
"base_model": "unsloth/Qwen3-4B-Instruct-2507-unsloth-bnb-4bit",
"base_class": "Qwen3 4B Instruct 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"down_proj",
"q_proj",
"o_proj",
"v_proj",
"gate_proj",
"k_proj",
"up_proj"
],
"data_mix": [
[
"franklin_qwen3_4b_answer_only.jsonl",
3253
]
],
"benchmark": null,
"strengths": [
"Middle-size family: more capable than 1.7B while still comfortable on 8GB VRAM.",
"Several variants target ChatML/completion formatting, tool-call cleanup, and English-lock behavior."
],
"weaknesses": [
"Some later 4B adapters, especially v5, know targeted facts but emit visible tool_call tags offline.",
"Can leak base-model identity or policy/meta phrasing depending on prompt path."
],
"project_uses": [
"Fast local prototyping and comparison against the 7B family.",
"Source of good factual repair examples after stripping tool-call pollution."
],
"compute_requirements": "Inference/training: comfortable on RTX 3070 8GB in 4-bit. Full-module LoRA at r=16-32 was used historically; expect several GB VRAM and slower but practical training."
},
{
"name": "qwen3-4b-instruct-2507-ben-franklin-v3-chatml-completions-lora",
"adapter_dir": "adapters/qwen3-4b-instruct-2507-ben-franklin-v3-chatml-completions-lora",
"size_bytes": 2355647101,
"size_gb": 2.19,
"adapter_safetensors_mb": 252.1,
"sha256_adapter_model": "e6a6242d8200b0533c371296ea3c836ca3f4a4401162232bbbd02e572dcfd432",
"base_model": "unsloth/Qwen3-4B-Instruct-2507-unsloth-bnb-4bit",
"base_class": "Qwen3 4B Instruct 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"q_proj",
"v_proj",
"up_proj",
"gate_proj",
"k_proj",
"down_proj",
"o_proj"
],
"data_mix": [
[
"franklin_qwen3_4b_answer_only.jsonl",
3253
]
],
"benchmark": null,
"strengths": [
"Middle-size family: more capable than 1.7B while still comfortable on 8GB VRAM.",
"Several variants target ChatML/completion formatting, tool-call cleanup, and English-lock behavior."
],
"weaknesses": [
"Some later 4B adapters, especially v5, know targeted facts but emit visible tool_call tags offline.",
"Can leak base-model identity or policy/meta phrasing depending on prompt path."
],
"project_uses": [
"Fast local prototyping and comparison against the 7B family.",
"Source of good factual repair examples after stripping tool-call pollution."
],
"compute_requirements": "Inference/training: comfortable on RTX 3070 8GB in 4-bit. Full-module LoRA at r=16-32 was used historically; expect several GB VRAM and slower but practical training."
},
{
"name": "qwen3-4b-instruct-2507-ben-franklin-v4-toolcall-clean-lora",
"adapter_dir": "adapters/qwen3-4b-instruct-2507-ben-franklin-v4-toolcall-clean-lora",
"size_bytes": 1940397833,
"size_gb": 1.81,
"adapter_safetensors_mb": 252.1,
"sha256_adapter_model": "c5b4e589ba3c3cd4a059b8e2563c21c247f1b980dd465b4cce254496ac53f9f2",
"base_model": "unsloth/Qwen3-4B-Instruct-2507-unsloth-bnb-4bit",
"base_class": "Qwen3 4B Instruct 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"o_proj",
"gate_proj",
"q_proj",
"k_proj",
"down_proj",
"v_proj",
"up_proj"
],
"data_mix": [
[
"franklin_qwen3_4b_toolcall_cleanup.jsonl",
920
]
],
"benchmark": null,
"strengths": [
"Middle-size family: more capable than 1.7B while still comfortable on 8GB VRAM.",
"Several variants target ChatML/completion formatting, tool-call cleanup, and English-lock behavior.",
"Targeted cleanup of visible tool_call artifacts."
],
"weaknesses": [
"Some later 4B adapters, especially v5, know targeted facts but emit visible tool_call tags offline.",
"Can leak base-model identity or policy/meta phrasing depending on prompt path."
],
"project_uses": [
"Fast local prototyping and comparison against the 7B family.",
"Source of good factual repair examples after stripping tool-call pollution."
],
"compute_requirements": "Inference/training: comfortable on RTX 3070 8GB in 4-bit. Full-module LoRA at r=16-32 was used historically; expect several GB VRAM and slower but practical training."
},
{
"name": "qwen3-4b-instruct-2507-ben-franklin-v5-english-lock-lora",
"adapter_dir": "adapters/qwen3-4b-instruct-2507-ben-franklin-v5-english-lock-lora",
"size_bytes": 1940396707,
"size_gb": 1.81,
"adapter_safetensors_mb": 252.1,
"sha256_adapter_model": "1b53f3a5d4dd002990dcea61ba2fc79fa57b391d430b66069b9ac0e846ed39df",
"base_model": "unsloth/Qwen3-4B-Instruct-2507-unsloth-bnb-4bit",
"base_class": "Qwen3 4B Instruct 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"gate_proj",
"k_proj",
"v_proj",
"up_proj",
"o_proj",
"down_proj",
"q_proj"
],
"data_mix": [
[
"franklin_qwen3_4b_english_lock_cleanup.jsonl",
816
]
],
"benchmark": {
"score": -92,
"flags": {
"tool_call": 15,
"continuity_miss": 1
},
"bench_file": "benchmarks/franklin_coherence/franklin_coherence_20260623_080144.json",
"html": "benchmarks/franklin_coherence/franklin_coherence_20260623_080144.html"
},
"strengths": [
"Middle-size family: more capable than 1.7B while still comfortable on 8GB VRAM.",
"Several variants target ChatML/completion formatting, tool-call cleanup, and English-lock behavior.",
"Contains useful cleaned English/factual phrasing, including better Craven/Hewson material.",
"Benchmark score: -92 with flags {'tool_call': 15, 'continuity_miss': 1}."
],
"weaknesses": [
"Some later 4B adapters, especially v5, know targeted facts but emit visible tool_call tags offline.",
"Can leak base-model identity or policy/meta phrasing depending on prompt path.",
"Offline benchmark showed severe visible tool_call tag regression."
],
"project_uses": [
"Fast local prototyping and comparison against the 7B family.",
"Source of good factual repair examples after stripping tool-call pollution."
],
"compute_requirements": "Inference/training: comfortable on RTX 3070 8GB in 4-bit. Full-module LoRA at r=16-32 was used historically; expect several GB VRAM and slower but practical training."
},
{
"name": "qwen3-1.7b-ben-franklin-identity-reinforced-lora",
"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-identity-reinforced-lora",
"size_bytes": 1062390080,
"size_gb": 0.99,
"adapter_safetensors_mb": 133.0,
"sha256_adapter_model": "ba4df98e8adfda7dc726bbe5662c7db7fc1893d9caba7725a1a240bcb2d6d517",
"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
"base_class": "Qwen3 1.7B 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"q_proj",
"gate_proj",
"up_proj",
"o_proj",
"k_proj",
"down_proj",
"v_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
]
],
"benchmark": null,
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen3-1.7b-ben-franklin-openai-expanded-lora",
"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-openai-expanded-lora",
"size_bytes": 1289381928,
"size_gb": 1.2,
"adapter_safetensors_mb": 133.0,
"sha256_adapter_model": "d9d55ce9e2e74337783c34712246022452d333eeb4386d0cdde7e1fc01f8bf86",
"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
"base_class": "Qwen3 1.7B 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"q_proj",
"v_proj",
"k_proj",
"up_proj",
"gate_proj",
"down_proj",
"o_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
]
],
"benchmark": null,
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen3-1.7b-ben-franklin-thinking-lora",
"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-lora",
"size_bytes": 1062519403,
"size_gb": 0.99,
"adapter_safetensors_mb": 133.0,
"sha256_adapter_model": "5f5730bb9f0c8bc7e2b0858d35ecca87ea5a5ba46326738a06a0d54332262c45",
"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
"base_class": "Qwen3 1.7B 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"down_proj",
"q_proj",
"k_proj",
"up_proj",
"v_proj",
"gate_proj",
"o_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
]
],
"benchmark": null,
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen3-1.7b-ben-franklin-thinking-v2-lora",
"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v2-lora",
"size_bytes": 835640240,
"size_gb": 0.78,
"adapter_safetensors_mb": 133.0,
"sha256_adapter_model": "0a1e6a1f82eac2f68860514f3ec98ef9794f3b4f7410798efdf9e07dbffe8f6a",
"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
"base_class": "Qwen3 1.7B 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"q_proj",
"v_proj",
"down_proj",
"k_proj",
"gate_proj",
"o_proj",
"up_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
],
[
"franklin_7b_coherence_repair_v2.jsonl",
287
]
],
"benchmark": null,
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen3-1.7b-ben-franklin-thinking-v3-negative-identity-lora",
"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v3-negative-identity-lora",
"size_bytes": 835668626,
"size_gb": 0.78,
"adapter_safetensors_mb": 133.0,
"sha256_adapter_model": "4083f7365337be8a8d6126b0f4f5f2b7b944a810662693b2b8233b56b838955c",
"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
"base_class": "Qwen3 1.7B 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"q_proj",
"v_proj",
"k_proj",
"up_proj",
"down_proj",
"o_proj",
"gate_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
],
[
"franklin_7b_factual_coherence_repair_v3.jsonl",
308
]
],
"benchmark": null,
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen3-1.7b-ben-franklin-thinking-v4-balanced-lora",
"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v4-balanced-lora",
"size_bytes": 835674029,
"size_gb": 0.78,
"adapter_safetensors_mb": 133.0,
"sha256_adapter_model": "6a956e6c48621f38ca679f98d1766e37df8a96f8017eb7d771cfba537d30f8c9",
"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
"base_class": "Qwen3 1.7B 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"k_proj",
"q_proj",
"down_proj",
"v_proj",
"gate_proj",
"up_proj",
"o_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
]
],
"benchmark": null,
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen3-1.7b-ben-franklin-thinking-v5-ood-fixed-lora",
"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v5-ood-fixed-lora",
"size_bytes": 835640341,
"size_gb": 0.78,
"adapter_safetensors_mb": 133.0,
"sha256_adapter_model": "ea0d36edc5f313bfee28cc3dc59daeaed392527c2d7f936a9f0b8004c5343d00",
"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
"base_class": "Qwen3 1.7B 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"v_proj",
"up_proj",
"q_proj",
"gate_proj",
"down_proj",
"k_proj",
"o_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
]
],
"benchmark": null,
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen3-1.7b-ben-franklin-thinking-v6-1-ood-fixed-lora",
"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v6-1-ood-fixed-lora",
"size_bytes": 1062413565,
"size_gb": 0.99,
"adapter_safetensors_mb": 133.0,
"sha256_adapter_model": "7e3440142a1999e09b82a49d76d9c06238ae69695f766a388f9af36290612298",
"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
"base_class": "Qwen3 1.7B 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"v_proj",
"k_proj",
"q_proj",
"up_proj",
"gate_proj",
"down_proj",
"o_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
]
],
"benchmark": null,
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen3-1.7b-ben-franklin-thinking-v6-contrastive-lora",
"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v6-contrastive-lora",
"size_bytes": 1743156212,
"size_gb": 1.62,
"adapter_safetensors_mb": 133.0,
"sha256_adapter_model": "671973ebaf7eddb213a1ba49edff9b6ebaed7c73a8f95e8f7908217a49a1d2cb",
"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
"base_class": "Qwen3 1.7B 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"down_proj",
"q_proj",
"o_proj",
"k_proj",
"v_proj",
"gate_proj",
"up_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
]
],
"benchmark": null,
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen3-1.7b-ben-franklin-thinking-v7-natural-dialogue-lora",
"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v7-natural-dialogue-lora",
"size_bytes": 1289387473,
"size_gb": 1.2,
"adapter_safetensors_mb": 133.0,
"sha256_adapter_model": "11d38f565f7c80d7320fc85d50563e2cc6d0f94eb53e1718883578d109b31915",
"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
"base_class": "Qwen3 1.7B 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"o_proj",
"up_proj",
"v_proj",
"q_proj",
"down_proj",
"k_proj",
"gate_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
]
],
"benchmark": null,
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark.",
"Focused on more natural short conversational replies."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen3-1.7b-ben-franklin-thinking-v8-minimal-thought-lora",
"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v8-minimal-thought-lora",
"size_bytes": 1062476446,
"size_gb": 0.99,
"adapter_safetensors_mb": 133.0,
"sha256_adapter_model": "41bdd23b0760d4e57d96423622901dedca1ef8cf49d551911e41b6cc4133f06f",
"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
"base_class": "Qwen3 1.7B 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"v_proj",
"k_proj",
"o_proj",
"down_proj",
"gate_proj",
"q_proj",
"up_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
]
],
"benchmark": null,
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark.",
"Focused on reducing visible thought/over-reasoning style."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen3-1.7b-ben-franklin-thinking-v9-factual-dialogue-lora",
"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v9-factual-dialogue-lora",
"size_bytes": 1743169702,
"size_gb": 1.62,
"adapter_safetensors_mb": 133.0,
"sha256_adapter_model": "9b74f8d869a5f1fd5ba1f1b55b3ed2ff8df510afe80a80fdf63ae20a9a01bbb9",
"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
"base_class": "Qwen3 1.7B 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"v_proj",
"q_proj",
"k_proj",
"down_proj",
"gate_proj",
"up_proj",
"o_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
],
[
"franklin_7b_factual_coherence_repair_v3.jsonl",
308
]
],
"benchmark": null,
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark.",
"Focused on factual dialogue and hard Franklin biography prompts."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
},
{
"name": "qwen3-1.7b-ben-franklin-thinking-v9-from-v2-factual-dialogue-lora",
"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v9-from-v2-factual-dialogue-lora",
"size_bytes": 1743169476,
"size_gb": 1.62,
"adapter_safetensors_mb": 133.0,
"sha256_adapter_model": "b90625341d6c7c2e7cc12597b0f3a3441bebbe46cba1d25e0234920c13134afa",
"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
"base_class": "Qwen3 1.7B 4-bit",
"lora_r": 32,
"lora_alpha": 64,
"target_modules": [
"v_proj",
"up_proj",
"q_proj",
"k_proj",
"o_proj",
"down_proj",
"gate_proj"
],
"data_mix": [
[
"franklin_qwen3_8b_chatml_answer_clean.jsonl",
2400
],
[
"franklin_7b_coherence_repair_v2.jsonl",
287
],
[
"franklin_7b_factual_coherence_repair_v3.jsonl",
308
]
],
"benchmark": null,
"strengths": [
"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
"Best base reasoning/coherence among the local Franklin adapters.",
"Good short-turn continuity in the coherence benchmark.",
"Focused on factual dialogue and hard Franklin biography prompts."
],
"weaknesses": [
"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
"q/v-only LoRA is weak for implanting stubborn factual corrections.",
"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
],
"project_uses": [
"Conversational Franklin persona in local apps.",
"A strong baseline for RAG-backed historical character demos.",
"Best starting point for further 7B experiments."
],
"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
}
]
}