Hermes Agent

Add Qwen Franklin model zoo and demo

2763681 6 days ago

45.1 kB

	{
	"created_at": "2026-06-24T07:48:11",
	"zoo_dir": ".",
	"model_count": 22,
	"total_adapter_copy_bytes": 25731631872,
	"data_counts": {
	"franklin_7b_coherence_repair_v2.jsonl": 287,
	"franklin_7b_factual_coherence_repair_v3.jsonl": 308,
	"franklin_identity_reinforcement.jsonl": 212,
	"franklin_negative_identity_thinking.jsonl": 829,
	"franklin_persona_openai_expanded.jsonl": 891,
	"franklin_persona_sft.jsonl": 288,
	"franklin_qwen3_4b_answer_only.jsonl": 3253,
	"franklin_qwen3_4b_english_lock_cleanup.jsonl": 816,
	"franklin_qwen3_4b_toolcall_cleanup.jsonl": 920,
	"franklin_qwen3_8b_chatml_answer_clean.jsonl": 2400,
	"franklin_thinking_sft.jsonl": 1259,
	"franklin_thinking_strong_reinforcement.jsonl": 575,
	"franklin_v4_general_balanced_thinking.jsonl": 825,
	"franklin_v5_out_of_domain_correction.jsonl": 684,
	"franklin_v6_1_targeted_ood_fix.jsonl": 870,
	"franklin_v6_contrastive_thinking.jsonl": 599,
	"franklin_v6_contrastive_thinking_final.jsonl": 2684,
	"franklin_v6_contrastive_thinking_weighted.jsonl": 1584,
	"franklin_v7_natural_dialogue_repair.jsonl": 1830,
	"franklin_v8_minimal_thought_repair.jsonl": 1040,
	"franklin_v9_factual_dialogue.jsonl": 3019
	},
	"models": [
	{
	"name": "qwen2.5-7b-ben-franklin-v1-lite-r4-qv",
	"adapter_dir": "adapters/qwen2.5-7b-ben-franklin-v1-lite-r4-qv",
	"size_bytes": 68950305,
	"size_gb": 0.06,
	"adapter_safetensors_mb": 4.8,
	"sha256_adapter_model": "f1d6d49a4ecb8597501d50089688c8ce950c1b7ffa92f0d69099fa62a7a1f72a",
	"base_model": "unsloth/Qwen2.5-7B-Instruct-bnb-4bit",
	"base_class": "Qwen2.5 7B Instruct 4-bit",
	"lora_r": 4,
	"lora_alpha": 8,
	"target_modules": [
	"v_proj",
	"q_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	]
	],
	"benchmark": {
	"score": 30,
	"flags": {
	"base_identity_leak": 1,
	"overdenial": 1
	},
	"bench_file": "benchmarks/franklin_coherence/franklin_coherence_20260623_080144.json",
	"html": "benchmarks/franklin_coherence/franklin_coherence_20260623_080144.html"
	},
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark.",
	"Benchmark score: 30 with flags {'base_identity_leak': 1, 'overdenial': 1}."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen2.5-7b-ben-franklin-v2-coherence-r4-qv",
	"adapter_dir": "adapters/qwen2.5-7b-ben-franklin-v2-coherence-r4-qv",
	"size_bytes": 68959660,
	"size_gb": 0.06,
	"adapter_safetensors_mb": 4.8,
	"sha256_adapter_model": "d1bf06fb647a8ecc08089f43ff4808e23225729036038bb5567fc97391bead2e",
	"base_model": "unsloth/Qwen2.5-7B-Instruct-bnb-4bit",
	"base_class": "Qwen2.5 7B Instruct 4-bit",
	"lora_r": 4,
	"lora_alpha": 8,
	"target_modules": [
	"q_proj",
	"v_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	],
	[
	"franklin_7b_coherence_repair_v2.jsonl",
	287
	]
	],
	"benchmark": {
	"score": 33,
	"flags": {
	"base_identity_leak": 1
	},
	"bench_file": "benchmarks/franklin_coherence/franklin_coherence_20260623_081743.json",
	"html": "benchmarks/franklin_coherence/franklin_coherence_20260623_081743.html"
	},
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark.",
	"Best modest improvement over 7B v1 for coherence and reduced over-denial in the broad benchmark.",
	"Benchmark score: 33 with flags {'base_identity_leak': 1}."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen2.5-7b-ben-franklin-v3-factual-coherence-r4-qv",
	"adapter_dir": "adapters/qwen2.5-7b-ben-franklin-v3-factual-coherence-r4-qv",
	"size_bytes": 68963988,
	"size_gb": 0.06,
	"adapter_safetensors_mb": 4.8,
	"sha256_adapter_model": "f76a2640a84889c7370e8cf8c4c0c6cc71e53a546a8cf7008f8c90ee7588769b",
	"base_model": "unsloth/Qwen2.5-7B-Instruct-bnb-4bit",
	"base_class": "Qwen2.5 7B Instruct 4-bit",
	"lora_r": 4,
	"lora_alpha": 8,
	"target_modules": [
	"q_proj",
	"v_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	],
	[
	"franklin_7b_coherence_repair_v2.jsonl",
	287
	],
	[
	"franklin_7b_factual_coherence_repair_v3.jsonl",
	308
	]
	],
	"benchmark": {
	"score": 35,
	"flags": {
	"base_identity_leak": 1
	},
	"bench_file": "benchmarks/franklin_coherence/franklin_coherence_20260623_082910.json",
	"html": "benchmarks/franklin_coherence/franklin_coherence_20260623_082910.html"
	},
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark.",
	"Best numeric coherence benchmark score among evaluated 7B adapters.",
	"Benchmark score: 35 with flags {'base_identity_leak': 1}."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied.",
	"Despite the name, not a clean factual fix: Craven Street answer still hallucinated."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen2.5-7b-ben-franklin-v3c-factual-r8-qv-from-base",
	"adapter_dir": "adapters/qwen2.5-7b-ben-franklin-v3c-factual-r8-qv-from-base",
	"size_bytes": 88585447,
	"size_gb": 0.08,
	"adapter_safetensors_mb": 9.6,
	"sha256_adapter_model": "8f71e370eb4e7ddec058439e64cb608a54ebf4aad975a9a35154f6bf320f619a",
	"base_model": "unsloth/Qwen2.5-7B-Instruct-bnb-4bit",
	"base_class": "Qwen2.5 7B Instruct 4-bit",
	"lora_r": 8,
	"lora_alpha": 16,
	"target_modules": [
	"v_proj",
	"q_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	],
	[
	"franklin_7b_factual_coherence_repair_v3.jsonl",
	308
	]
	],
	"benchmark": {
	"score": 28,
	"flags": {
	"base_identity_leak": 1,
	"overdenial": 1
	},
	"bench_file": "benchmarks/franklin_coherence/franklin_coherence_20260623_084048.json",
	"html": "benchmarks/franklin_coherence/franklin_coherence_20260623_084048.html"
	},
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark.",
	"Proves r=8 q/v LoRA from clean 7B base can train on this 8GB GPU.",
	"Benchmark score: 28 with flags {'base_identity_leak': 1, 'overdenial': 1}."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied.",
	"Regressed versus v1/v2/v3 in the coherence benchmark."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen3-4b-instruct-2507-ben-franklin-v1-lora",
	"adapter_dir": "adapters/qwen3-4b-instruct-2507-ben-franklin-v1-lora",
	"size_bytes": 1443396342,
	"size_gb": 1.34,
	"adapter_safetensors_mb": 126.1,
	"sha256_adapter_model": "e109b9fdb3da837c52d86e58dd2e3ba286dcac9b68d5596b56b28b6dc2d52c2b",
	"base_model": "unsloth/Qwen3-4B-Instruct-2507-unsloth-bnb-4bit",
	"base_class": "Qwen3 4B Instruct 4-bit",
	"lora_r": 16,
	"lora_alpha": 32,
	"target_modules": [
	"o_proj",
	"v_proj",
	"k_proj",
	"gate_proj",
	"up_proj",
	"down_proj",
	"q_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_4b_answer_only.jsonl",
	3253
	]
	],
	"benchmark": null,
	"strengths": [
	"Middle-size family: more capable than 1.7B while still comfortable on 8GB VRAM.",
	"Several variants target ChatML/completion formatting, tool-call cleanup, and English-lock behavior."
	],
	"weaknesses": [
	"Some later 4B adapters, especially v5, know targeted facts but emit visible tool_call tags offline.",
	"Can leak base-model identity or policy/meta phrasing depending on prompt path."
	],
	"project_uses": [
	"Fast local prototyping and comparison against the 7B family.",
	"Source of good factual repair examples after stripping tool-call pollution."
	],
	"compute_requirements": "Inference/training: comfortable on RTX 3070 8GB in 4-bit. Full-module LoRA at r=16-32 was used historically; expect several GB VRAM and slower but practical training."
	},
	{
	"name": "qwen3-4b-instruct-2507-ben-franklin-v2-chatml-lora",
	"adapter_dir": "adapters/qwen3-4b-instruct-2507-ben-franklin-v2-chatml-lora",
	"size_bytes": 2355646968,
	"size_gb": 2.19,
	"adapter_safetensors_mb": 252.1,
	"sha256_adapter_model": "e6a6242d8200b0533c371296ea3c836ca3f4a4401162232bbbd02e572dcfd432",
	"base_model": "unsloth/Qwen3-4B-Instruct-2507-unsloth-bnb-4bit",
	"base_class": "Qwen3 4B Instruct 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"down_proj",
	"q_proj",
	"o_proj",
	"v_proj",
	"gate_proj",
	"k_proj",
	"up_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_4b_answer_only.jsonl",
	3253
	]
	],
	"benchmark": null,
	"strengths": [
	"Middle-size family: more capable than 1.7B while still comfortable on 8GB VRAM.",
	"Several variants target ChatML/completion formatting, tool-call cleanup, and English-lock behavior."
	],
	"weaknesses": [
	"Some later 4B adapters, especially v5, know targeted facts but emit visible tool_call tags offline.",
	"Can leak base-model identity or policy/meta phrasing depending on prompt path."
	],
	"project_uses": [
	"Fast local prototyping and comparison against the 7B family.",
	"Source of good factual repair examples after stripping tool-call pollution."
	],
	"compute_requirements": "Inference/training: comfortable on RTX 3070 8GB in 4-bit. Full-module LoRA at r=16-32 was used historically; expect several GB VRAM and slower but practical training."
	},
	{
	"name": "qwen3-4b-instruct-2507-ben-franklin-v3-chatml-completions-lora",
	"adapter_dir": "adapters/qwen3-4b-instruct-2507-ben-franklin-v3-chatml-completions-lora",
	"size_bytes": 2355647101,
	"size_gb": 2.19,
	"adapter_safetensors_mb": 252.1,
	"sha256_adapter_model": "e6a6242d8200b0533c371296ea3c836ca3f4a4401162232bbbd02e572dcfd432",
	"base_model": "unsloth/Qwen3-4B-Instruct-2507-unsloth-bnb-4bit",
	"base_class": "Qwen3 4B Instruct 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"q_proj",
	"v_proj",
	"up_proj",
	"gate_proj",
	"k_proj",
	"down_proj",
	"o_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_4b_answer_only.jsonl",
	3253
	]
	],
	"benchmark": null,
	"strengths": [
	"Middle-size family: more capable than 1.7B while still comfortable on 8GB VRAM.",
	"Several variants target ChatML/completion formatting, tool-call cleanup, and English-lock behavior."
	],
	"weaknesses": [
	"Some later 4B adapters, especially v5, know targeted facts but emit visible tool_call tags offline.",
	"Can leak base-model identity or policy/meta phrasing depending on prompt path."
	],
	"project_uses": [
	"Fast local prototyping and comparison against the 7B family.",
	"Source of good factual repair examples after stripping tool-call pollution."
	],
	"compute_requirements": "Inference/training: comfortable on RTX 3070 8GB in 4-bit. Full-module LoRA at r=16-32 was used historically; expect several GB VRAM and slower but practical training."
	},
	{
	"name": "qwen3-4b-instruct-2507-ben-franklin-v4-toolcall-clean-lora",
	"adapter_dir": "adapters/qwen3-4b-instruct-2507-ben-franklin-v4-toolcall-clean-lora",
	"size_bytes": 1940397833,
	"size_gb": 1.81,
	"adapter_safetensors_mb": 252.1,
	"sha256_adapter_model": "c5b4e589ba3c3cd4a059b8e2563c21c247f1b980dd465b4cce254496ac53f9f2",
	"base_model": "unsloth/Qwen3-4B-Instruct-2507-unsloth-bnb-4bit",
	"base_class": "Qwen3 4B Instruct 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"o_proj",
	"gate_proj",
	"q_proj",
	"k_proj",
	"down_proj",
	"v_proj",
	"up_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_4b_toolcall_cleanup.jsonl",
	920
	]
	],
	"benchmark": null,
	"strengths": [
	"Middle-size family: more capable than 1.7B while still comfortable on 8GB VRAM.",
	"Several variants target ChatML/completion formatting, tool-call cleanup, and English-lock behavior.",
	"Targeted cleanup of visible tool_call artifacts."
	],
	"weaknesses": [
	"Some later 4B adapters, especially v5, know targeted facts but emit visible tool_call tags offline.",
	"Can leak base-model identity or policy/meta phrasing depending on prompt path."
	],
	"project_uses": [
	"Fast local prototyping and comparison against the 7B family.",
	"Source of good factual repair examples after stripping tool-call pollution."
	],
	"compute_requirements": "Inference/training: comfortable on RTX 3070 8GB in 4-bit. Full-module LoRA at r=16-32 was used historically; expect several GB VRAM and slower but practical training."
	},
	{
	"name": "qwen3-4b-instruct-2507-ben-franklin-v5-english-lock-lora",
	"adapter_dir": "adapters/qwen3-4b-instruct-2507-ben-franklin-v5-english-lock-lora",
	"size_bytes": 1940396707,
	"size_gb": 1.81,
	"adapter_safetensors_mb": 252.1,
	"sha256_adapter_model": "1b53f3a5d4dd002990dcea61ba2fc79fa57b391d430b66069b9ac0e846ed39df",
	"base_model": "unsloth/Qwen3-4B-Instruct-2507-unsloth-bnb-4bit",
	"base_class": "Qwen3 4B Instruct 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"gate_proj",
	"k_proj",
	"v_proj",
	"up_proj",
	"o_proj",
	"down_proj",
	"q_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_4b_english_lock_cleanup.jsonl",
	816
	]
	],
	"benchmark": {
	"score": -92,
	"flags": {
	"tool_call": 15,
	"continuity_miss": 1
	},
	"bench_file": "benchmarks/franklin_coherence/franklin_coherence_20260623_080144.json",
	"html": "benchmarks/franklin_coherence/franklin_coherence_20260623_080144.html"
	},
	"strengths": [
	"Middle-size family: more capable than 1.7B while still comfortable on 8GB VRAM.",
	"Several variants target ChatML/completion formatting, tool-call cleanup, and English-lock behavior.",
	"Contains useful cleaned English/factual phrasing, including better Craven/Hewson material.",
	"Benchmark score: -92 with flags {'tool_call': 15, 'continuity_miss': 1}."
	],
	"weaknesses": [
	"Some later 4B adapters, especially v5, know targeted facts but emit visible tool_call tags offline.",
	"Can leak base-model identity or policy/meta phrasing depending on prompt path.",
	"Offline benchmark showed severe visible tool_call tag regression."
	],
	"project_uses": [
	"Fast local prototyping and comparison against the 7B family.",
	"Source of good factual repair examples after stripping tool-call pollution."
	],
	"compute_requirements": "Inference/training: comfortable on RTX 3070 8GB in 4-bit. Full-module LoRA at r=16-32 was used historically; expect several GB VRAM and slower but practical training."
	},
	{
	"name": "qwen3-1.7b-ben-franklin-identity-reinforced-lora",
	"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-identity-reinforced-lora",
	"size_bytes": 1062390080,
	"size_gb": 0.99,
	"adapter_safetensors_mb": 133.0,
	"sha256_adapter_model": "ba4df98e8adfda7dc726bbe5662c7db7fc1893d9caba7725a1a240bcb2d6d517",
	"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
	"base_class": "Qwen3 1.7B 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"q_proj",
	"gate_proj",
	"up_proj",
	"o_proj",
	"k_proj",
	"down_proj",
	"v_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	]
	],
	"benchmark": null,
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen3-1.7b-ben-franklin-openai-expanded-lora",
	"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-openai-expanded-lora",
	"size_bytes": 1289381928,
	"size_gb": 1.2,
	"adapter_safetensors_mb": 133.0,
	"sha256_adapter_model": "d9d55ce9e2e74337783c34712246022452d333eeb4386d0cdde7e1fc01f8bf86",
	"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
	"base_class": "Qwen3 1.7B 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"q_proj",
	"v_proj",
	"k_proj",
	"up_proj",
	"gate_proj",
	"down_proj",
	"o_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	]
	],
	"benchmark": null,
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen3-1.7b-ben-franklin-thinking-lora",
	"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-lora",
	"size_bytes": 1062519403,
	"size_gb": 0.99,
	"adapter_safetensors_mb": 133.0,
	"sha256_adapter_model": "5f5730bb9f0c8bc7e2b0858d35ecca87ea5a5ba46326738a06a0d54332262c45",
	"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
	"base_class": "Qwen3 1.7B 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"down_proj",
	"q_proj",
	"k_proj",
	"up_proj",
	"v_proj",
	"gate_proj",
	"o_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	]
	],
	"benchmark": null,
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen3-1.7b-ben-franklin-thinking-v2-lora",
	"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v2-lora",
	"size_bytes": 835640240,
	"size_gb": 0.78,
	"adapter_safetensors_mb": 133.0,
	"sha256_adapter_model": "0a1e6a1f82eac2f68860514f3ec98ef9794f3b4f7410798efdf9e07dbffe8f6a",
	"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
	"base_class": "Qwen3 1.7B 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"q_proj",
	"v_proj",
	"down_proj",
	"k_proj",
	"gate_proj",
	"o_proj",
	"up_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	],
	[
	"franklin_7b_coherence_repair_v2.jsonl",
	287
	]
	],
	"benchmark": null,
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen3-1.7b-ben-franklin-thinking-v3-negative-identity-lora",
	"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v3-negative-identity-lora",
	"size_bytes": 835668626,
	"size_gb": 0.78,
	"adapter_safetensors_mb": 133.0,
	"sha256_adapter_model": "4083f7365337be8a8d6126b0f4f5f2b7b944a810662693b2b8233b56b838955c",
	"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
	"base_class": "Qwen3 1.7B 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"q_proj",
	"v_proj",
	"k_proj",
	"up_proj",
	"down_proj",
	"o_proj",
	"gate_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	],
	[
	"franklin_7b_factual_coherence_repair_v3.jsonl",
	308
	]
	],
	"benchmark": null,
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen3-1.7b-ben-franklin-thinking-v4-balanced-lora",
	"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v4-balanced-lora",
	"size_bytes": 835674029,
	"size_gb": 0.78,
	"adapter_safetensors_mb": 133.0,
	"sha256_adapter_model": "6a956e6c48621f38ca679f98d1766e37df8a96f8017eb7d771cfba537d30f8c9",
	"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
	"base_class": "Qwen3 1.7B 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"k_proj",
	"q_proj",
	"down_proj",
	"v_proj",
	"gate_proj",
	"up_proj",
	"o_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	]
	],
	"benchmark": null,
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen3-1.7b-ben-franklin-thinking-v5-ood-fixed-lora",
	"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v5-ood-fixed-lora",
	"size_bytes": 835640341,
	"size_gb": 0.78,
	"adapter_safetensors_mb": 133.0,
	"sha256_adapter_model": "ea0d36edc5f313bfee28cc3dc59daeaed392527c2d7f936a9f0b8004c5343d00",
	"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
	"base_class": "Qwen3 1.7B 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"v_proj",
	"up_proj",
	"q_proj",
	"gate_proj",
	"down_proj",
	"k_proj",
	"o_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	]
	],
	"benchmark": null,
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen3-1.7b-ben-franklin-thinking-v6-1-ood-fixed-lora",
	"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v6-1-ood-fixed-lora",
	"size_bytes": 1062413565,
	"size_gb": 0.99,
	"adapter_safetensors_mb": 133.0,
	"sha256_adapter_model": "7e3440142a1999e09b82a49d76d9c06238ae69695f766a388f9af36290612298",
	"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
	"base_class": "Qwen3 1.7B 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"v_proj",
	"k_proj",
	"q_proj",
	"up_proj",
	"gate_proj",
	"down_proj",
	"o_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	]
	],
	"benchmark": null,
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen3-1.7b-ben-franklin-thinking-v6-contrastive-lora",
	"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v6-contrastive-lora",
	"size_bytes": 1743156212,
	"size_gb": 1.62,
	"adapter_safetensors_mb": 133.0,
	"sha256_adapter_model": "671973ebaf7eddb213a1ba49edff9b6ebaed7c73a8f95e8f7908217a49a1d2cb",
	"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
	"base_class": "Qwen3 1.7B 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"down_proj",
	"q_proj",
	"o_proj",
	"k_proj",
	"v_proj",
	"gate_proj",
	"up_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	]
	],
	"benchmark": null,
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen3-1.7b-ben-franklin-thinking-v7-natural-dialogue-lora",
	"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v7-natural-dialogue-lora",
	"size_bytes": 1289387473,
	"size_gb": 1.2,
	"adapter_safetensors_mb": 133.0,
	"sha256_adapter_model": "11d38f565f7c80d7320fc85d50563e2cc6d0f94eb53e1718883578d109b31915",
	"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
	"base_class": "Qwen3 1.7B 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"o_proj",
	"up_proj",
	"v_proj",
	"q_proj",
	"down_proj",
	"k_proj",
	"gate_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	]
	],
	"benchmark": null,
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark.",
	"Focused on more natural short conversational replies."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen3-1.7b-ben-franklin-thinking-v8-minimal-thought-lora",
	"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v8-minimal-thought-lora",
	"size_bytes": 1062476446,
	"size_gb": 0.99,
	"adapter_safetensors_mb": 133.0,
	"sha256_adapter_model": "41bdd23b0760d4e57d96423622901dedca1ef8cf49d551911e41b6cc4133f06f",
	"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
	"base_class": "Qwen3 1.7B 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"v_proj",
	"k_proj",
	"o_proj",
	"down_proj",
	"gate_proj",
	"q_proj",
	"up_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	]
	],
	"benchmark": null,
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark.",
	"Focused on reducing visible thought/over-reasoning style."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen3-1.7b-ben-franklin-thinking-v9-factual-dialogue-lora",
	"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v9-factual-dialogue-lora",
	"size_bytes": 1743169702,
	"size_gb": 1.62,
	"adapter_safetensors_mb": 133.0,
	"sha256_adapter_model": "9b74f8d869a5f1fd5ba1f1b55b3ed2ff8df510afe80a80fdf63ae20a9a01bbb9",
	"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
	"base_class": "Qwen3 1.7B 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"v_proj",
	"q_proj",
	"k_proj",
	"down_proj",
	"gate_proj",
	"up_proj",
	"o_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	],
	[
	"franklin_7b_factual_coherence_repair_v3.jsonl",
	308
	]
	],
	"benchmark": null,
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark.",
	"Focused on factual dialogue and hard Franklin biography prompts."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	},
	{
	"name": "qwen3-1.7b-ben-franklin-thinking-v9-from-v2-factual-dialogue-lora",
	"adapter_dir": "adapters/qwen3-1.7b-ben-franklin-thinking-v9-from-v2-factual-dialogue-lora",
	"size_bytes": 1743169476,
	"size_gb": 1.62,
	"adapter_safetensors_mb": 133.0,
	"sha256_adapter_model": "b90625341d6c7c2e7cc12597b0f3a3441bebbe46cba1d25e0234920c13134afa",
	"base_model": "unsloth/Qwen3-1.7B-unsloth-bnb-4bit",
	"base_class": "Qwen3 1.7B 4-bit",
	"lora_r": 32,
	"lora_alpha": 64,
	"target_modules": [
	"v_proj",
	"up_proj",
	"q_proj",
	"k_proj",
	"o_proj",
	"down_proj",
	"gate_proj"
	],
	"data_mix": [
	[
	"franklin_qwen3_8b_chatml_answer_clean.jsonl",
	2400
	],
	[
	"franklin_7b_coherence_repair_v2.jsonl",
	287
	],
	[
	"franklin_7b_factual_coherence_repair_v3.jsonl",
	308
	]
	],
	"benchmark": null,
	"strengths": [
	"Largest Benjamin Franklin LoRA family proven trainable on this RTX 3070 8GB machine.",
	"Best base reasoning/coherence among the local Franklin adapters.",
	"Good short-turn continuity in the coherence benchmark.",
	"Focused on factual dialogue and hard Franklin biography prompts."
	],
	"weaknesses": [
	"Qwen2.5 7B base is already highly steerable, so improvements over the prompted base are modest.",
	"q/v-only LoRA is weak for implanting stubborn factual corrections.",
	"Craven Street/Hewson factuality remains unreliable unless retrieval/prompt context is supplied."
	],
	"project_uses": [
	"Conversational Franklin persona in local apps.",
	"A strong baseline for RAG-backed historical character demos.",
	"Best starting point for further 7B experiments."
	],
	"compute_requirements": "Inference: RTX 3070 8GB works in 4-bit with the adapter; expect roughly 6-7GB VRAM. Training proven only with q_proj/v_proj, r=4 or r=8, max_seq_length=512, batch_size=1, gradient_accumulation=16; full-module LoRA is not recommended on 8GB."
	}
	]
	}