AbstractPhil's picture
Update config.json
6a8a9d6 verified
Raw
History Blame
4.2 kB
{
"model_type": "GeoDavidCollective",
"architecture": "ProjectiveHead Enhanced Multi-Expert System",
"framework": "pytorch",
"version": "1.0",
"trained_epoch": 10,
"training_date": "2025-10-28T03:34:06.000667",
"num_blocks": 9,
"total_parameters": 884327310,
"num_timestep_bins": 100,
"num_patterns_per_bin": 10,
"block_configs": {
"down_0": {
"input_dim": 320,
"scale_dim": 128,
"use_belly": true,
"belly_expand": 2.0,
"num_experts": 3,
"num_gate_heads": 3,
"projective_head": "auto"
},
"down_1": {
"input_dim": 640,
"scale_dim": 192,
"use_belly": true,
"belly_expand": 2.0,
"num_experts": 3,
"num_gate_heads": 3,
"projective_head": "auto"
},
"down_2": {
"input_dim": 1280,
"scale_dim": 256,
"use_belly": true,
"belly_expand": 2.0,
"num_experts": 3,
"num_gate_heads": 3,
"projective_head": "auto"
},
"down_3": {
"input_dim": 1280,
"scale_dim": 256,
"use_belly": true,
"belly_expand": 2.0,
"num_experts": 3,
"num_gate_heads": 3,
"projective_head": "auto"
},
"mid": {
"input_dim": 1280,
"scale_dim": 256,
"use_belly": true,
"belly_expand": 1.5,
"num_experts": 4,
"num_gate_heads": 4,
"projective_head": "custom"
},
"up_0": {
"input_dim": 1280,
"scale_dim": 256,
"use_belly": true,
"belly_expand": 2.0,
"num_experts": 3,
"num_gate_heads": 3,
"projective_head": "auto"
},
"up_1": {
"input_dim": 1280,
"scale_dim": 256,
"use_belly": true,
"belly_expand": 2.0,
"num_experts": 3,
"num_gate_heads": 3,
"projective_head": "auto"
},
"up_2": {
"input_dim": 640,
"scale_dim": 192,
"use_belly": true,
"belly_expand": 2.0,
"num_experts": 3,
"num_gate_heads": 3,
"projective_head": "auto"
},
"up_3": {
"input_dim": 320,
"scale_dim": 128,
"use_belly": true,
"belly_expand": 1.5,
"num_experts": 3,
"num_gate_heads": 3,
"projective_head": "auto"
}
},
"block_weights": {
"down_0": 0.8,
"down_1": 1.0,
"down_2": 1.2,
"down_3": 1.3,
"mid": 1.5,
"up_0": 1.3,
"up_1": 1.2,
"up_2": 1.0,
"up_3": 0.8
},
"loss_config": {
"feature_similarity_weight": 0.4,
"rose_weight": 0.25,
"ce_weight": 0.15,
"pattern_diversity_weight": 0.05,
"cayley_weight": 0.1,
"cantor_coherence_weight": 0.05,
"use_soft_assignment": true,
"temperature": 0.1,
"cayley_volume_floor": 0.0001,
"cayley_chaos_scale": 1.0,
"cayley_edge_weight": 0.5,
"cayley_gram_weight": 0.1
},
"training": {
"base_model": "runwayml/stable-diffusion-v1-5",
"sd_blocks_used": [
"down_0",
"down_1",
"down_2",
"down_3",
"mid",
"up_0",
"up_1",
"up_2",
"up_3"
],
"dataset": {
"type": "SymbolicPromptDataset",
"num_samples": 10000,
"complexity_distribution": {
"1": 0.05,
"2": 0.15,
"3": 0.4,
"4": 0.25,
"5": 0.15
},
"seed": 42
},
"batch_size": 16,
"num_epochs": 10,
"optimizer": {
"type": "AdamW",
"learning_rate": 0.001,
"weight_decay": 0.001
},
"pool_mode": "mean",
"checkpoint_interval": 2,
"num_workers": 2,
"pin_memory": true
},
"feature_extraction": {
"method": "SD1.5 UNet Hooks",
"spatial_features": true,
"pooling": "mean",
"dtype": "float32"
},
"capabilities": {
"timestep_classification": true,
"pattern_classification": true,
"joint_classification": true,
"num_classes": 1000,
"geometric_constraints": true,
"multi_expert_routing": true
},
"companions": {
"type": "GeoDavidCompanion",
"timestep_head": "ProjectiveHead",
"pattern_head": "ProjectiveHead",
"geometric_features": [
"cayley_menger_volume",
"edge_lengths",
"gram_matrix"
],
"loss_functions": [
"rose",
"cayley",
"cantor"
]
}
}