| { |
| "model_type": "GeoDavidCollective", |
| "architecture": "ProjectiveHead Enhanced Multi-Expert System", |
| "framework": "pytorch", |
| "version": "1.0", |
| "trained_epoch": 10, |
| "training_date": "2025-10-28T03:34:06.000667", |
| "num_blocks": 9, |
| "total_parameters": 884327310, |
| "num_timestep_bins": 100, |
| "num_patterns_per_bin": 10, |
| "block_configs": { |
| "down_0": { |
| "input_dim": 320, |
| "scale_dim": 128, |
| "use_belly": true, |
| "belly_expand": 2.0, |
| "num_experts": 3, |
| "num_gate_heads": 3, |
| "projective_head": "auto" |
| }, |
| "down_1": { |
| "input_dim": 640, |
| "scale_dim": 192, |
| "use_belly": true, |
| "belly_expand": 2.0, |
| "num_experts": 3, |
| "num_gate_heads": 3, |
| "projective_head": "auto" |
| }, |
| "down_2": { |
| "input_dim": 1280, |
| "scale_dim": 256, |
| "use_belly": true, |
| "belly_expand": 2.0, |
| "num_experts": 3, |
| "num_gate_heads": 3, |
| "projective_head": "auto" |
| }, |
| "down_3": { |
| "input_dim": 1280, |
| "scale_dim": 256, |
| "use_belly": true, |
| "belly_expand": 2.0, |
| "num_experts": 3, |
| "num_gate_heads": 3, |
| "projective_head": "auto" |
| }, |
| "mid": { |
| "input_dim": 1280, |
| "scale_dim": 256, |
| "use_belly": true, |
| "belly_expand": 1.5, |
| "num_experts": 4, |
| "num_gate_heads": 4, |
| "projective_head": "custom" |
| }, |
| "up_0": { |
| "input_dim": 1280, |
| "scale_dim": 256, |
| "use_belly": true, |
| "belly_expand": 2.0, |
| "num_experts": 3, |
| "num_gate_heads": 3, |
| "projective_head": "auto" |
| }, |
| "up_1": { |
| "input_dim": 1280, |
| "scale_dim": 256, |
| "use_belly": true, |
| "belly_expand": 2.0, |
| "num_experts": 3, |
| "num_gate_heads": 3, |
| "projective_head": "auto" |
| }, |
| "up_2": { |
| "input_dim": 640, |
| "scale_dim": 192, |
| "use_belly": true, |
| "belly_expand": 2.0, |
| "num_experts": 3, |
| "num_gate_heads": 3, |
| "projective_head": "auto" |
| }, |
| "up_3": { |
| "input_dim": 320, |
| "scale_dim": 128, |
| "use_belly": true, |
| "belly_expand": 1.5, |
| "num_experts": 3, |
| "num_gate_heads": 3, |
| "projective_head": "auto" |
| } |
| }, |
| "block_weights": { |
| "down_0": 0.8, |
| "down_1": 1.0, |
| "down_2": 1.2, |
| "down_3": 1.3, |
| "mid": 1.5, |
| "up_0": 1.3, |
| "up_1": 1.2, |
| "up_2": 1.0, |
| "up_3": 0.8 |
| }, |
| "loss_config": { |
| "feature_similarity_weight": 0.4, |
| "rose_weight": 0.25, |
| "ce_weight": 0.15, |
| "pattern_diversity_weight": 0.05, |
| "cayley_weight": 0.1, |
| "cantor_coherence_weight": 0.05, |
| "use_soft_assignment": true, |
| "temperature": 0.1, |
| "cayley_volume_floor": 0.0001, |
| "cayley_chaos_scale": 1.0, |
| "cayley_edge_weight": 0.5, |
| "cayley_gram_weight": 0.1 |
| }, |
| "training": { |
| "base_model": "runwayml/stable-diffusion-v1-5", |
| "sd_blocks_used": [ |
| "down_0", |
| "down_1", |
| "down_2", |
| "down_3", |
| "mid", |
| "up_0", |
| "up_1", |
| "up_2", |
| "up_3" |
| ], |
| "dataset": { |
| "type": "SymbolicPromptDataset", |
| "num_samples": 10000, |
| "complexity_distribution": { |
| "1": 0.05, |
| "2": 0.15, |
| "3": 0.4, |
| "4": 0.25, |
| "5": 0.15 |
| }, |
| "seed": 42 |
| }, |
| "batch_size": 16, |
| "num_epochs": 10, |
| "optimizer": { |
| "type": "AdamW", |
| "learning_rate": 0.001, |
| "weight_decay": 0.001 |
| }, |
| "pool_mode": "mean", |
| "checkpoint_interval": 2, |
| "num_workers": 2, |
| "pin_memory": true |
| }, |
| "feature_extraction": { |
| "method": "SD1.5 UNet Hooks", |
| "spatial_features": true, |
| "pooling": "mean", |
| "dtype": "float32" |
| }, |
| "capabilities": { |
| "timestep_classification": true, |
| "pattern_classification": true, |
| "joint_classification": true, |
| "num_classes": 1000, |
| "geometric_constraints": true, |
| "multi_expert_routing": true |
| }, |
| "companions": { |
| "type": "GeoDavidCompanion", |
| "timestep_head": "ProjectiveHead", |
| "pattern_head": "ProjectiveHead", |
| "geometric_features": [ |
| "cayley_menger_volume", |
| "edge_lengths", |
| "gram_matrix" |
| ], |
| "loss_functions": [ |
| "rose", |
| "cayley", |
| "cantor" |
| ] |
| } |
| } |