LH-Tech-AI committed on
Commit
3a2a696
·
verified ·
1 Parent(s): 2b06042

Create curriculum.html

Browse files
Files changed (1) hide show
  1. curriculum.html +315 -0
curriculum.html ADDED
@@ -0,0 +1,315 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!DOCTYPE html>
2
+ <html lang="en">
3
+ <head>
4
+ <meta charset="UTF-8">
5
+ <meta name="viewport" content="width=device-width, initial-scale=1.0">
6
+ <title>SupraLabs | Information Routing: Dynamic Curriculum Shifting</title>
7
+ <script src="https://cdn.jsdelivr.net/npm/chart.js"></script>
8
+ <style>
9
+ :root {
10
+ --bg: #0f0f0f;
11
+ --surface: #1a1a1a;
12
+ --border: #333;
13
+ --text: #e0e0e0;
14
+ --accent: #536bfe; /* Supra Blue */
15
+ --muted: #888;
16
+ --success: #00e676;
17
+ --warning: #ffb300;
18
+ --font-mono: 'JetBrains Mono', 'Fira Code', monospace;
19
+ }
20
+ * { margin: 0; padding: 0; box-sizing: border-box; }
21
+ body {
22
+ background-color: var(--bg);
23
+ color: var(--text);
24
+ font-family: 'Inter', -apple-system, sans-serif;
25
+ line-height: 1.6;
26
+ padding: 2rem;
27
+ }
28
+ code, pre, .mono { font-family: var(--font-mono); }
29
+ .container { max-width: 1000px; margin: 0 auto; }
30
+ header {
31
+ border-bottom: 2px solid var(--border);
32
+ padding-bottom: 2rem;
33
+ margin-bottom: 3rem;
34
+ display: flex;
35
+ justify-content: space-between;
36
+ align-items: flex-end;
37
+ }
38
+ .logo-area a { text-decoration: none; color: inherit; }
39
+ .logo-area h1 {
40
+ font-size: 1.2rem;
41
+ text-transform: uppercase;
42
+ letter-spacing: 2px;
43
+ color: var(--accent);
44
+ line-height: 1;
45
+ display: flex;
46
+ align-items: center;
47
+ gap: 10px;
48
+ }
49
+ nav a {
50
+ color: var(--text);
51
+ text-decoration: none;
52
+ margin-left: 1.5rem;
53
+ font-size: 0.9rem;
54
+ border-bottom: 1px solid transparent;
55
+ }
56
+ nav a:hover { border-bottom: 1px solid var(--accent); }
57
+ .hero { margin-bottom: 4rem; }
58
+ .hero h2 { font-size: 3rem; line-height: 1.1; margin-bottom: 1.5rem; font-weight: 800; }
59
+ .hero p { font-size: 1.2rem; color: var(--muted); max-width: 750px; }
60
+ .section-label {
61
+ display: block;
62
+ font-family: var(--font-mono);
63
+ color: var(--accent);
64
+ font-size: 0.8rem;
65
+ margin-top: 3rem;
66
+ margin-bottom: 1rem;
67
+ text-transform: uppercase;
68
+ }
69
+ .card { background: var(--surface); border: 1px solid var(--border); padding: 2.5rem; margin-bottom: 2rem; }
70
+ h3 { font-size: 1.6rem; margin-bottom: 1rem; font-weight: 700; }
71
+ p { margin-bottom: 1rem; color: #ccc; }
72
+ ul { margin-left: 1.5rem; margin-bottom: 1.5rem; }
73
+ li { margin-bottom: 0.5rem; }
74
+ .winner-badge { color: var(--success); font-weight: bold; font-family: var(--font-mono); }
75
+ .table-container { overflow-x: auto; margin: 2rem 0; border: 1px solid var(--border); }
76
+ table { width: 100%; border-collapse: collapse; text-align: left; font-size: 0.95rem; }
77
+ th, td { padding: 1rem; border-bottom: 1px solid var(--border); }
78
+ th { background-color: rgba(26, 26, 26, 0.8); font-family: var(--font-mono); color: var(--accent); font-size: 0.85rem; text-transform: uppercase; }
79
+ tr:hover { background-color: rgba(83, 107, 254, 0.05); }
80
+ .highlight-row { border-left: 4px solid var(--success); background-color: rgba(0, 230, 118, 0.02); }
81
+ .chart-box { background: var(--surface); border: 1px solid var(--border); padding: 2rem; margin-bottom: 2rem; }
82
+ .stats-grid {
83
+ display: grid;
84
+ grid-template-columns: 1fr 1fr 1fr;
85
+ gap: 1rem;
86
+ margin-top: 4rem;
87
+ border-top: 1px solid var(--border);
88
+ padding-top: 2rem;
89
+ }
90
+ .stat-box { padding: 1rem; border-left: 2px solid var(--accent); }
91
+ .stat-box small { display: block; color: var(--muted); font-family: var(--font-mono); }
92
+ footer { margin-top: 6rem; padding-bottom: 2rem; font-size: 0.8rem; color: var(--muted); text-align: center; }
93
+ @media (max-width: 768px) {
94
+ .hero h2 { font-size: 2rem; }
95
+ header { flex-direction: column; align-items: flex-start; gap: 1rem; }
96
+ nav a { margin-left: 0; margin-right: 1rem; }
97
+ .stats-grid { grid-template-columns: 1fr; }
98
+ }
99
+ </style>
100
+ </head>
101
+ <body>
102
+ <div class="container">
103
+ <header>
104
+ <div class="logo-area" style="font-size: 1.5em;">
105
+ <a href="index.html"><h1><img src="./image.png" style="height: 2em" alt="Logo"> SupraLabs_</h1></a>
106
+ </div>
107
+ <nav>
108
+ <a href="#summary">Core Learnings</a>
109
+ <a href="#benchmarks">Routing Matrix</a>
110
+ <a href="#charts">Visualizations</a>
111
+ <a href="https://huggingface.co/SupraLabs" target="_blank">HuggingFace</a>
112
+ </nav>
113
+ </header>
114
+
115
+ <section class="hero">
116
+ <h2>Experiment #7:<br>Information Routing &mdash; Curriculum Shifting</h2>
117
+ <p>An empirical evaluation of structured knowledge injection schedules inside parameter-constrained spaces. We subjected a optimized <strong>4,196,096 parameter architecture</strong> to a rigid budget of <strong>200,000,000 total tokens</strong> to test multi-distribution blending against raw uniform pooling.</p>
118
+ </section>
119
+
120
+ <span class="section-label" id="summary">// Syntactic_Preservation_&_Memory_Retainment</span>
121
+ <div class="card">
122
+ <h3>Curing Catastrophic Forgetting via Shifting Weights</h3>
123
+ <p>When training extremely compact language models, data sequencing determines memory stabilization boundaries. Our comparative routing sweep demonstrates that standard dataset pooling bottlenecks the structural capability of micro-networks:</p>
124
+ <ul>
125
+ <li><strong>The Failure of Rigid Sequential Partitioning:</strong> Processing data in unblended sequential stages (Hard Blocks) triggers devastating memory overwrites. As the training block moves from base syntax to intense facts, the network suffers a 39% language accuracy collapse (Wikitext PPL: 632.9).</li>
126
+ <li><strong>The Naive Pooling Limitation:</strong> Shoving all token distributions into a single, uniform mix from the start (Baseline) forces the small weights matrix to stabilize multiple contradictory targets simultaneously, degrading the final linguistic resolution (PPL: 556.7).</li>
127
+ <li><strong>The Shifting Weight Solution:</strong> Launching with structured syntax (TinyStories/Cosmo), moving into reasoning (Math), and finalizing with facts while preserving a mathematical logic holding current protects the weight paths. Language Perplexity drops cleanly to <strong>453.6</strong>.</li>
128
+ </ul>
129
+ </div>
130
+
131
+ <span class="section-label" id="benchmarks">// Knowledge_Injection_Routing_Matrix</span>
132
+ <div class="card" style="padding: 1.5rem;">
133
+ <h3>Empirical Scheduling Analytics</h3>
134
+ <p>All training pipelines utilize an identical 4096 vocabulary architecture. Downstream tracking processed zero-shot. Deceptive optimization targets (apparent pretrain loss) are directly falsified by true language modeling benchmarks.</p>
135
+
136
+ <div class="table-container">
137
+ <table>
138
+ <thead>
139
+ <tr>
140
+ <th>Benchmark / Metric</th>
141
+ <th style="color: var(--success)">Run 1: Shifting Weights (πŸ† Win)</th>
142
+ <th>Run 2: Hard Sequential Blocks</th>
143
+ <th>Run 3: Uniform Baseline Mix</th>
144
+ </tr>
145
+ </thead>
146
+ <tbody>
147
+ <tr>
148
+ <td class="mono">Routing Architecture</td>
149
+ <td style="color: var(--success)">Dynamic Weight Stepper</td>
150
+ <td>Static Linear Switches</td>
151
+ <td>Star Blend Pooling</td>
152
+ </tr>
153
+ <tr>
154
+ <td class="mono">Final Pretrain Step Loss (↓)</td>
155
+ <td>2.770</td>
156
+ <td class="winner-badge">2.458</td>
157
+ <td>2.690</td>
158
+ </tr>
159
+ <tr>
160
+ <td class="mono">Final Pretrain Train Loss (↓)</td>
161
+ <td>3.151</td>
162
+ <td class="winner-badge">2.817</td>
163
+ <td>3.114</td>
164
+ </tr>
165
+ <tr>
166
+ <td class="mono">ARC-Easy Zero-Shot (↑)</td>
167
+ <td>29.71%</td>
168
+ <td class="winner-badge">30.22%</td>
169
+ <td>30.18%</td>
170
+ </tr>
171
+ <tr>
172
+ <td class="mono">ARC-Easy Acc Norm (↑)</td>
173
+ <td>30.26%</td>
174
+ <td class="winner-badge">30.64%</td>
175
+ <td>30.47%</td>
176
+ </tr>
177
+ <tr>
178
+ <td class="mono">Wikitext Byte PPL (↓)</td>
179
+ <td class="winner-badge">3.1392</td>
180
+ <td>3.3410</td>
181
+ <td>3.2618</td>
182
+ </tr>
183
+ <tr>
184
+ <td class="mono">Wikitext Word PPL (↓)</td>
185
+ <td class="winner-badge" style="color: var(--success); font-weight: bold;">453.6715</td>
186
+ <td>632.9729</td>
187
+ <td>556.7454</td>
188
+ </tr>
189
+ <tr class="highlight-row">
190
+ <td style="font-weight: bold;">PRETRAIN COHERENCE</td>
191
+ <td style="color: var(--success); font-weight: bold;">SOTA BALANCE ARCHIEVED</td>
192
+ <td style="color: var(--warning)">Severe Memory Corruption</td>
193
+ <td>Information Dilution</td>
194
+ </tr>
195
+ </tbody>
196
+ </table>
197
+ </div>
198
+ </div>
199
+
200
+ <span class="section-label" id="charts">// Visualizing_Routing_Mechanics</span>
201
+ <div class="chart-box">
202
+ <h3>Linguistic Perplexity Splintering Across Routing Approaches</h3>
203
+ <div style="position: relative; height:350px; width:100%">
204
+ <canvas id="curriculumPplChart"></canvas>
205
+ </div>
206
+ </div>
207
+
208
+ <div class="chart-box">
209
+ <h3>The Apparent Loss Paradox: Pretrain Loss vs. True Structural Perplexity</h3>
210
+ <p style="font-size: 0.85rem; color: var(--muted); margin-bottom: 1.5rem;">Critical discovery: Rigid data blocking pushes the localized training loss down artificially, but causes severe out-of-distribution language collapse on core evaluation matrices.</p>
211
+ <div style="position: relative; height:350px; width:100%">
212
+ <canvas id="curriculumParadoxChart"></canvas>
213
+ </div>
214
+ </div>
215
+
216
+ <section class="stats-grid" id="hardware">
217
+ <div class="stat-box">
218
+ <small>TOTAL COMPUTE EXPOSURE</small>
219
+ <strong>200M Unified Steps</strong>
220
+ </div>
221
+ <div class="stat-box">
222
+ <small>MODEL GEOMETRY PROFILE</small>
223
+ <strong>3-Layer Shallow Wide SOTA</strong>
224
+ </div>
225
+ <div class="stat-box">
226
+ <small>SCHEDULING RESOLUTION</small>
227
+ <strong>4096 Vocab Pareto Bound</strong>
228
+ </div>
229
+ </section>
230
+
231
+ <footer>
232
+ <p>&copy; 2026 SupraLabs. High performance. Small footprints. Proudly open-source.</p>
233
+ </footer>
234
+ </div>
235
+
236
+ <script>
237
+ // Curriculum Perplexity Chart
238
+ const ctxCurrPpl = document.getElementById('curriculumPplChart').getContext('2d');
239
+ new Chart(ctxCurrPpl, {
240
+ type: 'bar',
241
+ data: {
242
+ labels: ['Run 1: Dynamic Shifting Weights', 'Run 2: Hard Blocks', 'Run 3: Uniform Baseline Mix'],
243
+ datasets: [{
244
+ label: 'Wikitext Word Perplexity (Lower = Better)',
245
+ data: [453.67, 632.97, 556.74],
246
+ backgroundColor: ['rgba(0, 230, 118, 0.3)', 'rgba(229, 57, 53, 0.2)', 'rgba(255, 179, 0, 0.2)'],
247
+ borderColor: ['#00e676', '#e53935', '#ffb300'],
248
+ borderWidth: 2
249
+ }]
250
+ },
251
+ options: {
252
+ responsive: true,
253
+ maintainAspectRatio: false,
254
+ plugins: { legend: { labels: { color: '#bbb' } } },
255
+ scales: {
256
+ y: { grid: { color: '#222' }, ticks: { color: '#888' } },
257
+ x: { grid: { display: false }, ticks: { color: '#aaa' } }
258
+ }
259
+ }
260
+ });
261
+
262
+ // Paradox Dual Axis Curve
263
+ const ctxCurrParadox = document.getElementById('curriculumParadoxChart').getContext('2d');
264
+ new Chart(ctxCurrParadox, {
265
+ type: 'line',
266
+ data: {
267
+ labels: ['Dynamic Shifting', 'Hard Sequential Blocks', 'Uniform Baseline Mix'],
268
+ datasets: [
269
+ {
270
+ label: 'Apparent Pretrain Train Loss (Lower = Deceptive ↓)',
271
+ data: [3.151, 2.817, 3.114],
272
+ borderColor: 'rgba(229, 57, 53, 0.5)',
273
+ backgroundColor: 'transparent',
274
+ yAxisID: 'yLoss',
275
+ tension: 0.1,
276
+ borderWidth: 2
277
+ },
278
+ {
279
+ label: 'True Linguistic Word Perplexity (Lower = Superior ↑)',
280
+ data: [453.67, 632.97, 556.74],
281
+ borderColor: '#536bfe',
282
+ backgroundColor: 'transparent',
283
+ yAxisID: 'yPpl',
284
+ tension: 0.1,
285
+ borderWidth: 3,
286
+ borderDash: [3, 3]
287
+ }
288
+ ]
289
+ },
290
+ options: {
291
+ responsive: true,
292
+ maintainAspectRatio: false,
293
+ plugins: { legend: { labels: { color: '#bbb' } } },
294
+ scales: {
295
+ x: { grid: { display: false }, ticks: { color: '#aaa' } },
296
+ yLoss: {
297
+ type: 'linear',
298
+ position: 'left',
299
+ title: { display: true, text: 'Pretrain Loss Baseline', color: 'rgba(229, 57, 53, 0.8)' },
300
+ grid: { color: '#222' },
301
+ ticks: { color: '#888' }
302
+ },
303
+ yPpl: {
304
+ type: 'linear',
305
+ position: 'right',
306
+ title: { display: true, text: 'Linguistic Word Perplexity', color: '#536bfe' },
307
+ grid: { display: false },
308
+ ticks: { color: '#888' }
309
+ }
310
+ }
311
+ }
312
+ });
313
+ </script>
314
+ </body>
315
+ </html>