smol-training-playbook

Running on CPU Upgrade

App Files Community

Edit text inside embeds

#12

by loubnabnl HF Staff - opened 7 days ago

base: refs/heads/main

←

from: refs/pr/12

Discussion Files changed

+18

-18

Files changed (5) hide show

app/src/content/embeds/ablation-study.html +2 -2
app/src/content/embeds/attention-mechanisms.html +8 -8
app/src/content/embeds/model-architecture-decision-flowchart.html +2 -2
app/src/content/embeds/train-model-decision-flowchart.html +5 -5
app/src/content/embeds/training-compass.html +1 -1

app/src/content/embeds/ablation-study.html CHANGED Viewed

@@ -121,7 +121,7 @@
             const leftChart = document.createElement('div');
             leftChart.className = 'chart-container';
             leftChart.innerHTML = `
-        <div class="chart-title">From scratch ablation</div>
         <div class="chart-card">
           <div class="chart-svg"></div>
         </div>
@@ -130,7 +130,7 @@
             const rightChart = document.createElement('div');
             rightChart.className = 'chart-container';
             rightChart.innerHTML = `
-        <div class="chart-title">Annealing ablation (vs Main pretraining)</div>
         <div class="chart-card">
           <div class="chart-svg"></div>
         </div>

             const leftChart = document.createElement('div');
             leftChart.className = 'chart-container';
             leftChart.innerHTML = `
+        <div class="chart-title">From-scratch ablation</div>
         <div class="chart-card">
           <div class="chart-svg"></div>
         </div>
             const rightChart = document.createElement('div');
             rightChart.className = 'chart-container';
             rightChart.innerHTML = `
+        <div class="chart-title">Annealing ablation (vs main pretraining)</div>
         <div class="chart-card">
           <div class="chart-svg"></div>
         </div>

app/src/content/embeds/attention-mechanisms.html CHANGED Viewed

@@ -573,7 +573,7 @@
                     .stroke('none');
                 // CLKV text below the node (multi-line)
-                svg.text('Compressed\nLatent KV')
                     .font({
                         family: 'Arial, sans-serif',
                         size: 9,
@@ -607,7 +607,7 @@
                 // Add single "projection" label centered between both lines
                 const centerTextX = (clkvX + vGroupRightX) / 2 - 5;  // Shifted slightly to the right
                 const centerTextY = (vGroupTopY + kGroupBottomY) / 2;
-                svg.text('projection')
                     .font({
                         family: 'Arial, sans-serif',
                         size: 9,
@@ -659,15 +659,15 @@
                 </div>
                 <div class="diagrams-grid">
-                    <!-- DIAGRAM 1: Multi Head Attention -->
                     <div class="diagram-container">
-                        <div class="diagram-title">Multi head attention</div>
                         <div class="diagram-svg-container" id="diagram-1"></div>
                     </div>
-                    <!-- DIAGRAM 2: Multi Query Attention -->
                     <div class="diagram-container">
-                        <div class="diagram-title">Multi query attention</div>
                         <div class="diagram-svg-container" id="diagram-2"></div>
                     </div>
@@ -677,9 +677,9 @@
                         <div class="diagram-svg-container" id="diagram-3"></div>
                     </div>
-                    <!-- DIAGRAM 4: Multi Head Latent Attention -->
                     <div class="diagram-container">
-                        <div class="diagram-title">Multi head latent attention</div>
                         <div class="diagram-svg-container" id="diagram-4"></div>
                     </div>
                 </div>

                     .stroke('none');
                 // CLKV text below the node (multi-line)
+                svg.text('Compressed\nlatent KV')
                     .font({
                         family: 'Arial, sans-serif',
                         size: 9,
                 // Add single "projection" label centered between both lines
                 const centerTextX = (clkvX + vGroupRightX) / 2 - 5;  // Shifted slightly to the right
                 const centerTextY = (vGroupTopY + kGroupBottomY) / 2;
+                svg.text('Projection')
                     .font({
                         family: 'Arial, sans-serif',
                         size: 9,
                 </div>
                 <div class="diagrams-grid">
+                    <!-- DIAGRAM 1: Multi-head Attention -->
                     <div class="diagram-container">
+                        <div class="diagram-title">Multi-head attention</div>
                         <div class="diagram-svg-container" id="diagram-1"></div>
                     </div>
+                    <!-- DIAGRAM 2: Multi-query Attention -->
                     <div class="diagram-container">
+                        <div class="diagram-title">Multi-query attention</div>
                         <div class="diagram-svg-container" id="diagram-2"></div>
                     </div>
                         <div class="diagram-svg-container" id="diagram-3"></div>
                     </div>
+                    <!-- DIAGRAM 4: Multi-head Latent Attention -->
                     <div class="diagram-container">
+                        <div class="diagram-title">Multi-head latent attention</div>
                         <div class="diagram-svg-container" id="diagram-4"></div>
                     </div>
                 </div>

app/src/content/embeds/model-architecture-decision-flowchart.html CHANGED Viewed

@@ -144,9 +144,9 @@
             // Define the flowchart structure - Model Architecture Decision
             const nodes = [
                 { id: 'A', label: 'Where will this model run?', type: 'question', x: 400, y: 100 },
-                { id: 'B', label: 'Edge/Phones\nMemory-constrained environments', type: 'decision', x: 180, y: 320 },
                 { id: 'C', label: 'Other\nMore memory available', type: 'decision', x: 620, y: 320 },
-                { id: 'D', label: 'Dense (most cases)\nHybrid or other (for experienced teams)', type: 'success', x: 180, y: 540 },
                 { id: 'E', label: 'What\'s your team\'s expertise?', type: 'question', x: 620, y: 540 },
                 { id: 'F', label: 'First LLM training', type: 'decision', x: 380, y: 760 },
                 { id: 'G', label: 'Experienced\nComfortable with dense', type: 'decision', x: 620, y: 760 },

             // Define the flowchart structure - Model Architecture Decision
             const nodes = [
                 { id: 'A', label: 'Where will this model run?', type: 'question', x: 400, y: 100 },
+                { id: 'B', label: 'Edge/phones\nMemory-constrained environments', type: 'decision', x: 180, y: 320 },
                 { id: 'C', label: 'Other\nMore memory available', type: 'decision', x: 620, y: 320 },
+                { id: 'D', label: 'Dense (most cases)\nHybrid (for experienced teams)', type: 'success', x: 180, y: 540 },
                 { id: 'E', label: 'What\'s your team\'s expertise?', type: 'question', x: 620, y: 540 },
                 { id: 'F', label: 'First LLM training', type: 'decision', x: 380, y: 760 },
                 { id: 'G', label: 'Experienced\nComfortable with dense', type: 'decision', x: 620, y: 760 },

app/src/content/embeds/train-model-decision-flowchart.html CHANGED Viewed

@@ -149,15 +149,15 @@
                 { id: 'B', label: 'Can existing models handle your use case?', type: 'question', x: 400, y: 240 },
                 { id: 'C', label: 'Existing models work well just with prompting', type: 'decision', x: 200, y: 400 },
                 { id: 'D', label: 'Prompting isn\'t enough', type: 'decision', x: 600, y: 400 },
-                { id: 'E', label: '❌\nDon\'t train. Use existing models', type: 'success', x: 200, y: 560 },
-                { id: 'F', label: 'Can finetuning solve your problem?', type: 'question', x: 600, y: 600 },
-                { id: 'G', label: 'Finetuning works (post-training/continual pretraining)', type: 'decision', x: 450, y: 760 },
-                { id: 'H', label: 'Finetuning cannot solve your problem', type: 'decision', x: 750, y: 760 },
                 { id: 'I', label: '❌\nDon\'t train from scratch', type: 'success', x: 450, y: 920 },
                 { id: 'J', label: 'Train a model under one of these categories', type: 'category', x: 750, y: 960 },
                 { id: 'K', label: '🔬\nResearch', type: 'category', x: 600, y: 1120 },
                 { id: 'L', label: '🏭\nProduction', type: 'category', x: 750, y: 1120 },
-                { id: 'N', label: '🌐\nStrategic Open-Source', type: 'category', x: 970, y: 1120 }
             ];
             const links = [

                 { id: 'B', label: 'Can existing models handle your use case?', type: 'question', x: 400, y: 240 },
                 { id: 'C', label: 'Existing models work well just with prompting', type: 'decision', x: 200, y: 400 },
                 { id: 'D', label: 'Prompting isn\'t enough', type: 'decision', x: 600, y: 400 },
+                { id: 'E', label: '❌\nDon\'t train; use existing models', type: 'success', x: 200, y: 560 },
+                { id: 'F', label: 'Can fine-tuning solve your problem?', type: 'question', x: 600, y: 600 },
+                { id: 'G', label: 'Fine-tuning works (post-training/continual pretraining)', type: 'decision', x: 450, y: 760 },
+                { id: 'H', label: 'Fine-tuning cannot solve your problem', type: 'decision', x: 750, y: 760 },
                 { id: 'I', label: '❌\nDon\'t train from scratch', type: 'success', x: 450, y: 920 },
                 { id: 'J', label: 'Train a model under one of these categories', type: 'category', x: 750, y: 960 },
                 { id: 'K', label: '🔬\nResearch', type: 'category', x: 600, y: 1120 },
                 { id: 'L', label: '🏭\nProduction', type: 'category', x: 750, y: 1120 },
+                { id: 'N', label: '🌐\nStrategic Open Source', type: 'category', x: 970, y: 1120 }
             ];
             const links = [

app/src/content/embeds/training-compass.html CHANGED Viewed

@@ -176,7 +176,7 @@
           <div class="compass-stage">
             <div class="stage-header">How to train?</div>
             <div class="stage-items">
-              <div class="stage-item">Setup infra</div>
               <div class="stage-item">Training framework</div>
               <div class="stage-item">Handling loss spikes</div>
               <div class="stage-item">Midtraining</div>

           <div class="compass-stage">
             <div class="stage-header">How to train?</div>
             <div class="stage-items">
+              <div class="stage-item">Infrastructure setup</div>
               <div class="stage-item">Training framework</div>
               <div class="stage-item">Handling loss spikes</div>
               <div class="stage-item">Midtraining</div>