Transformers-tenets / src /fragments /warmup_demo.html
Molbap's picture
Molbap HF Staff
Recommit with PNGs tracked by LFS
c34c7de
raw
history blame
11.7 kB
<style>
.warmup-demo body {
font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif;
margin: 0;
padding: 20px;
background-color: #f5f5f5;
}
.warmup-demo .container {
max-width: 1200px;
margin: 0 auto;
background: white;
border-radius: 12px;
padding: 30px;
box-shadow: 0 4px 6px rgba(0, 0, 0, 0.1);
}
.warmup-demo h1 {
text-align: center;
color: #333;
margin-bottom: 10px;
}
.warmup-demo .subtitle {
text-align: center;
color: #666;
margin-bottom: 30px;
font-size: 16px;
}
.warmup-demo .demo-container {
display: flex;
gap: 40px;
margin-bottom: 30px;
}
.warmup-demo .side {
flex: 1;
border: 2px solid #ddd;
border-radius: 8px;
padding: 20px;
background: #fafafa;
}
.warmup-demo .side h2 {
text-align: center;
margin-top: 0;
color: #333;
}
.warmup-demo .no-warmup h2 {
color: #d63384;
}
.warmup-demo .with-warmup h2 {
color: #198754;
}
.warmup-demo .memory-area {
height: 400px;
border: 2px dashed #ccc;
border-radius: 6px;
padding: 10px;
margin: 20px 0;
background: #fff;
position: relative;
overflow: hidden;
}
.warmup-demo .layer-box {
width: 80px;
height: 30px;
border: 2px solid #666;
border-radius: 4px;
margin: 3px;
display: inline-block;
position: relative;
background: #fff;
transition: all 0.3s ease;
}
.warmup-demo .layer-box.allocating {
background: #e9ecef;
border-color: #adb5bd;
}
.warmup-demo .layer-box.allocating::after {
content: "malloc";
position: absolute;
top: 50%;
left: 50%;
transform: translate(-50%, -50%);
font-size: 10px;
color: #666;
font-weight: bold;
}
.warmup-demo .layer-box.loaded {
background: #d1e7dd;
border-color: #198754;
}
.warmup-demo .layer-box.loaded::after {
content: "data";
position: absolute;
top: 50%;
left: 50%;
transform: translate(-50%, -50%);
font-size: 10px;
color: #198754;
font-weight: bold;
}
.warmup-demo .warmup-container {
width: 100%;
height: 60px;
border: 3px solid #666;
border-radius: 6px;
margin-bottom: 20px;
background: #fff;
position: relative;
overflow: hidden;
}
.warmup-demo .warmup-container.allocated {
border-color: #0d6efd;
background: #e7f1ff;
}
.warmup-demo .warmup-container::before {
content: "Pre-allocated Memory Pool";
position: absolute;
top: 50%;
left: 50%;
transform: translate(-50%, -50%);
font-size: 14px;
color: #666;
font-weight: bold;
z-index: 1;
}
.warmup-demo .warmup-container.allocated::before {
color: #0d6efd;
}
.warmup-demo .warmup-fill {
height: 100%;
background: linear-gradient(90deg, #198754, #20c997);
width: 0%;
transition: width 0.5s ease;
border-radius: 3px;
position: relative;
z-index: 2;
}
.warmup-demo .warmup-fill::after {
content: "Layer Data Loading";
position: absolute;
top: 50%;
left: 50%;
transform: translate(-50%, -50%);
font-size: 12px;
color: white;
font-weight: bold;
white-space: nowrap;
}
.warmup-demo .timing {
text-align: center;
font-size: 24px;
font-weight: bold;
margin: 15px 0;
min-height: 30px;
}
.warmup-demo .no-warmup .timing {
color: #d63384;
}
.warmup-demo .with-warmup .timing {
color: #198754;
}
.warmup-demo .controls {
text-align: center;
margin: 30px 0;
}
.warmup-demo .btn {
background: #0d6efd;
color: white;
border: none;
padding: 12px 24px;
border-radius: 6px;
font-size: 16px;
cursor: pointer;
margin: 0 10px;
transition: background 0.3s ease;
}
.warmup-demo .btn:hover {
background: #0b5ed7;
}
.warmup-demo .btn:disabled {
background: #6c757d;
cursor: not-allowed;
}
.warmup-demo .description {
background: #f8f9fa;
padding: 15px;
border-radius: 6px;
margin-top: 15px;
font-size: 14px;
line-height: 1.5;
}
.warmup-demo .phase-indicator {
font-size: 14px;
color: #666;
text-align: center;
margin-top: 10px;
min-height: 20px;
}
.warmup-demo .layer-counter {
text-align: center;
font-size: 16px;
color: #495057;
margin: 10px 0;
}
</style>
<div class="warmup-demo">
<div class="container">
<p class="subtitle">Mem allocation patterns during model loading</p>
<div class="controls">
<button class="btn" id="startBtn" onclick="startDemo()">Start Animation</button>
<button class="btn" id="resetBtn" onclick="resetDemo()">Reset</button>
</div>
<div class="demo-container">
<div class="side no-warmup">
<h4 data-no-toc>❌ Without Warmup</h4>
<div class="timing" id="noWarmupTime">0.00s</div>
<div class="layer-counter" id="noWarmupCounter">Layers loaded: 0/10</div>
<div class="phase-indicator" id="noWarmupPhase"></div>
<div class="memory-area" id="noWarmupArea"></div>
<div class="description">
<strong>Individual Allocations:</strong><br>
Each model layer triggers a separate cudaMalloc() call, creating memory fragmentation and allocation overhead.
<br><br>
📦 <strong>Grey "malloc"</strong> = Memory allocation overhead<br>
<strong>Green "data"</strong> = Actual layer data loading
</div>
</div>
<div class="side with-warmup">
<h4 data-no-toc>✅ With Warmup</h4>
<div class="timing" id="warmupTime">0.00s</div>
<div class="layer-counter" id="warmupCounter">Layers loaded: 0/10</div>
<div class="phase-indicator" id="warmupPhase"></div>
<div class="memory-area" id="warmupArea">
<div class="warmup-container" id="warmupContainer">
<div class="warmup-fill" id="warmupFill"></div>
</div>
<div id="warmupLayers"></div>
</div>
<div class="description">
<strong>Pre-allocated Pool:</strong><br>
The warmup function calculates total memory needed and makes ONE large allocation. Subsequent layers load directly into this pool, eliminating malloc overhead.
<br><br>
🔵 <strong>Blue container</strong> = Single large malloc (warmup)<br>
🟢 <strong>Green progress bar</strong> = Layer data loading (no malloc needed)
</div>
</div>
</div>
</div>
</div>
<script>
let animationSpeed = 1 / 2.4;
let isRunning = false;
const totalLayers = 10;
function startDemo() {
if (isRunning) return;
isRunning = true;
document.getElementById('startBtn').disabled = true;
document.getElementById('resetBtn').disabled = true;
Promise.all([
animateNoWarmup(),
animateWithWarmup()
]).then(() => {
isRunning = false;
document.getElementById('startBtn').disabled = false;
document.getElementById('resetBtn').disabled = false;
});
}
function resetDemo() {
if (isRunning) return;
document.getElementById('noWarmupArea').innerHTML = '';
document.getElementById('warmupLayers').innerHTML = '';
document.getElementById('warmupFill').style.width = '0%';
document.getElementById('warmupContainer').classList.remove('allocated');
document.getElementById('noWarmupTime').textContent = '0.00s';
document.getElementById('warmupTime').textContent = '0.00s';
document.getElementById('noWarmupCounter').textContent = 'Layers loaded: 0/10';
document.getElementById('warmupCounter').textContent = 'Layers loaded: 0/10';
document.getElementById('noWarmupPhase').textContent = '';
document.getElementById('warmupPhase').textContent = '';
}
async function animateNoWarmup() {
const container = document.getElementById('noWarmupArea');
const timeEl = document.getElementById('noWarmupTime');
const counterEl = document.getElementById('noWarmupCounter');
const phaseEl = document.getElementById('noWarmupPhase');
let currentTime = 0;
const baseDelay = 200 / animationSpeed;
phaseEl.textContent = 'Loading model layers...';
for (let i = 0; i < totalLayers; i++) {
const layerBox = document.createElement('div');
layerBox.className = 'layer-box';
container.appendChild(layerBox);
await sleep(baseDelay * 0.3);
layerBox.classList.add('allocating');
currentTime += 0.08;
timeEl.textContent = currentTime.toFixed(2) + 's';
await sleep(baseDelay * 0.7);
layerBox.classList.remove('allocating');
layerBox.classList.add('loaded');
currentTime += 0.12;
timeEl.textContent = currentTime.toFixed(2) + 's';
counterEl.textContent = `Layers loaded: ${i + 1}/${totalLayers}`;
}
phaseEl.textContent = 'Complete!';
}
async function animateWithWarmup() {
const container = document.getElementById('warmupLayers');
const timeEl = document.getElementById('warmupTime');
const counterEl = document.getElementById('warmupCounter');
const phaseEl = document.getElementById('warmupPhase');
const warmupContainer = document.getElementById('warmupContainer');
const warmupFill = document.getElementById('warmupFill');
let currentTime = 0;
const baseDelay = 200 / animationSpeed;
phaseEl.textContent = 'Warming up allocator...';
await sleep(baseDelay * 2);
warmupContainer.classList.add('allocated');
currentTime += 0.3;
timeEl.textContent = currentTime.toFixed(2) + 's';
phaseEl.textContent = 'Loading model layers...';
for (let i = 0; i < totalLayers; i++) {
const layerBox = document.createElement('div');
layerBox.className = 'layer-box loaded';
layerBox.style.width = '40px';
layerBox.style.height = '20px';
container.appendChild(layerBox);
const progress = ((i + 1) / totalLayers) * 100;
warmupFill.style.width = progress + '%';
await sleep(baseDelay * 0.5);
currentTime += 0.08;
timeEl.textContent = currentTime.toFixed(2) + 's';
counterEl.textContent = `Layers loaded: ${i + 1}/${totalLayers}`;
}
phaseEl.textContent = 'Complete!';
}
function sleep(ms) {
return new Promise(resolve => setTimeout(resolve, ms));
}
</script>