Files
maths-cs-ai-compendium-zh/images/efficientnet_scaling.svg
T

72 lines
6.7 KiB
XML
Raw Blame History

This file contains ambiguous Unicode characters
This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.
<!--
  EfficientNet compound-scaling diagram.
  Five columns of stacked "layer" rectangles (baseline, wider, deeper,
  higher-resolution, compound) followed by a formula box.
  The viewBox mirrors width/height so the drawing scales instead of being
  cropped when embedded at another size; role/title/desc give it an
  accessible name and description.
-->
<svg width="700" height="280" viewBox="0 0 700 280" xmlns="http://www.w3.org/2000/svg" role="img" aria-labelledby="efficientnet-scaling-title efficientnet-scaling-desc">
  <title id="efficientnet-scaling-title">EfficientNet: Compound Scaling</title>
  <desc id="efficientnet-scaling-desc">Five stacks of layers compared side by side: a baseline of 6 layers; a width-scaled stack of 6 wider layers (more channels); a depth-scaled stack of 9 layers (more layers); a resolution-scaled stack of 5 taller layers (higher resolution); and a compound-scaled stack of 9 wide layers with all three scaled together. Formula: d = α^φ, w = β^φ, r = γ^φ subject to α·β²·γ² ≈ 2.</desc>

  <text x="350" y="22" fill="#333" font-size="14" font-weight="bold" text-anchor="middle">EfficientNet: Compound Scaling</text>

  <!--
    Column headings all sit on one row at y=42. The tallest boxes start at
    y=50, so a heading baseline of 55 would put the box border through the
    heading text.
  -->

  <!-- Baseline network: 6 layers -->
  <text x="90" y="42" fill="#666" font-size="10" font-weight="bold" text-anchor="middle">Baseline</text>
  <g fill="#3498db" stroke="#3498db">
    <rect x="50" y="65" width="80" height="120" rx="4" opacity="0.12" stroke-width="1.5"/>
    <!-- Layers inside -->
    <g opacity="0.2" stroke-width="0.8">
      <rect x="62" y="75" width="56" height="14" rx="2"/>
      <rect x="62" y="93" width="56" height="14" rx="2"/>
      <rect x="62" y="111" width="56" height="14" rx="2"/>
      <rect x="62" y="129" width="56" height="14" rx="2"/>
      <rect x="62" y="147" width="56" height="14" rx="2"/>
      <rect x="62" y="165" width="56" height="14" rx="2"/>
    </g>
  </g>
  <!-- Text is kept outside the stroked group so the glyphs do not inherit a stroke. -->
  <g fill="#3498db" font-size="8" text-anchor="middle">
    <text x="90" y="200">d layers</text>
    <text x="90" y="212">w channels</text>
    <text x="90" y="224">r resolution</text>
  </g>

  <!-- Width scaling: same 6 layers, each drawn wider (90 vs 56) -->
  <text x="225" y="42" fill="#e74c3c" font-size="10" font-weight="bold" text-anchor="middle">Width (w)</text>
  <g fill="#e74c3c" stroke="#e74c3c">
    <rect x="170" y="65" width="110" height="120" rx="4" opacity="0.08" stroke-width="1.5"/>
    <g opacity="0.2" stroke-width="0.8">
      <rect x="180" y="75" width="90" height="14" rx="2"/>
      <rect x="180" y="93" width="90" height="14" rx="2"/>
      <rect x="180" y="111" width="90" height="14" rx="2"/>
      <rect x="180" y="129" width="90" height="14" rx="2"/>
      <rect x="180" y="147" width="90" height="14" rx="2"/>
      <rect x="180" y="165" width="90" height="14" rx="2"/>
    </g>
  </g>
  <text x="225" y="200" fill="#e74c3c" font-size="8" text-anchor="middle">More channels</text>

  <!-- Depth scaling: 9 layers at the baseline width -->
  <text x="355" y="42" fill="#27ae60" font-size="10" font-weight="bold" text-anchor="middle">Depth (d)</text>
  <g fill="#27ae60" stroke="#27ae60">
    <rect x="315" y="55" width="80" height="145" rx="4" opacity="0.08" stroke-width="1.5"/>
    <g opacity="0.2" stroke-width="0.8">
      <rect x="327" y="63" width="56" height="12" rx="2"/>
      <rect x="327" y="78" width="56" height="12" rx="2"/>
      <rect x="327" y="93" width="56" height="12" rx="2"/>
      <rect x="327" y="108" width="56" height="12" rx="2"/>
      <rect x="327" y="123" width="56" height="12" rx="2"/>
      <rect x="327" y="138" width="56" height="12" rx="2"/>
      <rect x="327" y="153" width="56" height="12" rx="2"/>
      <rect x="327" y="168" width="56" height="12" rx="2"/>
      <rect x="327" y="183" width="56" height="12" rx="2"/>
    </g>
  </g>
  <text x="355" y="212" fill="#27ae60" font-size="8" text-anchor="middle">More layers</text>

  <!-- Resolution scaling: 5 layers, each drawn taller (20 vs 14) -->
  <text x="480" y="42" fill="#f39c12" font-size="10" font-weight="bold" text-anchor="middle">Resolution (r)</text>
  <g fill="#f39c12" stroke="#f39c12">
    <rect x="430" y="50" width="100" height="150" rx="4" opacity="0.08" stroke-width="1.5"/>
    <g opacity="0.15" stroke-width="0.8">
      <rect x="442" y="60" width="76" height="20" rx="2"/>
      <rect x="442" y="84" width="76" height="20" rx="2"/>
      <rect x="442" y="108" width="76" height="20" rx="2"/>
      <rect x="442" y="132" width="76" height="20" rx="2"/>
      <rect x="442" y="156" width="76" height="20" rx="2"/>
    </g>
  </g>
  <text x="480" y="212" fill="#f39c12" font-size="8" text-anchor="middle">Higher resolution</text>

  <!-- Compound scaling: 9 wide layers; heavier outline (2 vs 1.5) on the outer box -->
  <text x="620" y="42" fill="#9b59b6" font-size="10" font-weight="bold" text-anchor="middle">Compound (φ)</text>
  <g fill="#9b59b6" stroke="#9b59b6">
    <rect x="565" y="50" width="110" height="160" rx="4" opacity="0.08" stroke-width="2"/>
    <g opacity="0.2" stroke-width="0.8">
      <rect x="575" y="58" width="90" height="14" rx="2"/>
      <rect x="575" y="75" width="90" height="14" rx="2"/>
      <rect x="575" y="92" width="90" height="14" rx="2"/>
      <rect x="575" y="109" width="90" height="14" rx="2"/>
      <rect x="575" y="126" width="90" height="14" rx="2"/>
      <rect x="575" y="143" width="90" height="14" rx="2"/>
      <rect x="575" y="160" width="90" height="14" rx="2"/>
      <rect x="575" y="177" width="90" height="14" rx="2"/>
      <rect x="575" y="194" width="90" height="14" rx="2"/>
    </g>
  </g>
  <text x="620" y="222" fill="#9b59b6" font-size="8" text-anchor="middle">All three scaled together</text>

  <!-- Bottom formula box -->
  <rect x="80" y="240" width="540" height="35" rx="6" fill="#f5f5f5" stroke="#333" stroke-width="1"/>
  <g font-size="9" text-anchor="middle">
    <text x="350" y="255" fill="#333">d = α^φ, w = β^φ, r = γ^φ subject to α·β²·γ² ≈ 2</text>
    <text x="350" y="269" fill="#666">Scaling all dimensions together is more effective than scaling any single one.</text>
  </g>
</svg>