File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change 4141 cp wasm/_headers _site/_headers 2>/dev/null || true
4242 # Educational guide (/guide)
4343 cp site/index.html _site/guide/ 2>/dev/null || true
44+ cp site/og-image.png _site/guide/ 2>/dev/null || true
4445
4546 - name: Setup Pages
4647 uses: actions/configure-pages@v5
Original file line number Diff line number Diff line change 55<meta name="viewport" content="width=device-width, initial-scale=1.0">
66<title>quant.cpp — Understanding KV Cache Compression</title>
77<meta name="description" content="An educational guide to KV cache compression in LLM inference. Learn how quant.cpp achieves 6.4x compression with only 3% quality loss.">
8+ <!-- Open Graph / Social Preview -->
9+ <meta property="og:title" content="quant.cpp — AI's Memory, Compressed 6.4x">
10+ <meta property="og:description" content="An interactive guide to KV cache compression. 4 orthogonal techniques achieve 6.4x compression at 3% quality cost.">
11+ <meta property="og:image" content="https://quantumaikr.github.io/quant.cpp/guide/og-image.png">
12+ <meta property="og:url" content="https://quantumaikr.github.io/quant.cpp/guide/">
13+ <meta property="og:type" content="website">
14+ <meta name="twitter:card" content="summary_large_image">
15+ <meta name="twitter:title" content="quant.cpp — AI's Memory, Compressed 6.4x">
16+ <meta name="twitter:description" content="An interactive guide to KV cache compression. 6.4x compression, 59% faster attention, 3% quality cost.">
17+ <meta name="twitter:image" content="https://quantumaikr.github.io/quant.cpp/guide/og-image.png">
818<style>
919/* ===== Reset & Base ===== */
1020* {margin: 0; padding: 0; box-sizing: border-box}
You can’t perform that action at this time.
0 commit comments