Unverified commit 56dd0d90, authored by dagil-nvidia and committed by GitHub
Browse files

docs: update architecture overview diagram (#7440)


Signed-off-by: Dan Gil <dagil@nvidia.com>
parent 3882cba4
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 70 560 525" width="1680" height="1575">
<svg xmlns="http://www.w3.org/2000/svg" viewBox="0 70 560 525" width="2240" height="2100">
<defs>
<linearGradient id="bg-grad" x1="0%" y1="0%" x2="100%" y2="100%">
<stop offset="0%" stop-color="#F8FAFC"/>
......@@ -96,6 +96,7 @@
<style>
text { font-family: -apple-system, 'Segoe UI', 'Helvetica Neue', Arial, sans-serif; }
.title { font-size: 24px; font-weight: 700; fill: #0F172A; }
.subtitle { font-size: 12px; font-weight: 400; fill: #94A3B8; letter-spacing: 0.3px; }
.box-label { font-size: 13.5px; font-weight: 600; fill: #1E293B; text-anchor: start; }
.box-label-center { font-size: 14px; font-weight: 600; fill: #1E293B; text-anchor: middle; }
......@@ -116,6 +117,40 @@
.connector-dashed { fill: none; stroke: #CBD5E1; stroke-width: 1.8; stroke-dasharray: 6 4; }
</style>
<!-- Logo and title removed -->
<!-- REMOVED_START
<path fill="#76B900" d="M39.49988,24c0-.61621-.04578-1.2207-.1156-1.81787.18384-.31543.37524-.63477.5365-.93945,1.00208-1.90088,1.57373-3.56885,1.57886-4.9292.00232-.81348-.2207-1.55127-.75012-2.07324l-.00049.00049c-.53174-.52588-1.2771-.74365-2.1012-.7417-.4353,0-.8999.05859-1.39343.16797l.21594.97607c.43762-.09668.83337-.14453,1.17749-.14453.66443.00195,1.11035.16797,1.39893.45312l.00073.00146c.28528.28125.44995.71289.45227,1.36035.00488,1.0376-.47583,2.55273-1.38306,4.29688-1.29248-5.78564-5.81421-10.34082-11.57874-11.68896.14099-.07227.28088-.14209.41882-.20947l.44922-.21875-.43726-.89844-.44922.21875c-.15088.07275-.30322.14893-.45703.22803l-.44482.22852.26074.50732c-.93384-.17529-1.89368-.27734-2.87842-.27734-8.56067,0-15.49976,6.93945-15.5,15.5,0,.61621.04565,1.2207.1156,1.81787-.18396.31543-.37549.63477-.53699.93994-1.0022,1.90137-1.57373,3.56982-1.57886,4.93066-.00244.81348.22119,1.55176.75049,2.07373l.00037.00098c.52856.52051,1.27014.73779,2.09155.73584.41211,0,.85132-.05225,1.31714-.1499l-.20581-.97852-.00012-.00049c-.41138.08691-.78467.12939-1.11121.12939-.6604-.00195-1.10413-.16748-1.38965-.44922h-.00012c-.28564-.28271-.45044-.71436-.45276-1.36182-.005-1.03906.47595-2.5542,1.38354-4.29932,1.29224,5.78564,5.81409,10.34082,11.57874,11.68896-.14099.07227-.28076.14209-.4187.20898l-.44971.21826.43677.89941.44971-.21826c.151-.07324.30347-.14941.45728-.22852l.44434-.22852-.26074-.50732c.93396.17529,1.89417.27734,2.87915.27734,8.56055,0,15.49963-6.93945,15.49988-15.49951ZM9.65552,26.01221c.9043-1.50684,2.06372-3.14062,3.45288-4.82471l.00024.00049-.00012-.00049c.61035-.73975,1.26306-1.48828,1.95447-2.23926l-.7356-.67676c-.70337.76318-1.36804,1.52539-1.99023,2.27979l.00012.00049c-1.07947,1.30859-2.01318,2.58545-2.81897,3.81201-.00317-.12207-.01843-.24072-.01843-.36377.00037-4.00586,1.62219-7.62744,4.24695-10.25342,2.62561-2.62451,6.24744-4.24658,10.25317-4.24707.17468,0,.34424.02002.51733.02637-.37134.23877-.74536.48438-1.12598.74854l.57007.82129-.00012.00049c.762
08-.52832,1.49988-.99561,2.21375-1.41602,3.13135.47217,5.93835,1.92773,8.078,4.06641,2.1759,2.17725,3.64624,5.04346,4.09119,8.24072-.9043,1.50732-2.06372,3.1416-3.453,4.82617h0c-.61023.74023-1.26282,1.48877-1.95422,2.23926l.7356.67676c.70312-.7627,1.3678-1.52539,1.98999-2.2793h.00037c1.07922-1.30957,2.01282-2.58691,2.81873-3.81396.00293.12207.01831.24072.01831.36377-.00037,4.00537-1.62219,7.62695-4.24695,10.25293-2.62561,2.62451-6.24744,4.24658-10.25305,4.24707-.17444,0-.34375-.02002-.51672-.02637.37085-.23828.74451-.48389,1.12463-.74756l-.56982-.82227v.00049c-.7616.52832-1.49902.99512-2.2124,1.41504-3.13184-.47217-5.93896-1.92773-8.07886-4.06641-2.17603-2.17725-3.64624-5.04395-4.09131-8.24072Z"/>
<path fill="#76B900" d="M19.56604,28.06836l2.69275,1.34668c-.01807.10156-.03149.20508-.03149.31201.00024.979.79346,1.77246,1.77271,1.77246.97913,0,1.77234-.79346,1.77258-1.77246-.00012-.10693-.01343-.21045-.03162-.31201l2.69275-1.34668c.32361.34717.78137.56738,1.29358.56738.97913,0,1.77222-.79297,1.77258-1.77197-.00024-.97949-.79346-1.77295-1.77258-1.77295-.18311,0-.35632.03564-.52246.0874l-.78577-1.17822.78601-1.17969c.16602.05176.33911.0874.52222.0874.97913,0,1.77234-.79346,1.77258-1.77246-.00024-.97949-.79346-1.77295-1.77258-1.77295-.51245,0-.97034.2207-1.29395.56836l-2.69226-1.34668c.01807-.10107.03137-.20459.03149-.31104-.00024-.97949-.79346-1.77295-1.77258-1.77295-.97925,0-1.77246.79346-1.77271,1.77295,0,.10693.01343.20996.03149.31152l-2.7168,1.3584c-.32202-.33154-.77075-.53857-1.26929-.53857-.97925,0-1.77246.79346-1.77271,1.77295.00037.979.79346,1.77197,1.77271,1.77197.19141,0,.37231-.03809.54517-.09424l.76257,1.14453-.78552,1.17871c-.16602-.05176-.33911-.0874-.52222-.0874-.97925,0-1.77246.79346-1.77271,1.77295.00037.979.79346,1.77197,1.77271,1.77197.51221,0,.96973-.22021,1.29333-.56738ZM20.78296,23.99951l.52478-.78711.95105.4751c-.01807.10205-.03149.20557-.03149.3125,0,.10645.01343.20947.03137.31104l-.95093.47559-.18689-.28027-.33789-.50684ZM26.69226,24.78613l-.95105-.47461c.01807-.10156.03137-.20508.03137-.31152,0-.10693-.01331-.21045-.03149-.31201l.95093-.47559.5249.78711-.52466.78662ZM24.77271,24c-.00024.10254-.02246.19922-.05859.28809l-.0166.03369c-.03455.07422-.08057.1416-.13574.20068-.02173.02393-.04858.0415-.07288.06201-.04578.03857-.09412.07324-.14807.1001-.02441.0127-.04907.02441-.07483.03418-.08362.03125-.17163.05371-.26599.0542-.09448-.00049-.18237-.02295-.26611-.0542-.02576-.00977-.05029-.02148-.07483-.03418-.05371-.02686-.10217-.06152-.14783-.09961-.02441-.021-.05151-.03857-.07324-.0625-.05493-.05908-.10083-.12598-.13525-.2002l-.01709-.03418c-.03613-.08936-.05835-.18604-.05847-.28809.00085-.42725.34619-.77246.77283-.77344.42651.00098.77185.34619
.77271.77344ZM20.04541,26.86377c0-.10693-.01343-.21045-.03149-.31201l.95117-.4751,1.57422,2.36133-2.52539-1.2627c.01807-.10156.03149-.20459.03149-.31152ZM23.53125,28.02539c-.0188.00488-.03931.00391-.05774.00977l-1.0011-1.50098-.60596-.90918.84033-.41992c.10181.10938.21582.20557.34216.28662.01062.00684.02234.01123.03308.01758.11304.06885.23462.12305.36255.16553.03442.01172.06824.02295.10376.03223.14502.03857.29456.06543.45166.06543s.30664-.02686.45166-.06543c.03552-.00928.06921-.02051.10376-.03223.12793-.04199.24951-.09668.36255-.16553.01074-.00635.02246-.01074.03296-.01758.12646-.08105.24036-.17725.34216-.28662l.08997.04492.75037.37549-.81189,1.21777-.79492,1.19189c-.01843-.00586-.03906-.00488-.05786-.00977-.15015-.0415-.30542-.0708-.46875-.0708s-.3186.0293-.46875.0708ZM25.46033,28.43799l1.57434-2.36182.95129.47559c-.01819.10156-.03149.20508-.03149.31201s.01331.20996.03137.31152l-2.52551,1.2627ZM27.59387,25.2373l.224-.33643.44775.67188-.67175-.33545ZM27.59375,22.76172l.67334-.33691-.44885.67334-.22449-.33643ZM24.52246,19.95752l.29602.44434,1.31458,1.97217-.84009.41992c-.32349-.34668-.78101-.56689-1.29297-.56689s-.96948.22021-1.29297.56689l-.84058-.41992.00037-.00049h-.00012l1.6106-2.41602c.16626.05176.33948.0874.52271.0874.18311,0,.3562-.03564.52246-.0874ZM20.21985,22.66846l.18604.09326-.22437.33643-.44836-.67285.48669.24316ZM20.40588,25.2373l-.67126.33496.44727-.6709.224.33594ZM24,30.5c-.42664-.00098-.77197-.34619-.77283-.77295.00012-.10254.02234-.19971.05872-.28906l.01562-.03076c.00757-.0166.02124-.02881.03003-.04492.05322-.09766.125-.1748.20508-.23682.03894-.03027.07764-.06055.12207-.08252.02319-.01172.04578-.02441.07007-.03369.08496-.03223.17505-.05518.27124-.05518s.18628.02295.27124.05518c.02417.00928.04688.02197.07007.03369.04431.02197.08301.05225.12195.08203.08044.0625.15222.14014.20569.23828.00854.01562.02197.02734.02954.04395l.01538.03076c.0365.08936.05859.18652.05884.28906-.00085.42676-.34619.77197-.77271.77295ZM30.5,26.86377c-.00085.42578-.34619.77148-.77
271.77246-.30542-.00049-.56348-.18164-.68921-.43848-.05347-.10986-.08325-.21826-.08362-.33447.00024-.11523.03015-.22461.08362-.33398.12549-.25732.38379-.43848.68921-.43896.42651.00098.77185.34619.77271.77344ZM29.72729,20.36182c.42651.00098.77185.34619.77271.77344-.00085.42676-.34619.77197-.77271.77295-.42676-.00098-.77209-.34619-.77295-.77295.00085-.42725.34619-.77246.77295-.77344ZM27.98608,21.44775l-.60938.30469-.34192.1709-1.57483-2.36182,2.52588,1.2627c-.01807.10156-.03137.20459-.03137.31104,0,.10693.01331.21094.03162.3125ZM24,17.49951c.42651.00098.77185.34619.77271.77344-.00085.42578-.34619.77148-.77271.77246-.42664-.00098-.77197-.34668-.77283-.77246.00085-.42725.34619-.77246.77283-.77344ZM22.53979,19.56152l-1.14355,1.71533-.43091.646-.94751-.47314c.01392-.08936.02747-.1792.02747-.27246,0-.12012-.01257-.2373-.0354-.35107l2.52991-1.26465ZM17.49988,21.17725c.00085-.42725.34619-.77246.77283-.77344.42664.00098.77185.34619.77271.77344-.00085.42578-.34607.77148-.77271.77246-.42664-.00098-.77197-.34668-.77283-.77246ZM17.49988,26.86377c.00085-.42725.34619-.77246.77283-.77344.30542.00049.56372.18164.68921.43896.05322.10986.08325.21924.0835.33398-.00037.11621-.03003.22461-.08374.33447-.12549.25684-.38354.43799-.68896.43848-.42664-.00098-.77197-.34668-.77283-.77246Z"/>
<path fill="#76B900" d="M10.69629,14.45703c.10706-.12354.21558-.24805.32544-.37256l.33057-.375-.75-.66113-.33057.375c-.11218.12695-.2229.25342-.33228.38037l-.32666.37842.75684.65332.32666-.37842Z"/>
<path fill="#76B900" d="M12.36096,12.62549c.1134-.11914.22791-.23779.34351-.35693l.34863-.35889-.71729-.69727-.34863.35889c-.1178.12158-.23438.24268-.34985.36377l-.34521.36182.72363.69043.34521-.36182Z"/>
<polygon fill="#76B900" points="15.93445 9.19141 15.93445 9.19189 15.95569 9.17285 16.3302 8.8418 15.66858 8.09277 15.29407 8.42383 15.27234 8.44238 14.89783 8.77344 15.55994 9.52246 15.93445 9.19141"/>
<path fill="#76B900" d="M14.1106,10.87109h.00012c.11877-.11426.2384-.22803.35913-.3418l.36377-.34326-.68652-.72754-.36377.34326c-.12268.11621-.24438.23193-.36511.34766l-.36084.34619.69238.72168.36084-.34619Z"/>
<path fill="#76B900" d="M7.59961,18.54688l-.00012-.00049c.44568-.69482.95764-1.42041,1.52917-2.16602l.00635-.0083-.00012-.00049c.09912-.12939.20007-.25928.30273-.38965l.30908-.39307-.78589-.61816-.30908.39307c-.10535.13379-.20886.26709-.31067.3999l-.3042.39697.00757.00586c-.46753.62695-.90454,1.24414-1.28687,1.84033l.84204.54004Z"/>
<path fill="#76B900" d="M6.61475,20.23438l-.88721-.46094c-.55151,1.06152-.93237,2.0415-1.11304,2.92432l.97974.2002c.15308-.75342.49805-1.66016,1.02051-2.66357Z"/>
<path fill="#76B900" d="M7.48645,26.49854l.23035-.00342-.03345-.99902-.00012-.00049-.19678.00342c-.79749-.00195-1.31287-.20752-1.61194-.54785-.22632-.25732-.35815-.61182-.37354-1.11475l-.99951.02832c.00977.38867.08789.75537.22681,1.09033l-.00903.00391c.00977.02344.0293.04102.03955.06396.0957.2124.21045.41406.36621.59033.55908.63086,1.40454.88721,2.36145.88525Z"/>
<path fill="#76B900" d="M37.04224,33.44922c-.11047.12109-.22241.24219-.33569.36328l-.34131.36523.73096.68262.34131-.36523c.1156-.12402.22998-.24756.34277-.37109l.3374-.36914-.73804-.6748-.3374.36914Z"/>
<polygon fill="#76B900" points="31.65747 38.56494 31.65759 38.56494 31.63586 38.58301 31.25159 38.90332 31.89221 39.67188 32.27649 39.35156 32.29834 39.33252 32.68213 39.01172 32.04126 38.24414 31.65747 38.56494"/>
<path fill="#76B900" d="M35.32666,35.23291l-.00012.00049c-.11658.11572-.2345.23145-.35352.34717l-.3584.34863.69751.7168.3584-.34863c.12109-.11816.24109-.23584.35999-.35352l.35547-.35205-.70386-.71094-.35547.35205Z"/>
<path fill="#76B900" d="M33.52808,36.93799c-.12195.11035-.24487.2207-.36865.33154l-.37305.33252.66553.74609.37305-.33252c.12598-.1123.25098-.22461.375-.3374l.37012-.33594-.67188-.74023-.37012.33594Z"/>
<path fill="#76B900" d="M40.2533,29.44775h-.00012c-.46692.68506-1.00098,1.39893-1.59607,2.13184l.00037.00049h-.00024l-.00012-.00049c-.10278.12646-.20728.25342-.31372.38135l-.31982.38379.76831.63965.31982-.38379c.10876-.13037.21606-.26074.32141-.39062l.00037.00049c.00452-.00586.00842-.01123.01306-.0166l.30176-.37207-.00708-.00586c.48511-.61426.93933-1.21924,1.33826-1.80469l-.82617-.56348Z"/>
<path fill="#76B900" d="M41.28479,27.78809l.87402.48633c.5813-1.0459.98938-2.01465,1.19495-2.89209l-.97388-.22754c-.17407.74854-.54456,1.64502-1.09509,2.6333Z"/>
<path fill="#76B900" d="M40.43091,21.49951l-.07886.00098.02148.99951.05737-.00098c.86951.00195,1.422.22607,1.72656.5957.21912.26416.34082.62012.34253,1.12598h1c.00098-.39014-.06714-.75977-.19666-1.09863l.00928-.00342c-.00916-.02393-.02844-.04199-.03821-.06543-.08936-.21436-.19824-.41895-.34863-.59863-.57202-.68408-1.46948-.95703-2.49487-.95508Z"/>
<polygon fill="#76B900" points="40.37354 22.50049 40.37354 22.5 40.37341 22.5 40.37354 22.50049"/>
<path fill="#76B900" d="M18.57056,15.4458l-.67651-.73633c-.52161.47949-1.04297.97559-1.56213,1.48828-.20703.2041-.4115.40869-.61328.61328l.71228.70215c.19849-.20166.39966-.40283.60327-.604.51086-.50391,1.02368-.99219,1.53638-1.46338Z"/>
<path fill="#76B900" d="M20.05322,14.12939c.77734-.66602,1.54968-1.29053,2.30933-1.86914l-.6062-.7959c-.77539.59131-1.56238,1.22754-2.35388,1.90576l.65088.75977-.00012-.00049Z"/>
<path fill="#76B900" d="M33.66895,8.30664c.05298.10791.09644.229.12891.36572l.11621.48633.9729-.23242-.11621-.48633c-.04822-.20166-.11572-.39404-.20447-.57471l-.2207-.44873-.89746.44141.2207.44873h.00012Z"/>
<path fill="#76B900" d="M32.02148,7.49951l.0022-.00049c.15356,0,.29688.00977.42908.02734l.49561.06689.13428-.99121-.49561-.06689c-.18176-.02441-.36963-.03564-.56335-.03564h-.50269l.00049,1h.5Z"/>
<path fill="#76B900" d="M29.74451,7.96045v-.00049c.1554-.05371.30737-.10303.45557-.14746l.479-.14404-.28735-.95801-.479.14404c-.16248.04883-.32776.10254-.49561.16064l-.47266.16357.32739.94531.47266-.16357Z"/>
<polygon fill="#76B900" points="40.04736 14.95312 40.04749 14.95312 40.04724 14.95264 40.04736 14.95312"/>
<path fill="#76B900" d="M29.42908,32.55469l.67676.73633c.52148-.479,1.04285-.97559,1.56213-1.4873.20703-.20459.4115-.40918.61328-.61377l-.71216-.70215h-.00012c-.19849.20166-.39966.40283-.60327.604-.51086.50342-1.0238.9917-1.53662,1.46289Z"/>
<path fill="#76B900" d="M27.94641,33.87109c-.77747.66602-1.5498,1.29053-2.30945,1.86914l.60596.7959c.77551-.59131,1.56262-1.22754,2.35413-1.90576l-.65063-.75879v-.00049Z"/>
<rect fill="#76B900" x="13.26849" y="36.94187" width="1.03637" height="1.00006" transform="translate(-25.71802 43.04067) rotate(-77.852)"/>
<path fill="#76B900" d="M14.33044,39.69189c-.05298-.10791-.09644-.22949-.12903-.36572l-.11572-.48633-.97266.23145.11572.48633c.0481.20215.11548.39453.20422.5752l.2207.44873.89746-.44141-.2207-.44873v.00049Z"/>
<path fill="#76B900" d="M15.97791,40.49854l-.00195.00049c-.15369,0-.29688-.00977-.4292-.02734l-.49512-.06738-.13452.99023.49512.06738c.18176.0249.36975.03662.56372.03662h.00244l.5-.00049-.00049-1-.5.00049Z"/>
<path fill="#76B900" d="M18.25537,40.03857h-.00012c-.1554.05371-.30737.10303-.45569.14746l-.479.14355.28711.95801.479-.14355c.16248-.04883.32764-.10205.49561-.16016l.47266-.16357-.3269-.94531-.47266.16357Z"/>
<polygon fill="#76B900" points="37.47046 14.64355 37.47034 14.64307 37.47034 14.64307 37.47046 14.64355"/>
REMOVED_END -->
<!-- ================================================ -->
<!-- ROW 1 -->
<!-- ================================================ -->
......@@ -123,7 +158,6 @@
<!-- Router (green, wider, centered above workers) -->
<!-- Box: 280x88 rounded rectangle (rx=10) at (130,84). Its paint and glow come
     from the green-fill and green-glow resources, which are referenced by id
     and defined outside this excerpt. -->
<rect x="130" y="84" width="280" height="88" rx="10"
fill="url(#green-fill)" filter="url(#green-glow)"/>
<!-- Icon: 20x20 instance of the sym-fork symbol near the box's top-left corner.
     The inline color only has an effect if the symbol paints with currentColor
     (symbol definition not visible here; TODO confirm).
     NOTE(review): the hunk header for this fragment reports one line fewer
     after the change; presumably this icon is the line that was dropped.
     Confirm against the real file. -->
<use href="#sym-fork" x="136" y="88" width="20" height="20" style="color:rgba(255,255,255,0.8)"/>
<!-- Labels: both anchored at x=270, the horizontal midpoint of the box
     (130 + 280/2). The box-label-white and box-sub-white classes are not
     visible in this excerpt; presumably they centre the text on that point. -->
<text x="270" y="125" class="box-label-white">Router</text>
<text x="270" y="138" class="box-sub-white">KV-Aware Routing</text>
......@@ -140,7 +174,6 @@
<!-- Prefill worker card -->
<!-- Accent layer: green rectangle at x=48, same size as the card, 70% opaque.
     The white card that follows is painted on top of it, shifted 2px to the
     right, so roughly a 2px green strip stays visible along the left edge. -->
<rect x="48" y="256" width="160" height="88" rx="10" fill="#76B900" opacity="0.7"/>
<!-- Card face: white rounded rectangle with a faint translucent border and
     the "shadow" filter (defined outside this excerpt). -->
<rect x="50" y="256" width="160" height="88" rx="10"
fill="white" stroke="rgba(226,232,240,0.6)" stroke-width="1" filter="url(#shadow)"/>
<!-- Icon: 20x20 instance of the sym-layers symbol in the card's top-left
     corner, tinted green at 80% opacity via the inline style.
     NOTE(review): the hunk header for this fragment reports one line fewer
     after the change; presumably this icon is the line that was dropped.
     Confirm against the real file. -->
<use href="#sym-layers" x="54" y="258" width="20" height="20" style="color:#76B900;opacity:0.8"/>
<!-- Labels: start at x=60, i.e. 10px inside the card's left edge (x=50).
     The box-label class sets text-anchor: start, so x is the left edge of the
     text. The box-sub class is not visible in this excerpt. -->
<text x="60" y="296" class="box-label">Prefill</text>
<text x="60" y="309" class="box-sub">Worker</text>
......@@ -148,7 +181,6 @@
<!-- Decode worker card -->
<!-- Accent layer: green rectangle at x=328, same size as the card, 70% opaque.
     The white card that follows is painted on top of it, shifted 2px to the
     right, so roughly a 2px green strip stays visible along the left edge. -->
<rect x="328" y="256" width="160" height="88" rx="10" fill="#76B900" opacity="0.7"/>
<!-- Card face: white rounded rectangle with a faint translucent border and
     the "shadow" filter (defined outside this excerpt). -->
<rect x="330" y="256" width="160" height="88" rx="10"
fill="white" stroke="rgba(226,232,240,0.6)" stroke-width="1" filter="url(#shadow)"/>
<!-- Icon: 20x20 instance of the sym-stream symbol in the card's top-left
     corner, tinted green at 80% opacity via the inline style.
     NOTE(review): the hunk header for this fragment reports one line fewer
     after the change; presumably this icon is the line that was dropped.
     Confirm against the real file. -->
<use href="#sym-stream" x="334" y="258" width="20" height="20" style="color:#76B900;opacity:0.8"/>
<!-- Labels: start at x=340, i.e. 10px inside the card's left edge (x=330).
     The box-label class sets text-anchor: start, so x is the left edge of the
     text. The box-sub class is not visible in this excerpt. -->
<text x="340" y="296" class="box-label">Decode</text>
<text x="340" y="309" class="box-sub">Worker</text>
......@@ -164,7 +196,6 @@
<rect x="30" y="420" width="480" height="48" rx="10"
fill="url(#green-fill)" filter="url(#green-glow)" opacity="0.75"/>
</g>
<use href="#sym-transfer" x="36" y="422" width="20" height="18" style="color:white"/>
<text x="270" y="440" class="box-label-white">NIXL</text>
<text x="270" y="453" class="box-sub-white">Accelerated KV Transfer</text>
......@@ -221,8 +252,8 @@
<!-- KV Cache pills (lines drawn earlier, before NIXL) -->
<!-- Left pill: 60x16 capsule at (136,384); rx=8 is half the height, which
     gives fully rounded ends. Its label is placed at x=166, the pill's
     horizontal midpoint (136 + 60/2). -->
<rect x="136" y="384" width="60" height="16" rx="8" class="pill-green"/>
<!-- NOTE(review): the next two text elements share the same position and
     classes and differ only in wording. This excerpt looks like a rendered
     diff (see the @@ hunk markers), so presumably the first is the old label
     and the second its replacement. If both were kept in one SVG they would
     overprint each other. Confirm which one the real file contains, and
     whether the "KV Cache pills" heading comment should be updated to match. -->
<text x="166" y="395" class="conn-label label-green">KV Cache</text>
<text x="166" y="395" class="conn-label label-green">KV Transfer</text>
<!-- Right pill: same 60x16 capsule at (344,384); label at x=374, the pill's
     horizontal midpoint (344 + 60/2). -->
<rect x="344" y="384" width="60" height="16" rx="8" class="pill-green"/>
<!-- NOTE(review): same old/new label pair as for the left pill; presumably
     only the second line exists in the updated file. Confirm. -->
<text x="374" y="395" class="conn-label label-green">KV Cache</text>
<text x="374" y="395" class="conn-label label-green">KV Transfer</text>
</svg>
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment