Files
LocalAI/docs/static/images/diagrams/model-resolution.html
LocalAI [bot] 7e59a5c7c5 docs: architecture & feature diagrams (blueprint style) (#10137)
* docs: add 'how LocalAI works' architecture diagram

Add a blueprint-style architecture diagram: clients -> small core (API,
router, WebUI, agents) -> gRPC -> backend processes pulled on demand as
OCI images. Place it on the overview page and replace the stale external
architecture image on the reference page.

Assisted-by: Claude:claude-opus-4-8 [Claude Code]
Signed-off-by: Ettore Di Giacinto <mudler@localai.io>

* docs: add blueprint diagrams across feature, distributed & getting-started docs

Add 24 architecture/flow/comparison diagrams (PNG + HTML source) under
docs/static/images/diagrams/, wired into their docs pages, from an
impact-vs-effort audit of the docs. Broaden the API surface on the
overview architecture diagram (OpenAI, Anthropic, ElevenLabs, Ollama,
and LocalAI's own API) and move the gRPC boundary label clear of the arrows.

Pages: distributed mode (architecture, scheduling, ds4 layer-split),
distributed inferencing, MLX, realtime, quantization, MCP, agents,
mitm & cloud proxy, middleware, reverse-proxy TLS, VRAM, voice & face
recognition, reranker, function calling, fine-tuning (recipe + jobs),
diarization, audio transform, quickstart, model resolution.

Assisted-by: Claude:claude-opus-4-8 [Claude Code]
Signed-off-by: Ettore Di Giacinto <mudler@localai.io>

* docs: add composable-core diagram to README hero

Commit the composable-core card (small core + on-demand backend tiles)
alongside the other diagrams and reference it from the README hero via a
repo-relative path, so it renders on GitHub.

Assisted-by: Claude:claude-opus-4-8 [Claude Code]
Signed-off-by: Ettore Di Giacinto <mudler@localai.io>

* docs: fix composable-core connectors/badge and federated-vs-worker layout

- composable-core: thicken the plug-in connectors so they read clearly, and
  widen the SEPARATE IMAGE badge so its text no longer overflows the box.
- federated-vs-worker: shorten the WHOLE/SPLIT REQUEST pills to fit, and
  replace the tangled node-to-node activation arrows with a clean fan-out
  (request split across all sharded nodes), mirroring the federated panel.

Assisted-by: Claude:claude-opus-4-8 [Claude Code]
Signed-off-by: Ettore Di Giacinto <mudler@localai.io>

---------

Signed-off-by: Ettore Di Giacinto <mudler@localai.io>
Co-authored-by: Ettore Di Giacinto <mudler@localai.io>
2026-06-02 18:43:22 +02:00

149 lines
6.7 KiB
HTML

<!doctype html>
<html lang="en">
<head>
<meta charset="utf-8">
<link rel="preconnect" href="https://fonts.googleapis.com">
<link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
<link href="https://fonts.googleapis.com/css2?family=Bricolage+Grotesque:opsz,wght@12..96,600;12..96,700;12..96,800&family=Archivo:wght@500;600;700&display=swap" rel="stylesheet">
<style>
/* Colour palette exposed as custom properties and referenced below via var(). */
:root{
--paper:#F3E8D2; --paper2:#ECDFC2; --ink:#211C14; --ink-soft:#5A5142;
--rust:#B43A2C; --rust-deep:#8F2C20; --cold:#3F6E73; --hi:#E7D6AE; --dim:#A99F88;
}
/* Reset: border-box sizing and no default margin/padding on any element. */
*{box-sizing:border-box;margin:0;padding:0}
/* The page has a fixed 1600x900 size. */
html,body{width:1600px;height:900px}
/* Paper-coloured background overlaid with a 40px grid of 1px lines (one horizontal and one vertical gradient). */
body{
background:var(--paper);color:var(--ink);font-family:"Archivo",sans-serif;
position:relative;overflow:hidden;
background-image:
linear-gradient(var(--paper2) 1px,transparent 1px),
linear-gradient(90deg,var(--paper2) 1px,transparent 1px);
background-size:40px 40px;
}
/* Ink border inset 26px from the page edge. */
.frame{position:absolute;inset:26px;border:3px solid var(--ink);}
/* Content column occupying the same inset box as .frame: header, stage, footer stacked vertically. */
.wrap{position:absolute;inset:26px;padding:30px 56px 26px;display:flex;flex-direction:column}
/* Header row: title block on the left, stamp on the right, aligned to the bottom edge. */
header{display:flex;align-items:flex-end;justify-content:space-between;gap:30px}
.eyebrow{font-weight:700;letter-spacing:.22em;text-transform:uppercase;font-size:17px;color:var(--rust-deep)}
.eyebrow b{color:var(--ink)}
h1{font-family:"Bricolage Grotesque",sans-serif;font-weight:800;font-size:50px;line-height:.98;letter-spacing:-.015em;margin-top:6px}
/* <em> inside the title is used for colour emphasis only, not italics. */
h1 em{font-style:normal;color:var(--rust)}
/* Stamp: bordered box rotated 3 degrees with a hard 6px offset shadow; flex:none keeps it from shrinking. */
.stamp{border:3px solid var(--ink);padding:10px 16px 8px;transform:rotate(3deg);text-align:center;background:var(--paper);box-shadow:6px 6px 0 var(--ink);flex:none}
.stamp .k{font-family:"Bricolage Grotesque";font-weight:800;font-size:21px;letter-spacing:.04em;line-height:1.05}
.stamp .s{font-weight:700;font-size:11px;letter-spacing:.18em;text-transform:uppercase;color:var(--ink-soft);margin-top:5px}
/* The stage takes all vertical space left between header and footer. */
.stage{flex:1;margin-top:8px}
/* The SVG fills its container; overflow:visible lets drawn content extend past the viewBox without clipping. */
svg{width:100%;height:100%;overflow:visible}
/* Footer row: caption on the left, URL on the right. */
footer{display:flex;align-items:center;justify-content:space-between;margin-top:6px;gap:24px}
.note{font-weight:600;font-size:18px;color:var(--ink-soft);line-height:1.3;max-width:1080px}
.note b{color:var(--ink)}
.url{font-family:"Bricolage Grotesque";font-weight:800;font-size:22px;color:var(--rust-deep);letter-spacing:.01em;flex:none}
.url span{color:var(--ink)}
</style>
</head>
<body>
<div class="frame"></div>
<div class="wrap">
<header>
<div>
<div class="eyebrow">LocalAI <b>&middot;</b> Models</div>
<h1>Many sources, <em>one load path</em></h1>
</div>
<div class="stamp">
<div class="k">AUTO</div>
<div class="s">detect</div>
</div>
</header>
<div class="stage"><svg viewBox="0 0 1480 560" id="svg"></svg></div>
<footer>
<div class="note">However you point at a model, it lands on the same <b>resolve &rarr; backend &rarr; load</b> path.</div>
<div class="url">localai.io<span>/getting-started/models</span></div>
</footer>
</div>
<script>
// Colour palette for the SVG drawing code; the hex values match the CSS custom properties declared in :root.
const INK = "#211C14";
const PAPER = "#F3E8D2";
const PAPER2 = "#ECDFC2";
const HI = "#E7D6AE";
const SOFT = "#5A5142";
const RUST = "#B43A2C";
const RUSTD = "#8F2C20";
const COLD = "#3F6E73";
const DIM = "#A99F88";
/**
 * Create an element in the SVG namespace.
 *
 * @param {string} t - Tag name, e.g. "rect" or "path".
 * @param {Object} [a] - Attribute name/value pairs; each is applied with setAttribute.
 * @param {*} [x] - Text content; assigned only when it is neither null nor undefined.
 * @returns {Element} The newly created element (not yet attached to the document).
 */
function el(t, a, x) {
  const node = document.createElementNS("http://www.w3.org/2000/svg", t);
  // Copy own keys only: for...in would also pick up enumerable properties
  // inherited through the prototype chain and write them as attributes.
  // `a || {}` keeps a call without attributes a no-op.
  Object.keys(a || {}).forEach((key) => {
    node.setAttribute(key, a[key]);
  });
  if (x != null) {
    node.textContent = x;
  }
  return node;
}
// The <svg id="svg"> element in the page body; every drawing helper below appends its shapes to it.
const svg=document.getElementById("svg");
/**
 * Append a rectangle with a hard drop shadow to the diagram.
 *
 * Two rects are added: first an ink-filled copy shifted 7 units right and
 * down, then the rectangle itself on top of it.
 *
 * @param {number} x - Left edge of the rectangle.
 * @param {number} y - Top edge of the rectangle.
 * @param {number} w - Width.
 * @param {number} h - Height.
 * @param {string} fill - Fill colour of the front rectangle.
 * @param {string} [stroke] - Outline colour; falls back to INK when falsy.
 * @param {number} [sw] - Outline width; falls back to 3.5 when falsy.
 * @param {string} [dash] - stroke-dasharray value; falls back to "none" when falsy.
 */
function shadowRect(x, y, w, h, fill, stroke, sw, dash) {
  const offset = 7;
  const shadow = el("rect", {
    x: x + offset,
    y: y + offset,
    width: w,
    height: h,
    fill: INK,
  });
  const face = el("rect", {
    x: x,
    y: y,
    width: w,
    height: h,
    fill: fill,
    stroke: stroke || INK,
    "stroke-width": sw || 3.5,
    "stroke-dasharray": dash || "none",
  });
  // Shadow first so the face paints over it.
  svg.appendChild(shadow);
  svg.appendChild(face);
}
/**
 * Append a text label to the diagram.
 *
 * @param {number} x - Anchor x position.
 * @param {number} y - Baseline y position.
 * @param {*} s - Text content of the label.
 * @param {Object} [o] - Optional styling; any falsy entry uses its default.
 * @param {string} [o.f] - Font family (default "Archivo").
 * @param {number} [o.w] - Font weight (default 700).
 * @param {number} [o.sz] - Font size (default 15).
 * @param {string} [o.ls] - Letter spacing (default "0").
 * @param {string} [o.a] - text-anchor value (default "start").
 * @param {string} [o.fill] - Fill colour (default INK).
 */
function txt(x, y, s, o) {
  const opts = o || {};
  const attrs = {
    x: x,
    y: y,
    "font-family": opts.f || "Archivo",
    "font-weight": opts.w || 700,
    "font-size": opts.sz || 15,
    "letter-spacing": opts.ls || "0",
    "text-anchor": opts.a || "start",
    fill: opts.fill || INK,
  };
  svg.appendChild(el("text", attrs, s));
}
/**
 * Append a curved arrow from (x1, y1) towards (x2, y2).
 *
 * The shaft is a cubic Bezier whose two control points sit at the horizontal
 * midpoint, so it leaves and arrives horizontally. The shaft stops 11 units
 * short of x2, and a two-stroke open arrowhead is drawn at that point.
 *
 * @param {number} x1 - Start x.
 * @param {number} y1 - Start y.
 * @param {number} x2 - Target x; the tip is drawn at x2 - 11.
 * @param {number} y2 - Target y.
 * @param {string} color - Stroke colour for shaft and head.
 * @param {string} [dash] - stroke-dasharray for the shaft only; "none" when falsy.
 */
function arrow(x1, y1, x2, y2, color, dash) {
  const midX = (x1 + x2) / 2;
  const tipX = x2 - 11;
  const spread = 7;
  const reach = spread + 4;

  const shaft = el("path", {
    d: `M ${x1} ${y1} C ${midX} ${y1}, ${midX} ${y2}, ${tipX} ${y2}`,
    fill: "none",
    stroke: color,
    "stroke-width": 3.5,
    "stroke-linecap": "round",
    "stroke-dasharray": dash || "none",
  });
  svg.appendChild(shaft);

  // Head: two short strokes running back from the tip, one up and one down.
  const head = el("path", {
    d: `M ${tipX} ${y2} l -${reach} -${spread} M ${tipX} ${y2} l -${reach} ${spread}`,
    fill: "none",
    stroke: color,
    "stroke-width": 3.5,
    "stroke-linecap": "round",
  });
  svg.appendChild(head);
}
// ---------- INPUT SOURCES (left) ----------
// Column heading above the source cards.
txt(20, 42, "SOURCES", { w: 700, sz: 14, ls: ".2em", fill: SOFT });

// One card per way of pointing at a model: n is the card title, s its subtitle.
const sources = [
  { n: "gallery name", s: "localai run llama" },
  { n: "huggingface://", s: "hub repo + file" },
  { n: "oci:// · ollama://", s: "registry pull" },
  { n: "manual file / YAML", s: "local model config" },
];

// Card geometry in SVG user units: left edge, width, height, vertical gap, top of first card.
const SX = 24;
const SW = 288;
const SH = 92;
const sGap = 42;
const sTop = 58;

// Top edge of each card; reused later to anchor the arrows leaving the cards.
const srcY = sources.map((_, index) => sTop + index * (SH + sGap));

sources.forEach(({ n, s }, index) => {
  const top = srcY[index];
  shadowRect(SX, top, SW, SH, PAPER2, COLD, 3.5);
  txt(SX + 20, top + 42, n, { f: "Bricolage Grotesque", w: 800, sz: 25, fill: INK });
  txt(SX + 20, top + 72, s, { w: 700, sz: 15, fill: SOFT });
});
// ---------- CONVERGENCE POINT ----------
// Point where the source arrows meet and the pipeline begins.
const convX = 512;
// Vertical centre line of the pipeline.
const convY = 280;

// ---------- PIPELINE (right, single load path) ----------
// Ordered pipeline stages: n is the stage title, s its subtitle.
const stages = [
  { n: "resolve", s: "locate source" },
  { n: "auto-detect", s: "match by format" },
  { n: "load", s: "start process" },
  { n: "serve", s: "ready · OpenAI API" },
];

// Stage box geometry: width, height, horizontal gap, left edge of the first box.
const PW = 200;
const PH = 130;
const pGap = 42;
const pStart = 540;

// Top edge of the boxes, chosen so they are vertically centred on convY.
const pY = convY - PH / 2;

// Left edge of each stage box, spaced one box width plus one gap apart.
const pX = stages.map((_, index) => pStart + index * (PW + pGap));
// connector line behind the pipeline boxes
// Drawn before the boxes so they paint over it; it runs from the convergence
// point to the right edge of the last stage box.
svg.appendChild(el("line", {
  x1: convX,
  y1: convY,
  x2: pX[stages.length - 1] + PW,
  y2: convY,
  stroke: RUSTD,
  "stroke-width": 3.5,
}));

// arrows from each source into the convergence point
// Each arrow leaves the middle of a card's right edge. Only the card's
// top edge is needed, so iterate srcY directly.
srcY.forEach((top) => {
  arrow(SX + SW, top + SH / 2, convX, convY, RUST);
});

// convergence node (small junction)
// Appended after the arrows so the dot covers their overlapping tips.
svg.appendChild(el("circle", {
  cx: convX,
  cy: convY,
  r: 9,
  fill: RUST,
  stroke: INK,
  "stroke-width": 3,
}));
// pipeline stage boxes (emphasis: rust)
// Only the last stage is emphasised: rust fill, paper-coloured title, slightly larger title.
stages.forEach((st, i) => {
  const x = pX[i];
  const emph = i === stages.length - 1;
  shadowRect(x, pY, PW, PH, emph ? RUST : HI, INK, 4);
  txt(x + PW / 2, pY + 58, st.n, {
    f: "Bricolage Grotesque",
    w: 800,
    sz: emph ? 27 : 24,
    a: "middle",
    fill: emph ? PAPER : INK,
  });
  txt(x + PW / 2, pY + 92, st.s, {
    w: 700,
    sz: 15,
    a: "middle",
    fill: emph ? "#F1D9C8" : SOFT,
  });

  // step number badge
  const bw = 34;
  const bh = 26;
  const bx = x + 14;
  const by = pY + 14;
  // The badge is paper-coloured on every stage, so its fill needs no emphasis switch.
  svg.appendChild(el("rect", {
    x: bx,
    y: by,
    width: bw,
    height: bh,
    fill: PAPER,
    stroke: INK,
    "stroke-width": 2,
  }));
  // Badges are numbered from 1; convert explicitly because the value becomes text content.
  txt(bx + bw / 2, by + 19, String(i + 1), {
    f: "Bricolage Grotesque",
    w: 800,
    sz: 16,
    a: "middle",
    fill: RUSTD,
  });
});
// arrows between pipeline stages
// One arrow from the right edge of each box (except the last) to the left edge of the next.
pX.slice(0, stages.length - 1).forEach((left, index) => {
  arrow(left + PW, convY, pX[index + 1], convY, RUSTD);
});

// arrow from convergence node into first stage
// Starts at the junction circle's right edge (its radius is 9).
arrow(convX + 9, convY, pX[0], convY, RUSTD);

// label above pipeline
txt(pStart, pY - 22, "ONE LOAD PATH", { w: 700, sz: 14, ls: ".2em", fill: RUSTD });
</script>
</body>
</html>