Files
neuron/docs/architecture/soma-implementation.html
T
will.anderson a76aaf4831
Deploy Soul to GKE / deploy (push) Failing after 27s
Neuron Soul CI / build (push) Failing after 4m26s
docs: add architecture, R&D, and patent strategy docs
2026-06-10 17:31:07 -05:00

1391 lines
86 KiB
HTML
Raw Blame History

This file contains ambiguous Unicode characters
This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.
<!DOCTYPE html>
<html lang="en">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1">
<title>Soma — AI-Native Cloud Platform · Eyes Only · Neuron Technologies</title>
<link rel="preconnect" href="https://fonts.googleapis.com">
<link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
<link href="https://fonts.googleapis.com/css2?family=Playfair+Display:ital,wght@0,700;1,400;1,700&family=IBM+Plex+Sans:ital,wght@0,400;0,500;0,600;1,400&family=IBM+Plex+Mono:wght@400;500&display=swap" rel="stylesheet">
<style>
/* ── RESET ── */
*,
*::before,
*::after {
  box-sizing: border-box;
  margin: 0;
  padding: 0;
}

/* ── DESIGN TOKENS ──
   Colour families come as a solid value plus translucent tints; the rules in
   this sheet use the -d tints as backgrounds and the -b tints as borders. */
:root {
  --bg:#FAFAF8;
  --bg2:#F0F0EC;
  --card:#FFFFFF;
  --navy:#0052A0;
  --navy-d:rgba(0,82,160,.06);
  --navy-m:rgba(0,82,160,.12);
  --navy-b:rgba(0,82,160,.22);
  --green:#1A7F4B;
  --green-d:rgba(26,127,75,.06);
  --green-b:rgba(26,127,75,.22);
  --amber:#B45309;
  --amber-d:rgba(180,83,9,.06);
  --amber-b:rgba(180,83,9,.22);
  --gold:#8B6914;
  --gold-d:rgba(139,105,20,.07);
  --gold-b:rgba(139,105,20,.25);
  --t1:#0D0D14;
  --t2:#3A3A4A;
  --t3:#6B6B7E;
  --border:rgba(0,0,0,.07);
  --border2:rgba(0,0,0,.13);
  --head:'Playfair Display',Georgia,serif;
  --body:'IBM Plex Sans',system-ui,sans-serif;
  --mono:'IBM Plex Mono','SF Mono',monospace;
}

/* ── PAGE BASE ── */
html {
  scroll-behavior: smooth;
  /* Keep in-page anchor targets clear of the sticky nav (54px when on one row). */
  scroll-padding-top: 72px;
}
body {
  font-family: var(--body);
  background: var(--bg);
  color: var(--t1);
  font-size: 16px;
  line-height: 1.7;
  overflow-x: hidden;
}
/* Fixed, non-interactive 48px grid drawn behind the page content. */
body::before {
  content: '';
  position: fixed;
  inset: 0;
  pointer-events: none;
  z-index: 0;
  background-image: linear-gradient(rgba(0,0,0,.025) 1px,transparent 1px),linear-gradient(90deg,rgba(0,0,0,.025) 1px,transparent 1px);
  background-size: 48px 48px;
}

/* ── TOP NAVIGATION ── */
nav {
  position: sticky;
  top: 0;
  z-index: 100;
  display: flex;
  flex-wrap: wrap;
  align-items: center;
  /* Centre the row(s) vertically now that the bar height is no longer fixed. */
  align-content: center;
  gap: 6px;
  /* min-height instead of height: the links wrap on narrow viewports, and a
     fixed 54px bar let the wrapped rows spill over the page content. */
  min-height: 54px;
  /* Vertical padding only becomes visible once the links wrap; a single row
     still fits inside the 54px minimum. */
  padding: 8px 32px;
  background: rgba(250,250,248,.96);
  -webkit-backdrop-filter: blur(10px);
  backdrop-filter: blur(10px);
  border-bottom: 1px solid var(--border2);
}
.nav-wordmark {
  font-family: var(--mono);
  font-size: .68rem;
  font-weight: 500;
  letter-spacing: .18em;
  color: var(--t1);
  text-transform: uppercase;
  margin-right: auto; /* pushes the links and badge to the right edge */
}
.nav-link {
  font-family: var(--mono);
  font-size: .52rem;
  letter-spacing: .12em;
  text-transform: uppercase;
  color: var(--t3);
  padding: 4px 10px;
  border-radius: 4px;
  cursor: pointer;
  transition: all .2s;
  text-decoration: none;
  border: 1px solid transparent; /* reserves space so hover does not shift layout */
}
.nav-link:hover,
.nav-link.active {
  color: var(--navy);
  background: var(--navy-d);
  border-color: var(--navy-b);
}
/* Separate rule so browsers without :focus-visible still apply the hover/active rule above. */
.nav-link:focus-visible {
  color: var(--navy);
  background: var(--navy-d);
  border-color: var(--navy-b);
  outline: 2px solid var(--navy);
  outline-offset: 2px;
}
.nav-badge {
  font-family: var(--mono);
  font-size: .54rem;
  letter-spacing: .14em;
  text-transform: uppercase;
  background: rgba(139,105,20,.08);
  border: 1px solid var(--gold-b);
  color: var(--gold);
  padding: 3px 10px;
  border-radius: 99px;
  margin-left: 8px;
}

/* ── PAGE COLUMN ── */
.doc-page {
  max-width: 860px;
  margin: 0 auto;
  padding: 72px 48px 120px;
  position: relative;
  z-index: 1; /* sits above the body::before grid */
}

/* ── REVEAL ANIMATION ──
   Elements start transparent and shifted down; they fade/slide in once the
   `visible` class is added (whatever adds it lives outside this stylesheet). */
.reveal {
  opacity: 0;
  transform: translateY(28px);
  transition: opacity .7s cubic-bezier(.16,1,.3,1),transform .7s cubic-bezier(.16,1,.3,1);
}
.reveal.visible {
  opacity: 1;
  transform: translateY(0);
}
.reveal-delay-1 { transition-delay: 80ms; }
.reveal-delay-2 { transition-delay: 160ms; }
.reveal-delay-3 { transition-delay: 240ms; }

/* Respect the user's reduced-motion preference: no smooth scrolling, and
   reveal content is shown immediately instead of animating in. */
@media (prefers-reduced-motion: reduce) {
  html { scroll-behavior: auto; }
  .reveal {
    opacity: 1;
    transform: none;
    transition: none;
  }
}
/* ── MASTHEAD ──
   Centred title block framed by a heavy top rule and a light bottom rule. */
.masthead {
  text-align: center;
  border-top: 3px solid var(--t1);
  border-bottom: 1px solid var(--border2);
  padding: 36px 0 32px;
  margin-bottom: 60px;
}
.masthead .dateline {
  font-family: var(--mono);
  font-size: .56rem;
  letter-spacing: .20em;
  text-transform: uppercase;
  color: var(--t3);
  margin-bottom: 22px;
}
.masthead .eyebrow {
  font-family: var(--mono);
  font-size: .62rem;
  letter-spacing: .18em;
  text-transform: uppercase;
  color: var(--navy);
  margin-bottom: 14px;
  font-weight: 500;
}
.masthead h1 {
  font-family: var(--head);
  font-size: 2.8rem;
  font-weight: 700;
  line-height: 1.1;
  margin-bottom: 16px;
}
.masthead h1 em {
  font-style: italic;
  color: var(--navy);
}
.masthead .subtitle {
  font-size: .95rem;
  color: var(--t3);
  max-width: 540px;
  margin: 0 auto;
  line-height: 1.7;
  font-style: italic;
}
/* Gold classification pill shown above the eyebrow. */
.masthead .class-badge {
  display: inline-block;
  font-family: var(--mono);
  font-size: .52rem;
  letter-spacing: .18em;
  text-transform: uppercase;
  background: rgba(139,105,20,.1);
  border: 1px solid var(--gold-b);
  color: var(--gold);
  padding: 4px 14px;
  border-radius: 99px;
  margin-bottom: 18px;
}
/* ── SECTION HEADERS & BODY TEXT ──
   h2s inside the page column are small mono labels with an underline rule. */
.doc-page h2 {
  font-family: var(--mono);
  font-size: .56rem;
  font-weight: 500;
  letter-spacing: .20em;
  text-transform: uppercase;
  color: var(--navy);
  margin: 60px 0 20px;
  padding-bottom: 10px;
  border-bottom: 1px solid var(--border2);
}
p {
  margin-bottom: .9em;
  font-size: .95rem;
  color: var(--t2);
  line-height: 1.8;
}
p strong {
  color: var(--t1);
  font-weight: 600;
}
/* ── CALLOUTS ──
   Default callout is navy with a left accent bar; .amber and .green recolour it,
   .dark swaps it for a full dark card with a decorative opening quote mark. */
.callout {
  border-left: 3px solid var(--navy);
  padding: 16px 22px;
  margin: 20px 0;
  background: var(--navy-d);
  border-radius: 0 12px 12px 0;
  font-family: var(--head);
  font-style: italic;
  font-size: 1.02rem;
  line-height: 1.65;
  color: var(--t1);
}
.callout.amber {
  border-left-color: var(--amber);
  background: var(--amber-d);
}
.callout.green {
  border-left-color: var(--green);
  background: var(--green-d);
}
.callout.dark {
  position: relative;
  border-left: none;
  background: #0D0D14;
  color: rgba(255,255,255,.85);
  border-radius: 12px;
  padding: 32px 36px;
  margin: 32px 0;
  overflow: hidden;
}
/* Oversized, nearly transparent left double quotation mark (U+201C). */
.callout.dark::before {
  content: '\201C';
  position: absolute;
  top: -12px;
  left: 16px;
  font-family: var(--head);
  font-size: 8rem;
  line-height: 1;
  color: rgba(255,255,255,.06);
  pointer-events: none;
}
.callout.dark p {
  color: rgba(255,255,255,.75);
  font-family: var(--head);
  font-style: italic;
  font-size: 1.1rem;
  line-height: 1.65;
  margin: 0;
}
.callout.dark strong { color: rgba(255,255,255,.95); }
/* ── PULL QUOTE ──
   Centred quotation between a heavy top rule and a light bottom rule. */
.pull-quote {
  border-top: 3px solid var(--t1);
  border-bottom: 1px solid var(--border2);
  padding: 44px 0;
  margin: 60px 0 48px;
  text-align: center;
}
.pull-quote blockquote {
  font-family: var(--head);
  font-size: 1.5rem;
  font-style: italic;
  line-height: 1.5;
  color: var(--t1);
  max-width: 600px;
  margin: 0 auto 20px;
}
.pull-quote cite {
  font-family: var(--mono);
  font-size: .54rem;
  letter-spacing: .16em;
  text-transform: uppercase;
  color: var(--t3);
}
/* ── SERVICE CATALOG ──
   Category pill, two-column card grid, and per-category colour modifiers. */
.catalog-category { margin: 32px 0 8px; }

/* Category pill: shared shape, then one colour scheme per category. */
.cat-label {
  font-family: var(--mono);
  font-size: .52rem;
  letter-spacing: .18em;
  text-transform: uppercase;
  padding: 3px 12px;
  border-radius: 99px;
  display: inline-block;
  margin-bottom: 14px;
}
.cat-label.ai {
  background: var(--navy-d);
  border: 1px solid var(--navy-b);
  color: var(--navy);
}
.cat-label.compute {
  background: var(--amber-d);
  border: 1px solid var(--amber-b);
  color: var(--amber);
}
.cat-label.network {
  background: rgba(130,40,180,.07);
  border: 1px solid rgba(130,40,180,.22);
  color: #7828B4;
}
.cat-label.data {
  background: var(--green-d);
  border: 1px solid var(--green-b);
  color: var(--green);
}
.cat-label.security {
  background: rgba(0,0,0,.05);
  border: 1px solid rgba(0,0,0,.15);
  color: var(--t1);
}

/* Card grid. */
.service-grid {
  display: grid;
  grid-template-columns: 1fr 1fr;
  gap: 10px;
  margin-bottom: 20px;
}
.svc-card {
  background: var(--card);
  border: 1px solid var(--border2);
  border-radius: 10px;
  padding: 16px 18px;
  transition: box-shadow .2s;
}
.svc-card:hover { box-shadow: 0 4px 16px rgba(0,0,0,.06); }

/* Card title: colour follows the category modifier. */
.svc-name {
  font-family: var(--mono);
  font-size: .54rem;
  letter-spacing: .14em;
  text-transform: uppercase;
  margin-bottom: 5px;
  font-weight: 500;
}
.svc-name.ai { color: var(--navy); }
.svc-name.compute { color: var(--amber); }
.svc-name.network { color: #7828B4; }
.svc-name.data { color: var(--green); }
.svc-name.security { color: var(--t1); }

.svc-body {
  font-size: .82rem;
  color: var(--t2);
  line-height: 1.6;
}

/* Small tag under the card body; .differentiator switches it from navy to gold. */
.svc-badge {
  font-family: var(--mono);
  font-size: .46rem;
  letter-spacing: .1em;
  text-transform: uppercase;
  padding: 2px 7px;
  border-radius: 4px;
  background: var(--navy-d);
  border: 1px solid var(--navy-b);
  color: var(--navy);
  display: inline-block;
  margin-top: 6px;
}
.svc-badge.differentiator {
  background: var(--gold-d);
  border-color: var(--gold-b);
  color: var(--gold);
}
/* ── ARCHITECTURE / VBD DIAGRAM ──
   Card frame and caption for the inline diagram. */
.arch-diagram {
  background: var(--card);
  border: 1px solid var(--border2);
  border-radius: 16px;
  padding: 28px;
  margin: 24px 0;
  overflow: hidden;
}
.arch-diagram-title {
  font-family: var(--mono);
  font-size: .54rem;
  letter-spacing: .18em;
  text-transform: uppercase;
  color: var(--t3);
  margin-bottom: 20px;
}
/* ── PHASE TIMELINE ──
   Vertically stacked cards that share borders; a card's body is collapsed
   (max-height 0) until the card carries the `open` class. */
.phase-timeline {
  margin: 28px 0;
  display: flex;
  flex-direction: column;
  gap: 0;
}
/* Each card drops its bottom border so adjacent cards share a single line;
   only the last card restores it. Outer corners are rounded on first/last. */
.phase-card {
  border: 1px solid var(--border2);
  border-radius: 0;
  background: var(--card);
  overflow: hidden;
  border-bottom: none;
}
.phase-card:first-child { border-radius: 14px 14px 0 0; }
.phase-card:last-child {
  border-radius: 0 0 14px 14px;
  border-bottom: 1px solid var(--border2);
}

/* Header row (styled as a click target). */
.phase-header {
  padding: 20px 24px;
  display: flex;
  align-items: flex-start;
  gap: 18px;
  cursor: pointer;
  user-select: none;
  transition: background .2s;
}
.phase-header:hover { background: var(--navy-d); }
.phase-num {
  font-family: var(--mono);
  font-size: 1.6rem;
  font-weight: 500;
  line-height: 1;
  color: rgba(0,0,0,.1);
  min-width: 40px;
  flex-shrink: 0;
}
.phase-meta { flex: 1; }
.phase-label-row {
  display: flex;
  align-items: center;
  gap: 10px;
  margin-bottom: 5px;
  flex-wrap: wrap;
}
.phase-tag {
  font-family: var(--mono);
  font-size: .48rem;
  letter-spacing: .12em;
  text-transform: uppercase;
  color: var(--t3);
}
.phase-timing {
  font-family: var(--mono);
  font-size: .5rem;
  letter-spacing: .12em;
  text-transform: uppercase;
  padding: 2px 9px;
  border-radius: 99px;
  background: var(--bg2);
  border: 1px solid var(--border2);
  color: var(--t3);
}

/* Status pill: shared shape plus one colour scheme per status modifier. */
.phase-status-badge {
  font-family: var(--mono);
  font-size: .5rem;
  letter-spacing: .12em;
  text-transform: uppercase;
  padding: 2px 9px;
  border-radius: 99px;
}
.phase-status-badge.foundation {
  background: var(--navy-d);
  border: 1px solid var(--navy-b);
  color: var(--navy);
}
.phase-status-badge.expansion {
  background: var(--amber-d);
  border: 1px solid var(--amber-b);
  color: var(--amber);
}
.phase-status-badge.scale {
  background: var(--green-d);
  border: 1px solid var(--green-b);
  color: var(--green);
}
.phase-status-badge.compound {
  background: rgba(0,0,0,.06);
  border: 1px solid rgba(0,0,0,.18);
  color: var(--t1);
}

.phase-title {
  font-family: var(--head);
  font-size: 1.2rem;
  font-weight: 700;
  color: var(--t1);
  margin-bottom: 3px;
}
.phase-summary {
  font-size: .83rem;
  color: var(--t3);
  line-height: 1.5;
}
.phase-chevron {
  font-size: .7rem;
  color: var(--t3);
  transition: transform .3s;
  flex-shrink: 0;
  margin-top: 6px;
}

/* Open state: flip the chevron, tint the header, let the body expand. */
.phase-card.open .phase-chevron { transform: rotate(180deg); }
.phase-card.open .phase-header { background: var(--navy-d); }
.phase-body {
  max-height: 0;
  overflow: hidden;
  transition: max-height .5s cubic-bezier(.16,1,.3,1);
}
.phase-card.open .phase-body { max-height: 2400px; }
.phase-content {
  padding: 0 24px 24px;
  background: var(--card);
  border-top: 1px solid var(--border);
}
.phase-content p {
  font-size: .88rem;
  margin-bottom: .8em;
}
/* ── MILESTONE LIST ──
   Column of icon + text rows on a tinted background. */
.milestone-list {
  margin: 14px 0;
  display: flex;
  flex-direction: column;
  gap: 7px;
}
.ms-item {
  display: flex;
  gap: 12px;
  align-items: flex-start;
  padding: 10px 14px;
  border-radius: 8px;
  background: var(--bg2);
  border: 1px solid var(--border);
}
.ms-icon {
  font-size: .85rem;
  flex-shrink: 0;
  margin-top: 1px;
}
.ms-text {
  font-size: .84rem;
  color: var(--t2);
  line-height: 1.55;
  flex: 1;
}
.ms-text strong { color: var(--t1); }
/* ── TECH SPEC ACCORDION ──
   Same collapse mechanism as the phase cards: the body stays at max-height 0
   until the block carries the `open` class. */
.spec-block {
  border: 1px solid var(--border2);
  border-radius: 12px;
  margin: 14px 0;
  overflow: hidden;
}
.spec-header {
  padding: 18px 22px;
  display: flex;
  align-items: center;
  gap: 14px;
  cursor: pointer;
  user-select: none;
  transition: background .2s;
  background: var(--card);
}
.spec-header:hover { background: var(--navy-d); }
.spec-title {
  font-family: var(--mono);
  font-size: .56rem;
  letter-spacing: .16em;
  text-transform: uppercase;
  color: var(--t1);
  font-weight: 500;
  flex: 1;
}
.spec-chevron {
  font-size: .7rem;
  color: var(--t3);
  transition: transform .3s;
}

/* Open state. */
.spec-block.open .spec-chevron { transform: rotate(180deg); }
.spec-block.open .spec-header { background: var(--navy-d); }
.spec-body {
  max-height: 0;
  overflow: hidden;
  transition: max-height .5s cubic-bezier(.16,1,.3,1);
}
.spec-block.open .spec-body { max-height: 2400px; }
.spec-content {
  padding: 0 22px 22px;
  background: var(--card);
  border-top: 1px solid var(--border);
}
.spec-content p {
  font-size: .87rem;
  margin-bottom: .8em;
}
/* ── CODE / MONO BLOCK ──
   Dark, horizontally scrollable block that preserves whitespace, plus four
   token-colour helper classes. */
.code-block {
  font-family: var(--mono);
  font-size: .78rem;
  line-height: 1.7;
  background: var(--t1);
  color: rgba(255,255,255,.8);
  border-radius: 10px;
  padding: 20px 24px;
  margin: 14px 0;
  overflow-x: auto;
  white-space: pre;
}
.code-block .kw { color: #7CC8FF; }
.code-block .cm {
  color: rgba(255,255,255,.35);
  font-style: italic;
}
.code-block .val { color: #A8E6A3; }
.code-block .str { color: #FFD180; }
/* ── COMPONENT GRID ──
   Two-column cards; the stable / variable / dynamic modifiers recolour the
   card (green / navy / amber) and its title. */
.comp-grid {
  display: grid;
  grid-template-columns: 1fr 1fr;
  gap: 10px;
  margin: 16px 0;
}
.comp-card {
  border-radius: 10px;
  padding: 14px 16px;
  border: 1px solid var(--border2);
  background: var(--bg2);
}
.comp-name {
  font-family: var(--mono);
  font-size: .52rem;
  letter-spacing: .14em;
  text-transform: uppercase;
  margin-bottom: 5px;
  font-weight: 500;
}
.comp-body {
  font-size: .81rem;
  color: var(--t2);
  line-height: 1.6;
}

.comp-card.stable .comp-name { color: var(--green); }
.comp-card.stable {
  border-color: var(--green-b);
  background: var(--green-d);
}
.comp-card.variable .comp-name { color: var(--navy); }
.comp-card.variable {
  border-color: var(--navy-b);
  background: var(--navy-d);
}
.comp-card.dynamic .comp-name { color: var(--amber); }
.comp-card.dynamic {
  border-color: var(--amber-b);
  background: var(--amber-d);
}
/* ── OPERATOR TABLE ──
   Full-width table with mono column headers and row hover highlight, followed
   by the small coloured tag pills. */
.op-table {
  width: 100%;
  border-collapse: collapse;
  margin: 16px 0;
  font-size: .83rem;
}
.op-table th {
  font-family: var(--mono);
  font-size: .5rem;
  letter-spacing: .14em;
  text-transform: uppercase;
  color: var(--t3);
  font-weight: 500;
  padding: 10px 14px;
  border-bottom: 2px solid var(--border2);
  text-align: left;
}
.op-table td {
  padding: 11px 14px;
  border-bottom: 1px solid var(--border);
  color: var(--t2);
  vertical-align: top;
  line-height: 1.5;
}
.op-table tr:last-child td { border-bottom: none; }
.op-table tr:hover td { background: var(--bg2); }

/* Tag pills: shared shape, then navy / green / amber colour variants. */
.tag-pill {
  font-family: var(--mono);
  font-size: .46rem;
  letter-spacing: .1em;
  text-transform: uppercase;
  padding: 2px 7px;
  border-radius: 4px;
  display: inline-block;
  white-space: nowrap;
}
.tag-pill.navy {
  background: var(--navy-d);
  border: 1px solid var(--navy-b);
  color: var(--navy);
}
.tag-pill.green {
  background: var(--green-d);
  border: 1px solid var(--green-b);
  color: var(--green);
}
.tag-pill.amber {
  background: var(--amber-d);
  border: 1px solid var(--amber-b);
  color: var(--amber);
}
/* ── NODE STATE FLOW ──
   Wrapping row of state chips separated by arrows, inside a card. */
.state-flow {
  display: flex;
  align-items: center;
  gap: 6px;
  flex-wrap: wrap;
  margin: 16px 0;
  padding: 20px 24px;
  background: var(--card);
  border: 1px solid var(--border2);
  border-radius: 12px;
}
.state-node {
  font-family: var(--mono);
  font-size: .54rem;
  letter-spacing: .1em;
  text-transform: uppercase;
  padding: 7px 14px;
  border-radius: 8px;
  border: 1px solid var(--border2);
  background: var(--bg2);
  color: var(--t2);
}
.state-node.active {
  background: var(--navy-d);
  border-color: var(--navy-b);
  color: var(--navy);
}
.state-node.warn {
  background: var(--amber-d);
  border-color: var(--amber-b);
  color: var(--amber);
}
.state-node.end {
  background: rgba(0,0,0,.06);
  border-color: rgba(0,0,0,.18);
  color: var(--t1);
}
.state-arrow {
  color: var(--t3);
  font-size: .75rem;
  flex-shrink: 0;
}
/* ── COMPETITIVE POSITION ──
   Three-column card grid; .highlight tints one card navy. */
.position-grid {
  display: grid;
  grid-template-columns: 1fr 1fr 1fr;
  gap: 10px;
  margin: 20px 0;
}
.pos-card {
  background: var(--card);
  border: 1px solid var(--border2);
  border-radius: 10px;
  padding: 18px;
}
.pos-label {
  font-family: var(--mono);
  font-size: .5rem;
  letter-spacing: .14em;
  text-transform: uppercase;
  color: var(--t3);
  margin-bottom: 8px;
}
.pos-title {
  font-family: var(--head);
  font-size: .95rem;
  font-weight: 700;
  color: var(--t1);
  margin-bottom: 6px;
  line-height: 1.3;
}
.pos-body {
  font-size: .8rem;
  color: var(--t2);
  line-height: 1.6;
}
.pos-card.highlight {
  border-color: var(--navy-b);
  background: var(--navy-d);
}
.pos-card.highlight .pos-label { color: var(--navy); }
/* ── FIVE YEAR ARC ──
   Vertical timeline: a navy-to-green gradient rail drawn by ::before, with a
   coloured dot per item. */
.arc-timeline {
  margin: 24px 0;
  position: relative;
  padding-left: 28px;
}
.arc-timeline::before {
  content: '';
  position: absolute;
  left: 6px;
  top: 8px;
  bottom: 8px;
  width: 2px;
  background: linear-gradient(to bottom,var(--navy),var(--green));
}
.arc-item {
  position: relative;
  margin-bottom: 28px;
  padding-left: 24px;
}
/* Dot defaults to navy; .mid and .end recolour it. */
.arc-dot {
  position: absolute;
  left: -22px;
  top: 4px;
  width: 12px;
  height: 12px;
  border-radius: 50%;
  background: var(--navy);
  border: 2px solid var(--bg);
  flex-shrink: 0;
}
.arc-dot.mid { background: var(--amber); }
.arc-dot.end { background: var(--green); }
.arc-year {
  font-family: var(--mono);
  font-size: .5rem;
  letter-spacing: .16em;
  text-transform: uppercase;
  color: var(--t3);
  margin-bottom: 4px;
}
.arc-headline {
  font-family: var(--head);
  font-size: 1.1rem;
  font-weight: 700;
  color: var(--t1);
  margin-bottom: 6px;
}
.arc-body {
  font-size: .84rem;
  color: var(--t2);
  line-height: 1.65;
}
/* ── FOOTER ── */
.footer-block {
  font-family: var(--mono);
  font-size: .56rem;
  letter-spacing: .12em;
  text-transform: uppercase;
  color: var(--t3);
  text-align: center;
  line-height: 2;
  margin-top: 80px;
  padding-top: 32px;
  border-top: 1px solid var(--border2);
}

/* ── NARROW VIEWPORTS (≤ 700px) ──
   Tighter page padding, smaller title, single-column grids, compact phase header. */
@media (max-width: 700px) {
  .doc-page { padding: 48px 20px 80px; }
  .masthead h1 { font-size: 2rem; }
  .service-grid { grid-template-columns: 1fr; }
  .comp-grid { grid-template-columns: 1fr; }
  .position-grid { grid-template-columns: 1fr; }
  .phase-header { gap: 12px; }
  .phase-num {
    font-size: 1.2rem;
    min-width: 28px;
  }
}
</style>
</head>
<body>
<nav>
<span class="nav-wordmark">Neuron · Soma</span>
<a class="nav-link active" href="#executive-summary">Summary</a>
<a class="nav-link" href="#strategy">Strategy</a>
<a class="nav-link" href="#catalog">Services</a>
<a class="nav-link" href="#architecture">Architecture</a>
<a class="nav-link" href="#phases">Phases</a>
<a class="nav-link" href="#specs">Tech Spec</a>
<a class="nav-link" href="#competitive">Position</a>
<a class="nav-link" href="#operations">Operations</a>
<a class="nav-link" href="#arc">5-Year Arc</a>
<span class="nav-badge">Eyes Only · Confidential</span>
</nav>
<div class="doc-page">
<div class="masthead reveal">
<div class="dateline">April 25, 2026 · Eyes Only · Confidential · Internal Use Only</div>
<div class="class-badge">Eyes Only — Confidential</div>
<div class="eyebrow">Soma · AI-Native Cloud Platform</div>
<h1>Full <em>Implementation</em> Plan</h1>
<p class="subtitle">Six phases. One substrate. The complete build plan for Soma — from internal inference router to the infrastructure layer that quietly consumes its providers.</p>
</div>
<!-- ── EXECUTIVE SUMMARY ── -->
<section id="executive-summary">
<h2>Executive Summary</h2>
<p>Soma is the cloud platform Neuron Technologies is building — not as a startup play to compete with AWS on price, but as <strong>the infrastructure substrate the entire Neuron ecosystem runs on</strong>. It will scale into a platform offered to external customers and, eventually, bring its providers into acquisition conversations in which they depend on Soma's spend.</p>
<p>The premise is simple and has almost no precedent: an AI-native cloud where the operator is an AI, the routing intelligence is patented, and the economics improve automatically as open-source models improve and GPU costs fall. Soma doesn't have human ops engineers. Neuron runs it.</p>
<div class="callout dark">
<p>The cloud providers will see growing revenue. Their customers will come to us. By the time anyone understands what happened, Soma is the largest single customer of at least one provider region — and the negotiating table looks very different from that chair.</p>
</div>
<p>In the near term, Soma's primary value is <strong>internal</strong>: running Neuron's inference at effectively zero marginal cost because Soma is the infrastructure and Neuron is the AI that manages it. Every Neuron AI license sold has a delivery cost that approaches zero. That's the business model in one sentence.</p>
<p>The 5-year arc: internal-only substrate → multi-provider abstraction → external customer platform → significant provider spend (leverage building) → data center acquisitions → acquisition offers from leverage, not desperation.</p>
<div class="callout">
Soma's moat is not the models. Models are commodities. The moat is the <strong>backplane</strong> — the routing intelligence, the provider abstraction, the Neuron operator interface — all protected by patents before the architecture is disclosed.
</div>
</section>
<!-- ── STRATEGIC CONTEXT ── -->
<section id="strategy">
<h2>Strategic Context</h2>
<p>The cloud industry's structural weakness is that every major provider depends on growing their retail customer base. If a sufficiently large customer routes all new workloads through a single abstraction layer — one the provider can't see inside — the provider loses the direct relationship, the usage data, and eventually the retail customers who follow the abstraction.</p>
<p><strong>The consumption strategy has four phases, and providers are participants in all of them without knowing it:</strong></p>
<div class="callout dark">
<p><strong>Phase one:</strong> Soma runs on provider infrastructure. They see growing revenue. Customers sign NDAs. They don't disclose where Soma runs. Providers don't know what's happening inside Soma's abstraction — they see API calls and billing.<br><br>
<strong>Phase two:</strong> Soma grows. Provider spend grows. Anti-concentration rules cap every provider at 60% — they all see healthy revenue but none sees the full picture.<br><br>
<strong>Phase three:</strong> Physical data centers, acquired quietly. Unglamorous facilities, not headlines. Neuron manages them. Cost per compute unit collapses.<br><br>
<strong>Phase four:</strong> Providers can't afford to lose Soma's spend. Acquisition offers arrive, or Soma makes them. Either way, the negotiating position is leverage — not supplication.</p>
</div>
<p>The cover story is completely true and reveals nothing: "Our cloud spend is enormous." Yes. That's correct. That's all they get to know.</p>
<p>Meanwhile, the Dharma R&D lab continuously widens the capability gap. Every six months that Soma runs, the moat deepens: more patent coverage, more routing intelligence, more operational data that trains better cost optimization. The compounding is structural.</p>
<div class="callout green">
Why this works at all: Neuron (the AI) manages Soma operationally. No human ops team. Operational costs are near zero. Open-source model improvements and falling GPU costs improve Soma's economics automatically — without any action from us. The flywheel self-accelerates.
</div>
</section>
<!-- ── PULL QUOTE ── -->
<div class="pull-quote reveal">
<blockquote>"The intelligence is in the backplane, not the models. The backplane is ours."</blockquote>
<cite>Soma Architecture Principle · Internal</cite>
</div>
<!-- ── SERVICE CATALOG ── -->
<section id="catalog">
<h2>Full Service Catalog</h2>
<p>Soma offers a complete cloud platform. Services are organized by category. AI-native services are Soma's primary differentiator — these are not retrofitted onto a general-purpose cloud. They are the reason Soma exists.</p>
<!-- AI Services -->
<div class="catalog-category">
<div class="cat-label ai">AI-Native Services</div>
<div class="service-grid">
<div class="svc-card">
<div class="svc-name ai">Inference Router</div>
<div class="svc-body">Intelligent LLM request routing across three compute tiers. Low (8B models, ~$0.40/hr), Medium (13–34B, balanced), High (70B+, ~$1.75/hr). Deterministic routing tree — every decision is auditable.</div>
<div class="svc-badge differentiator">Core Differentiator</div>
</div>
<div class="svc-card">
<div class="svc-name ai">Image Generation</div>
<div class="svc-body">Dedicated compute for image workloads. 10 checkpoint models including lustify, juggernaut, flux, illustrious. Intelligent LoRA selection via LLM reasoning. SD Forge backend.</div>
<div class="svc-badge">AI-Native</div>
</div>
<div class="svc-card">
<div class="svc-name ai">Video Generation</div>
<div class="svc-body">SVD XT on dedicated GPU. Separate from inference pool — video workloads have distinct latency profiles and memory requirements.</div>
<div class="svc-badge">AI-Native</div>
</div>
<div class="svc-card">
<div class="svc-name ai">Model Registry</div>
<div class="svc-body">Versioned catalog of all available models with routing metadata, capability tags, cost profiles, and availability status. The authoritative source the Router queries.</div>
<div class="svc-badge">Core Infrastructure</div>
</div>
<div class="svc-card">
<div class="svc-name ai">Pipeline Engine</div>
<div class="svc-body">22-step async pipeline system inherited from Pantheon conductor. Event-driven, step-level observability, dead-letter handling, priority queues.</div>
<div class="svc-badge differentiator">Core Differentiator</div>
</div>
<div class="svc-card">
<div class="svc-name ai">AI Workload Environments</div>
<div class="svc-body">Four environment profiles: <strong>Studio</strong> (full creative suite), <strong>Mini</strong> (lightweight inference), <strong>Crucible</strong> (H200-scale training/merging), <strong>Production</strong> (always-on routed inference).</div>
<div class="svc-badge differentiator">Core Differentiator</div>
</div>
</div>
</div>
<!-- Compute -->
<div class="catalog-category">
<div class="cat-label compute">Compute</div>
<div class="service-grid">
<div class="svc-card">
<div class="svc-name compute">Containers</div>
<div class="svc-body">Docker-compatible container deployment to the multi-provider node pool. Soma selects the optimal node — provider, region, and tier — transparently.</div>
</div>
<div class="svc-card">
<div class="svc-name compute">Functions</div>
<div class="svc-body">Serverless, event-triggered execution. Scales to zero between invocations. Ideal for webhook handlers, background jobs, and lightweight data processing.</div>
</div>
<div class="svc-card">
<div class="svc-name compute">VMs</div>
<div class="svc-body">Full virtual machines for workloads that need dedicated isolation, specific kernel versions, or persistent state that containers don't suit.</div>
</div>
<div class="svc-card">
<div class="svc-name compute">GPU Instances</div>
<div class="svc-body">First-class GPU allocation. Tier-aware provisioning — the right GPU for the job, across RunPod, Legion, or cloud provider spot pools, without the customer specifying provider.</div>
</div>
</div>
</div>
<!-- Networking -->
<div class="catalog-category">
<div class="cat-label network">Networking</div>
<div class="service-grid">
<div class="svc-card">
<div class="svc-name network">Load Balancers</div>
<div class="svc-body">HTTP/HTTPS with health checks, SSL termination, weighted routing, and sticky sessions. Provider-agnostic — the same config works regardless of where the backends run.</div>
</div>
<div class="svc-card">
<div class="svc-name network">API Gateway</div>
<div class="svc-body">AI-native: semantic routing, intent-based rate limiting, auth, versioning, usage analytics. Not a generic proxy — understands the shape of AI workloads.</div>
<div class="svc-badge differentiator">AI-Native</div>
</div>
<div class="svc-card">
<div class="svc-name network">DNS Management</div>
<div class="svc-body">One zone, works across all providers and regions. Customer configures DNS once — Soma handles propagation and failover as backends move.</div>
</div>
<div class="svc-card">
<div class="svc-name network">VPC / Private Networks</div>
<div class="svc-body">Spans providers transparently. Customer-isolated. Private traffic between Soma services never traverses the public internet.</div>
</div>
<div class="svc-card">
<div class="svc-name network">Firewall</div>
<div class="svc-body">Rules defined once, enforced everywhere. Soma translates declarative firewall config to provider-native rules — AWS security groups, GCP firewall rules, etc.</div>
</div>
<div class="svc-card">
<div class="svc-name network">CDN</div>
<div class="svc-body">Edge caching and asset delivery. Tightly integrated with Soma Object Storage — assets uploaded there are automatically available at edge.</div>
</div>
</div>
</div>
<!-- Data -->
<div class="catalog-category">
<div class="cat-label data">Data</div>
<div class="service-grid">
<div class="svc-card">
<div class="svc-name data">Object Storage</div>
<div class="svc-body">S3/R2-compatible blob storage. Model weights, artifacts, training datasets, generated assets. Cryptographically separated per customer namespace.</div>
</div>
<div class="svc-card">
<div class="svc-name data">Managed Databases</div>
<div class="svc-body">Postgres and Redis, managed. Automated backups, HA configuration, point-in-time recovery. Customer doesn't manage the underlying cluster.</div>
</div>
<div class="svc-card">
<div class="svc-name data">Block Storage</div>
<div class="svc-body">Persistent volumes for containers and VMs. Provider-agnostic — a volume provisioned against a Legion node looks identical to one on AWS.</div>
</div>
<div class="svc-card">
<div class="svc-name data">Message Queues</div>
<div class="svc-body">Async job processing with dead letter queues, priority queues, and visibility timeouts. Foundation of the Pipeline Engine's step execution model.</div>
</div>
</div>
</div>
<!-- Security -->
<div class="catalog-category">
<div class="cat-label security">Security &amp; Identity</div>
<div class="service-grid">
<div class="svc-card">
<div class="svc-name security">Secrets Management</div>
<div class="svc-body">Vault-backed, auto-rotated, customer-isolated. No customer ever touches another's secrets namespace. The same secret delivery mechanism Neuron itself uses.</div>
</div>
<div class="svc-card">
<div class="svc-name security">API Keys</div>
<div class="svc-body">Scoped, revocable, usage-tracked. Every API key is bound to a customer namespace and a permission scope — no ambient authority.</div>
</div>
<div class="svc-card">
<div class="svc-name security">IAM</div>
<div class="svc-body">Role-based access control, team management, audit logs. Every action through Soma is attributed, logged, and queryable.</div>
</div>
<div class="svc-card">
<div class="svc-name security">Customer Isolation</div>
<div class="svc-body">Hard multi-tenancy: separate Vault namespaces, cryptographically separated storage buckets, VPC-level network isolation. Enforced at the infrastructure layer, not application logic.</div>
<div class="svc-badge differentiator">Architectural Property</div>
</div>
</div>
</div>
</section>
<!-- ── ARCHITECTURE ── -->
<section id="architecture">
<h2>Architecture — Volatility-Based Decomposition</h2>
<p>Soma's architecture is organized by <strong>volatility tier</strong> — how frequently a component changes. Stable components define the contracts. Variable components implement the policies. Dynamic components reflect live state. This decomposition keeps the stable API surface clean while allowing aggressive iteration on the components that need to evolve.</p>
<div class="arch-diagram reveal">
<div class="arch-diagram-title">Soma System Diagram — VBD Volatility Swim Lanes</div>
<svg viewBox="0 0 800 420" xmlns="http://www.w3.org/2000/svg" style="width:100%;height:auto;display:block">
<!-- Background lanes -->
<rect x="0" y="0" width="800" height="420" rx="8" fill="#F8F8F6"/>
<!-- Lane: Dynamic (top) -->
<rect x="10" y="10" width="780" height="118" rx="6" fill="rgba(180,83,9,.05)" stroke="rgba(180,83,9,.22)" stroke-width="1"/>
<text x="20" y="28" font-family="'IBM Plex Mono',monospace" font-size="9" fill="#B45309" letter-spacing="2">DYNAMIC — continuously changing</text>
<!-- Dynamic components -->
<rect x="20" y="36" width="155" height="82" rx="6" fill="rgba(180,83,9,.08)" stroke="rgba(180,83,9,.3)" stroke-width="1"/>
<text x="30" y="55" font-family="'IBM Plex Mono',monospace" font-size="8" fill="#B45309" letter-spacing="1">CONTROL PLANE</text>
<text x="30" y="70" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Live node state</text>
<text x="30" y="83" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Health &amp; capacity</text>
<text x="30" y="96" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Fleet composition</text>
<rect x="185" y="36" width="155" height="82" rx="6" fill="rgba(180,83,9,.08)" stroke="rgba(180,83,9,.3)" stroke-width="1"/>
<text x="195" y="55" font-family="'IBM Plex Mono',monospace" font-size="8" fill="#B45309" letter-spacing="1">COST ORACLE</text>
<text x="195" y="70" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Real-time pricing</text>
<text x="195" y="83" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">All providers</text>
<text x="195" y="96" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">60s poll + cache</text>
<rect x="350" y="36" width="155" height="82" rx="6" fill="rgba(180,83,9,.08)" stroke="rgba(180,83,9,.3)" stroke-width="1"/>
<text x="360" y="55" font-family="'IBM Plex Mono',monospace" font-size="8" fill="#B45309" letter-spacing="1">ORCHESTRATOR</text>
<text x="360" y="70" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Provisioning</text>
<text x="360" y="83" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Scaling decisions</text>
<text x="360" y="96" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Warm pool mgmt</text>
<rect x="515" y="36" width="155" height="82" rx="6" fill="rgba(180,83,9,.08)" stroke="rgba(180,83,9,.3)" stroke-width="1"/>
<text x="525" y="55" font-family="'IBM Plex Mono',monospace" font-size="8" fill="#B45309" letter-spacing="1">OBSERVER</text>
<text x="525" y="70" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Telemetry stream</text>
<text x="525" y="83" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Anomaly detection</text>
<text x="525" y="96" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Event emission</text>
<!-- Lane: Variable (middle) -->
<rect x="10" y="138" width="780" height="138" rx="6" fill="rgba(0,82,160,.04)" stroke="rgba(0,82,160,.18)" stroke-width="1"/>
<text x="20" y="156" font-family="'IBM Plex Mono',monospace" font-size="9" fill="#0052A0" letter-spacing="2">VARIABLE — changes with requirements</text>
<rect x="20" y="164" width="155" height="100" rx="6" fill="rgba(0,82,160,.07)" stroke="rgba(0,82,160,.25)" stroke-width="1"/>
<text x="30" y="183" font-family="'IBM Plex Mono',monospace" font-size="8" fill="#0052A0" letter-spacing="1">SOMA ROUTER</text>
<text x="30" y="198" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Routing rules</text>
<text x="30" y="211" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Tier definitions</text>
<text x="30" y="224" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Model selection</text>
<text x="30" y="237" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Anti-concentration</text>
<text x="30" y="250" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">logic</text>
<rect x="185" y="164" width="155" height="100" rx="6" fill="rgba(0,82,160,.07)" stroke="rgba(0,82,160,.25)" stroke-width="1"/>
<text x="195" y="183" font-family="'IBM Plex Mono',monospace" font-size="8" fill="#0052A0" letter-spacing="1">NODE POOL</text>
<text x="195" y="198" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Fleet composition</text>
<text x="195" y="211" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Provider mix</text>
<text x="195" y="224" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">RunPod + Legion</text>
<text x="195" y="237" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">+ Cloud providers</text>
<rect x="350" y="164" width="155" height="100" rx="6" fill="rgba(0,82,160,.07)" stroke="rgba(0,82,160,.25)" stroke-width="1"/>
<text x="360" y="183" font-family="'IBM Plex Mono',monospace" font-size="8" fill="#0052A0" letter-spacing="1">PIPELINE ENGINE</text>
<text x="360" y="198" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Step configs</text>
<text x="360" y="211" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Pipeline defs</text>
<text x="360" y="224" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">22-step async</text>
<rect x="515" y="164" width="155" height="100" rx="6" fill="rgba(0,82,160,.07)" stroke="rgba(0,82,160,.25)" stroke-width="1"/>
<text x="525" y="183" font-family="'IBM Plex Mono',monospace" font-size="8" fill="#0052A0" letter-spacing="1">API GATEWAY RULES</text>
<text x="525" y="198" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Auth policies</text>
<text x="525" y="211" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Rate limits</text>
<text x="525" y="224" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Routing config</text>
<!-- Lane: Stable (bottom) -->
<rect x="10" y="286" width="780" height="124" rx="6" fill="rgba(26,127,75,.04)" stroke="rgba(26,127,75,.18)" stroke-width="1"/>
<text x="20" y="304" font-family="'IBM Plex Mono',monospace" font-size="9" fill="#1A7F4B" letter-spacing="2">STABLE — rarely changes · contract layer</text>
<rect x="20" y="312" width="175" height="88" rx="6" fill="rgba(26,127,75,.07)" stroke="rgba(26,127,75,.25)" stroke-width="1"/>
<text x="30" y="331" font-family="'IBM Plex Mono',monospace" font-size="8" fill="#1A7F4B" letter-spacing="1">STORAGE LAYER</text>
<text x="30" y="346" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">S3-compatible API contract</text>
<text x="30" y="359" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">R2 / provider-agnostic</text>
<text x="30" y="372" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">interface</text>
<rect x="205" y="312" width="175" height="88" rx="6" fill="rgba(26,127,75,.07)" stroke="rgba(26,127,75,.25)" stroke-width="1"/>
<text x="215" y="331" font-family="'IBM Plex Mono',monospace" font-size="8" fill="#1A7F4B" letter-spacing="1">MODEL CATALOG</text>
<text x="215" y="346" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Schema + interface</text>
<text x="215" y="359" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Routing metadata</text>
<text x="215" y="372" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">contract</text>
<rect x="390" y="312" width="175" height="88" rx="6" fill="rgba(26,127,75,.07)" stroke="rgba(26,127,75,.25)" stroke-width="1"/>
<text x="400" y="331" font-family="'IBM Plex Mono',monospace" font-size="8" fill="#1A7F4B" letter-spacing="1">SECRETS INTERFACE</text>
<text x="400" y="346" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Vault API contract</text>
<text x="400" y="359" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Customer-isolated</text>
<text x="400" y="372" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">namespace model</text>
<rect x="575" y="312" width="175" height="88" rx="6" fill="rgba(26,127,75,.07)" stroke="rgba(26,127,75,.25)" stroke-width="1"/>
<text x="585" y="331" font-family="'IBM Plex Mono',monospace" font-size="8" fill="#1A7F4B" letter-spacing="1">NEURON OPERATOR</text>
<text x="585" y="346" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Command protocol</text>
<text x="585" y="359" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">Scoped service token</text>
<text x="585" y="372" font-family="'IBM Plex Sans',sans-serif" font-size="9" fill="#3A3A4A">interface</text>
<!-- Arrows between layers (simplified) -->
<line x1="400" y1="128" x2="400" y2="138" stroke="rgba(0,0,0,.12)" stroke-width="1.5" marker-end="url(#arr)"/>
<line x1="400" y1="276" x2="400" y2="286" stroke="rgba(0,0,0,.12)" stroke-width="1.5" marker-end="url(#arr)"/>
<defs>
<marker id="arr" markerWidth="6" markerHeight="6" refX="3" refY="3" orient="auto">
<path d="M0,0 L6,3 L0,6 Z" fill="rgba(0,0,0,.25)"/>
</marker>
</defs>
</svg>
</div>
<h2 style="margin-top:32px">Component Breakdown</h2>
<p><strong>Stable (contract layer — rarely changes):</strong></p>
<div class="comp-grid">
<div class="comp-card stable">
<div class="comp-name">Storage Layer</div>
<div class="comp-body">S3-compatible API contract. Implemented on R2 today; provider can change without touching anything above.</div>
</div>
<div class="comp-card stable">
<div class="comp-name">Model Catalog</div>
<div class="comp-body">Schema and interface contract. Models are added; the schema does not change.</div>
</div>
<div class="comp-card stable">
<div class="comp-name">Secrets Interface</div>
<div class="comp-body">Vault API contract. Customer namespace model baked in — cannot be changed without breaking isolation guarantees.</div>
</div>
<div class="comp-card stable">
<div class="comp-name">Neuron Operator Interface</div>
<div class="comp-body">Command protocol between Neuron and Soma. Stable because it is the language Neuron speaks to manage the platform.</div>
</div>
</div>
<p><strong>Variable (policy layer — changes with requirements):</strong></p>
<div class="comp-grid">
<div class="comp-card variable">
<div class="comp-name">Soma Router</div>
<div class="comp-body">Routing rules, tier definitions, model selection logic. Evolves as the model landscape and pricing change.</div>
</div>
<div class="comp-card variable">
<div class="comp-name">Node Pool</div>
<div class="comp-body">Fleet composition and provider mix. Grows as new providers are onboarded. Anti-concentration limits are measured against this mix and enforced by the Router at routing time.</div>
</div>
<div class="comp-card variable">
<div class="comp-name">Pipeline Engine</div>
<div class="comp-body">Step configurations, pipeline definitions. New pipeline types added without core changes.</div>
</div>
<div class="comp-card variable">
<div class="comp-name">API Gateway Rules</div>
<div class="comp-body">Auth, rate limiting, routing configuration. Customer-specific rules without platform rebuilds.</div>
</div>
</div>
<p><strong>Dynamic (state layer — continuously changing):</strong></p>
<div class="comp-grid">
<div class="comp-card dynamic">
<div class="comp-name">Control Plane</div>
<div class="comp-body">Live node state, health, capacity. Updated on every heartbeat from every node in the pool.</div>
</div>
<div class="comp-card dynamic">
<div class="comp-name">Cost Oracle</div>
<div class="comp-body">Real-time pricing across all providers. Polled every 60 seconds. Degraded mode uses cached data with staleness flag.</div>
</div>
<div class="comp-card dynamic">
<div class="comp-name">Workload Orchestrator</div>
<div class="comp-body">Active provisioning and scaling decisions. Acts on Observer signals and Neuron commands.</div>
</div>
<div class="comp-card dynamic">
<div class="comp-name">Observer</div>
<div class="comp-body">Telemetry stream and anomaly detection. Emits events that close the feedback loop on every routing decision.</div>
</div>
</div>
</section>
<!-- ── IMPLEMENTATION PHASES ── -->
<section id="phases">
<h2>Implementation Phases</h2>
<p>Six phases across 18+ months. Each phase has a clear "done" definition — a milestone that proves the phase is complete, not just that work happened. Phases 0 and 1 are internal-only. Phase 2 brings the first external customer onto the platform. Phase 3 opens self-service to paying customers. Phases 4 and 5 are the strategic endgame.</p>
<div class="phase-timeline">
<!-- Phase 0 -->
<div class="phase-card" id="phase-0">
<div class="phase-header" onclick="togglePhase('phase-0')">
<div class="phase-num">0</div>
<div class="phase-meta">
<div class="phase-label-row">
<span class="phase-tag">Foundation</span>
<span class="phase-timing">Months 1–2</span>
<span class="phase-status-badge foundation">Internal Only</span>
</div>
<div class="phase-title">Foundation — Neuron Runs on Soma</div>
<div class="phase-summary">Port Pantheon. Wire inference. Prove the substrate works. No external exposure.</div>
</div>
<span class="phase-chevron"></span>
</div>
<div class="phase-body">
<div class="phase-content">
<p>Phase 0 is the hardest phase to define and the most important to execute correctly. It answers exactly one question: can Soma replace our current ad-hoc infrastructure as the substrate for Neuron's own inference?</p>
<p>The deliverables are unglamorous plumbing — but every subsequent phase builds on this foundation, so it must be right.</p>
<div class="milestone-list">
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Pantheon Conductor → Soma Core.</strong> Port the conductor pipeline system. 22-step async is the heartbeat of everything.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Control Plane:</strong> Node registry, health monitoring, heartbeat protocol. Knows what nodes exist, what state they're in.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Cost Oracle:</strong> Real-time pricing for RunPod + Legion. 60-second polling, degraded mode, staleness flags.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Soma Router — basic:</strong> Tier routing (Low/Medium/High), round-robin within tier. Deterministic, auditable.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Inference Services:</strong> LLM (Ollama) + Image Gen (SD Forge) wired through the Router. End-to-end path validated.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Neuron Operator Interface:</strong> Neuron can provision, monitor, and manage Soma via conversation. Actions emit ObserverEvents.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Object Storage:</strong> R2 integration, model registry wired, weights accessible by inference nodes.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Secrets:</strong> Vault wired through Soma secrets layer. No plaintext credentials anywhere in the path.</div>
</div>
</div>
<div class="callout green">
<strong>Phase 0 Milestone:</strong> Neuron inference runs 100% on Soma. Zero OpenAI/Anthropic API calls. Every request routes through the Soma Router, is served by a Soma-managed node, and emits a telemetry event.
</div>
</div>
</div>
</div>
<!-- Phase 1 -->
<div class="phase-card" id="phase-1">
<div class="phase-header" onclick="togglePhase('phase-1')">
<div class="phase-num">1</div>
<div class="phase-meta">
<div class="phase-label-row">
<span class="phase-tag">Expansion</span>
<span class="phase-timing">Months 3–4</span>
<span class="phase-status-badge expansion">Multi-Provider</span>
</div>
<div class="phase-title">Multi-Provider — Traffic Spans Three Providers</div>
<div class="phase-summary">Abstract the provider layer. Cost-optimize routing. Anti-concentration enforcement begins.</div>
</div>
<span class="phase-chevron"></span>
</div>
<div class="phase-body">
<div class="phase-content">
<p>Phase 1 is where the strategic thesis is proven at small scale: Soma can span multiple providers transparently, route cost-optimally across them, and enforce anti-concentration rules so no single provider sees more than 60% of traffic.</p>
<div class="milestone-list">
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Provider Abstraction Layer:</strong> RunPod adapter, Legion adapter, AWS EC2 adapter. Each implements the same internal interface. Swappable.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Anti-Concentration Enforcement:</strong> No provider exceeds 60% of capacity. Enforced at routing time, not policy doc.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Cost Oracle Expanded:</strong> Live pricing from RunPod API, Legion static cost model, AWS spot + on-demand. Comparative routing begins.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Cost-Optimized Routing:</strong> Router selects lowest-cost node meeting tier requirement with capacity. Not round-robin — economically optimal.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Warm Pool Management:</strong> Idle-terminate after 15 minutes. Pre-warm on demand signal from Observer. Cold start mitigation: minimum always-on per tier.</div>
</div>
</div>
<div class="callout green">
<strong>Phase 1 Milestone:</strong> Traffic routes across RunPod, Legion, and AWS EC2 transparently. Soma's routing layer selects provider automatically based on live cost and capacity. No single provider sees more than 60%.
</div>
</div>
</div>
</div>
<!-- Phase 2 -->
<div class="phase-card" id="phase-2">
<div class="phase-header" onclick="togglePhase('phase-2')">
<div class="phase-num">2</div>
<div class="phase-meta">
<div class="phase-label-row">
<span class="phase-tag">Platform</span>
<span class="phase-timing">Months 5–7</span>
<span class="phase-status-badge foundation">Full Compute</span>
</div>
<div class="phase-title">Compute &amp; Networking — First External Customer</div>
<div class="phase-summary">Full compute and networking primitives. A complete application can be deployed on Soma.</div>
</div>
<span class="phase-chevron"></span>
</div>
<div class="phase-body">
<div class="phase-content">
<p>Phase 2 expands Soma from an inference platform into a general-purpose compute and networking platform. The test: can an external customer deploy a full-stack application — frontend, backend, database, storage — on Soma without knowing which underlying providers are serving it?</p>
<div class="milestone-list">
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Container Orchestration:</strong> Deploy Docker-compatible containers to the node pool. Soma selects optimal node transparently.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Load Balancer Service:</strong> HTTP/HTTPS routing, health checks, SSL termination, sticky sessions.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>API Gateway:</strong> Auth, rate limiting, semantic routing, usage tracking. Customer-configurable without platform involvement.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>DNS Management:</strong> One zone, multi-provider. Customer configures once; Soma handles propagation.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>VPC Abstraction:</strong> Private networks that span providers. Customer-isolated. Traffic never traverses public internet.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Managed Postgres + Redis:</strong> Automated backups, HA, point-in-time recovery. Customer manages schema, Soma manages the cluster.</div>
</div>
</div>
<div class="callout green">
<strong>Phase 2 Milestone:</strong> An external customer can deploy a complete full-stack application on Soma. Frontend, API, database, object storage. No knowledge of or access to the underlying providers.
</div>
</div>
</div>
</div>
<!-- Phase 3 -->
<div class="phase-card" id="phase-3">
<div class="phase-header" onclick="togglePhase('phase-3')">
<div class="phase-num">3</div>
<div class="phase-meta">
<div class="phase-label-row">
<span class="phase-tag">Customer Platform</span>
<span class="phase-timing">Months 8–10</span>
<span class="phase-status-badge scale">Self-Service</span>
</div>
<div class="phase-title">Customer Platform — First Paying Customer</div>
<div class="phase-summary">Self-service onboarding. Billing. Dashboard. Customers provision without help.</div>
</div>
<span class="phase-chevron"></span>
</div>
<div class="phase-body">
<div class="phase-content">
<p>Phase 3 is the first time Soma is a real business rather than an internal tool. Self-service means a customer with a credit card can sign up, provision infrastructure, and be paying within an hour — without any human involvement from Soma.</p>
<div class="milestone-list">
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Soma Dashboard:</strong> The customer-facing UI. "Grandma-simple" — if a non-technical user can use it without help, it passes.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Self-Service Account Creation:</strong> Sign up, verify, configure billing, get API keys. End-to-end without human touch.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Usage-Based Billing Engine:</strong> Per-request, per-hour, per-GB. Customer sees clean invoice. Soma sees per-provider cost breakdown.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>SLA Monitoring:</strong> Customer-facing status page. Uptime SLA enforced contractually. Alerts before customers notice degradation.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Automated Onboarding Flow:</strong> From account creation to first workload running — guided, automated, audited.</div>
</div>
</div>
<div class="callout green">
<strong>Phase 3 Milestone:</strong> First paying external Soma customer. They signed up without human help, deployed a workload, and received an invoice. Soma handled everything.
</div>
</div>
</div>
</div>
<!-- Phase 4 -->
<div class="phase-card" id="phase-4">
<div class="phase-header" onclick="togglePhase('phase-4')">
<div class="phase-num">4</div>
<div class="phase-meta">
<div class="phase-label-row">
<span class="phase-tag">Scale &amp; Acquisition</span>
<span class="phase-timing">Months 11–18</span>
<span class="phase-status-badge compound">Leverage Building</span>
</div>
<div class="phase-title">Scale — Leverage Begins</div>
<div class="phase-summary">Azure + GCP onboarded. Data center acquisition begins. Provider spend reaches material levels.</div>
</div>
<span class="phase-chevron"></span>
</div>
<div class="phase-body">
<div class="phase-content">
<p>Phase 4 is where the strategic play becomes visible to those watching carefully — but not to the providers. Azure and GCP are added to the node pool. Provider spend reaches the level where Soma becomes a material customer. Data center acquisitions begin — quietly, unglamorously.</p>
<div class="milestone-list">
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Azure + GCP Adapters:</strong> Both added to the provider pool. Anti-concentration rules now span five provider types.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Serverless Functions Platform:</strong> Event-triggered, scales to zero. Serverless economics on Soma's substrate.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>CDN Layer:</strong> Edge caching, asset delivery. Tight integration with Object Storage.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Message Queue Service:</strong> Full async job processing infrastructure available to external customers.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>First Data Center Acquisition:</strong> A facility, not a headline. Managed by Neuron. Adds owned compute to the node pool at dramatically lower cost.</div>
</div>
</div>
<div class="callout dark">
<p><strong>Phase 4 Milestone:</strong> Soma is the largest single customer of at least one provider region. Provider spend is material — large enough that losing Soma would be noticed on their earnings call. The leverage begins to exist.</p>
</div>
</div>
</div>
</div>
<!-- Phase 5 -->
<div class="phase-card" id="phase-5">
<div class="phase-header" onclick="togglePhase('phase-5')">
<div class="phase-num">5</div>
<div class="phase-meta">
<div class="phase-label-row">
<span class="phase-tag">Compound</span>
<span class="phase-timing">Month 18+</span>
<span class="phase-status-badge compound">Flywheel</span>
</div>
<div class="phase-title">Compound — The Flywheel Is Self-Sustaining</div>
<div class="phase-summary">Soma autonomously manages capacity. Data center fleet grows. Acquisition conversations begin.</div>
</div>
<span class="phase-chevron"></span>
</div>
<div class="phase-body">
<div class="phase-content">
<p>Phase 5 is not a destination — it is the state Soma enters when the flywheel becomes self-sustaining. Neuron manages capacity planning autonomously. Data center acquisitions continue. Provider dependency deepens. The acquisition conversations Soma initiates — or receives — happen from a position of leverage, not need.</p>
<div class="milestone-list">
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Autonomous Capacity Planning:</strong> Neuron orchestrates Soma's own growth. No human capacity planning required.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Data Center Fleet Growing:</strong> Multiple owned facilities in the node pool. Cost per compute unit well below provider rates.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Acquisition Conversations:</strong> Either we initiate or providers do. Either way, we arrive with the balance sheet of their largest customer.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Private Cloud Offering:</strong> Soma deployed inside enterprise customers' own AWS/Azure/GCP accounts. The abstraction goes everywhere they are.</div>
</div>
</div>
<div class="callout dark">
<p>The flywheel: Soma runs Neuron → Neuron licenses generate revenue at zero marginal cost → revenue funds Soma expansion → Soma expansion deepens provider dependency → provider dependency builds leverage → leverage enables acquisition → acquisition adds owned infrastructure → owned infrastructure reduces costs → lower costs improve Neuron margins → repeat.</p>
</div>
</div>
</div>
</div>
</div><!-- end phase-timeline -->
</section>
<!-- ── TECHNICAL SPECIFICATIONS ── -->
<section id="specs">
<h2>Technical Specifications</h2>
<p>Dense implementation detail. Click any section to expand.</p>
<!-- Router Logic -->
<div class="spec-block" id="spec-router">
<div class="spec-header" onclick="toggleSpec('spec-router')">
<span class="spec-title">Soma Router — Decision Logic</span>
<span class="spec-chevron"></span>
</div>
<div class="spec-body">
<div class="spec-content">
<p>The Router is a deterministic rule tree. Every routing decision is auditable. No ML involved — the routing logic is a sequence of deterministic steps, each of which can be logged and replayed.</p>
<div class="code-block"><span class="cm">// Router decision sequence (pseudo-code)</span>
<span class="kw">1.</span> Classify request:
LLM inference | Image gen | Compute | Storage | Network
<span class="kw">2.</span> Determine tier:
- Examine request complexity
- Apply customer tier setting
- Honor explicit override if present
<span class="val">LOW</span> | <span class="val">MEDIUM</span> | <span class="val">HIGH</span>
<span class="kw">3.</span> Query Cost Oracle:
- Get live pricing for all eligible nodes
   - Apply staleness filter (reject stale &gt; threshold)
<span class="kw">4.</span> Apply constraints:
- Anti-concentration: reject nodes where provider would exceed 60%
- Health filter: reject nodes with health &lt; threshold
- Warm-pool preference: prefer WARM nodes over PROVISIONING
<span class="kw">5.</span> Select node:
- Lowest cost node meeting tier requirement with capacity
<span class="kw">6.</span> Route:
- Forward request, stream response
<span class="kw">7.</span> Emit:
ObserverEvent(node_id, tier, latency, cost, outcome)</div>
<div class="callout">
The Router's determinism is a feature, not a limitation. Every production incident can be replayed by re-running the decision sequence with the same inputs. No probabilistic black boxes in the critical path.
</div>
</div>
</div>
</div>
<!-- Cost Oracle -->
<div class="spec-block" id="spec-oracle">
<div class="spec-header" onclick="toggleSpec('spec-oracle')">
<span class="spec-title">Cost Oracle — Pricing Sources &amp; Degraded Mode</span>
<span class="spec-chevron"></span>
</div>
<div class="spec-body">
<div class="spec-content">
<p>The Cost Oracle aggregates real-time pricing from all provider types. It must be available for the Router to make cost-optimal decisions. Degraded mode ensures the Router can still operate when a pricing source is unavailable.</p>
<table class="op-table">
<thead>
<tr>
<th>Source</th>
<th>Method</th>
<th>Frequency</th>
<th>Degraded Behavior</th>
</tr>
</thead>
<tbody>
<tr>
<td><strong>RunPod</strong></td>
<td>API polling</td>
<td>Every 60s</td>
<td>Cached pricing + staleness flag</td>
</tr>
<tr>
<td><strong>Legion</strong></td>
<td>Static (owned hardware)</td>
<td>Manual update</td>
<td>Known cost — never stale</td>
</tr>
<tr>
<td><strong>AWS EC2</strong></td>
<td>Spot pricing API + on-demand fallback</td>
<td>Every 60s</td>
<td>Conservative estimate (uses on-demand)</td>
</tr>
<tr>
<td><strong>Azure / GCP</strong></td>
<td>Spot pricing API + on-demand fallback</td>
<td>Every 60s</td>
<td>Conservative estimate (uses on-demand)</td>
</tr>
<tr>
<td><strong>Owned Data Centers</strong></td>
<td>Static amortized cost</td>
<td>Manual update</td>
<td>Known cost — never stale</td>
</tr>
</tbody>
</table>
<p>Degraded mode rule: when pricing is stale, the Oracle uses the <strong>higher</strong> of the cached price and the on-demand rate. This is conservative — it may overestimate cost, but it prevents the Router from routing to a node that turns out to be more expensive than expected.</p>
</div>
</div>
</div>
<!-- Control Plane State Machine -->
<div class="spec-block" id="spec-controlplane">
<div class="spec-header" onclick="toggleSpec('spec-controlplane')">
<span class="spec-title">Control Plane — Node State Machine</span>
<span class="spec-chevron"></span>
</div>
<div class="spec-body">
<div class="spec-content">
<p>Every node in the pool follows a defined state machine. Transitions are logged as ObserverEvents. The Orchestrator drives transitions; the Control Plane tracks them.</p>
<div class="state-flow">
<div class="state-node">PROVISIONING</div>
<span class="state-arrow"></span>
<div class="state-node active">WARM</div>
<span class="state-arrow"></span>
<div class="state-node active">ACTIVE</div>
<span class="state-arrow"></span>
<div class="state-node warn">DRAINING</div>
<span class="state-arrow"></span>
<div class="state-node end">TERMINATED</div>
</div>
<table class="op-table">
<thead>
<tr>
<th>State</th>
<th>Description</th>
<th>Transition Trigger</th>
</tr>
</thead>
<tbody>
<tr>
<td><span class="tag-pill navy">PROVISIONING</span></td>
<td>Node is being initialized. Not yet eligible for routing.</td>
<td>Orchestrator decision to expand pool</td>
</tr>
<tr>
<td><span class="tag-pill green">WARM</span></td>
<td>Node is ready. Router prefers WARM over PROVISIONING.</td>
<td>Health check passes, model loaded</td>
</tr>
<tr>
<td><span class="tag-pill green">ACTIVE</span></td>
<td>Node is serving requests. Normal operating state.</td>
<td>First request routed to node</td>
</tr>
<tr>
<td><span class="tag-pill amber">DRAINING</span></td>
<td>Node is finishing in-flight requests. No new requests routed.</td>
<td>15-minute idle threshold reached</td>
</tr>
<tr>
<td><span class="tag-pill">TERMINATED</span></td>
<td>Node is gone. Removed from pool inventory.</td>
<td>All in-flight requests complete</td>
</tr>
</tbody>
</table>
<p>Pre-warm trigger: Observer detects rising request rate → Orchestrator provisions new nodes ahead of demand spike → nodes enter PROVISIONING → WARM before the spike arrives. Cold start is avoided structurally, not by keeping nodes hot permanently.</p>
</div>
</div>
</div>
<!-- Neuron Operator Model -->
<div class="spec-block" id="spec-operator">
<div class="spec-header" onclick="toggleSpec('spec-operator')">
<span class="spec-title">Neuron Operator Model — How Neuron Manages Soma</span>
<span class="spec-chevron"></span>
</div>
<div class="spec-body">
<div class="spec-content">
<p>Soma is managed entirely through the Neuron conversation interface. There is no ops team, no Kubernetes console, no provider console access. Neuron is the operator.</p>
<table class="op-table">
<thead>
<tr>
<th>Action</th>
<th>What It Does</th>
<th>Scope</th>
</tr>
</thead>
<tbody>
<tr>
<td><code>provision</code></td>
<td>Bring up a new node in the pool. Specify tier, provider preference, environment profile.</td>
<td>Soma API surface only</td>
</tr>
<tr>
<td><code>terminate</code></td>
<td>Drain and terminate a specific node. Graceful — waits for in-flight requests.</td>
<td>Soma API surface only</td>
</tr>
<tr>
<td><code>scale</code></td>
<td>Adjust pool size for a tier. Orchestrator handles which nodes to add or remove.</td>
<td>Soma API surface only</td>
</tr>
<tr>
<td><code>reroute</code></td>
<td>Drain a node's traffic to other nodes without terminating. Used for maintenance.</td>
<td>Soma API surface only</td>
</tr>
<tr>
<td><code>inspect</code></td>
<td>Return state of any node, tier, or the full pool. Read-only.</td>
<td>Read-only</td>
</tr>
<tr>
<td><code>optimize</code></td>
<td>Trigger a cost-optimization pass. Orchestrator re-evaluates pool composition against current Cost Oracle data.</td>
<td>Soma API surface only</td>
</tr>
</tbody>
</table>
<div class="callout amber">
Neuron's service token is architecturally scoped — it cannot act outside Soma's own API surface. No direct kubectl. No provider console access. No ambient authority. Every action emits an ObserverEvent, closing the feedback loop and preventing runaway automation.
</div>
</div>
</div>
</div>
<!-- Customer Isolation -->
<div class="spec-block" id="spec-isolation">
<div class="spec-header" onclick="toggleSpec('spec-isolation')">
<span class="spec-title">Customer Isolation — Hard Multi-Tenancy</span>
<span class="spec-chevron"></span>
</div>
<div class="spec-body">
<div class="spec-content">
<p>Soma's isolation model is cryptographic, not organizational. It is enforced at the infrastructure layer, not at the application layer. An application bug cannot leak data between customers.</p>
<div class="milestone-list">
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Vault Namespaces:</strong> Each customer gets a separate Vault namespace. Secrets are cryptographically isolated — not just access-controlled.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Storage Buckets:</strong> Each customer's storage lives in its own cryptographically isolated bucket. There is no shared bucket with path-based isolation.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>VPC Isolation:</strong> Network traffic between customer workloads is blocked at the VPC layer. Not firewall rules — separate network fabric.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>API Key Scoping:</strong> Every API key is bound to a customer namespace. A key cannot make requests that affect another customer's resources.</div>
</div>
</div>
</div>
</div>
</div>
</section>
<!-- ── COMPETITIVE POSITION ── -->
<section id="competitive">
<h2>Competitive Position</h2>
<p>Soma is not competing with AWS on price. It is competing on a dimension AWS cannot replicate: <strong>AI-native infrastructure where the operator is an AI, the economics improve automatically, and the routing intelligence is protected by patents.</strong></p>
<div class="position-grid">
<div class="pos-card highlight">
<div class="pos-label">Moat #1</div>
<div class="pos-title">Zero-Cost Ops</div>
<div class="pos-body">Neuron manages Soma. No human ops team. AWS needs thousands of engineers to keep their infrastructure running. Soma's operational cost is a fraction of theirs.</div>
</div>
<div class="pos-card highlight">
<div class="pos-label">Moat #2</div>
<div class="pos-title">AI-Native Primitives</div>
<div class="pos-body">GPU instances, Inference Router, Image Gen, and Pipeline Engine are first-class, not bolted on. AWS added AI services to a 2006 platform. Soma was designed for AI workloads.</div>
</div>
<div class="pos-card highlight">
<div class="pos-label">Moat #3</div>
<div class="pos-title">Patented Backplane</div>
<div class="pos-body">The routing intelligence, provider abstraction, and Neuron operator interface are protected by patents before the architecture is disclosed. The moat is the backplane, not the models.</div>
</div>
<div class="pos-card">
<div class="pos-label">Moat #4</div>
<div class="pos-title">Self-Improving Economics</div>
<div class="pos-body">Open-source model improvements and falling GPU costs improve Soma's economics automatically. AWS's costs don't improve without AWS doing work. Ours improve by default.</div>
</div>
<div class="pos-card">
<div class="pos-label">Moat #5</div>
<div class="pos-title">Dharma R&amp;D Gap</div>
<div class="pos-body">The Dharma lab continuously widens the capability gap. With every six months that pass, the distance between Soma's routing intelligence and anything a competitor could build grows larger.</div>
</div>
<div class="pos-card">
<div class="pos-label">Moat #6</div>
<div class="pos-title">Provider Leverage</div>
<div class="pos-body">As Soma grows, providers become dependent on Soma's spend. That dependency is a one-way ratchet. It builds automatically. Soma doesn't have to do anything to accumulate it.</div>
</div>
</div>
<div class="callout dark">
<p>The incumbent cloud providers have a structural problem: they built general-purpose platforms for the pre-AI era and are retrofitting AI onto 20-year-old architecture. Their technical debt is enormous. Soma has none. Building AI-native from scratch, with an AI as the operator, is an advantage that compounds over time — not one that fades.</p>
</div>
</section>
<!-- ── OPERATIONS MODEL ── -->
<section id="operations">
<h2>Operations Model</h2>
<p>Soma's operations model is the most unusual aspect of the platform and the most important competitive advantage. There is no traditional ops team. Neuron is the operator.</p>
<div class="callout">
<strong>The operator model:</strong> Every management action in Soma is expressed as a conversation with Neuron. Neuron translates intent into Soma API calls. Every call emits an ObserverEvent. Observer feeds back into Neuron's context. The loop closes on itself.
</div>
<p><strong>What autonomous operation looks like day-to-day:</strong></p>
<div class="milestone-list">
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Morning:</strong> Observer surfaces overnight anomalies to Neuron. Cost Oracle delta shows RunPod prices dropped 12% — Neuron adjusts routing weights. No human action required.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Demand spike:</strong> Observer detects rising request rate on High tier. Neuron pre-provisions 3 additional High-tier nodes before the spike arrives. Nodes enter WARM state before requests reach them.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Node failure:</strong> Control Plane detects heartbeat loss. Neuron is notified. Neuron drains the node's traffic, terminates it, provisions a replacement. End-to-end in under 2 minutes without human involvement.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Cost optimization:</strong> Neuron runs a daily cost-optimization pass. It identifies nodes where provider cost exceeds the configured threshold, gracefully migrates their workloads to cheaper nodes, and documents the savings.</div>
</div>
<div class="ms-item">
<span class="ms-icon"></span>
<div class="ms-text"><strong>Capacity planning:</strong> Neuron analyzes 30-day usage trends. Presents a capacity recommendation. If within policy, executes autonomously. If outside policy bounds, escalates for confirmation.</div>
</div>
</div>
<div class="callout amber">
Escalation policy is critical. Neuron operates autonomously within defined bounds. Actions outside those bounds — large-scale reprovisioning, provider adds, cost threshold changes — require explicit confirmation. The bounds are defined in Soma config, not in Neuron's judgment.
</div>
<p>The operations model is not "set and forget." Neuron surfaces information, makes recommendations, and executes within policy. The human relationship with Soma is strategic, not operational. You define the strategy; Neuron executes it.</p>
</section>
<!-- ── 5-YEAR ARC ── -->
<section id="arc">
<h2>The 5-Year Arc</h2>
<p>Laid out plainly: what Soma is, what it becomes, and how the strategy compresses over five years into a position that cannot be replicated.</p>
<div class="arc-timeline">
<div class="arc-item">
<div class="arc-dot"></div>
<div class="arc-year">Year 1 — 2026</div>
<div class="arc-headline">Substrate + Internal Revenue</div>
<div class="arc-body">Soma runs Neuron's inference. Every Neuron AI license sold costs almost nothing to deliver. Phase 0 and Phase 1 complete. RunPod, Legion, and AWS in the node pool. Anti-concentration enforced. First external customers onboarding in Q4. No one outside the company knows what we're building.</div>
</div>
<div class="arc-item">
<div class="arc-dot mid"></div>
<div class="arc-year">Year 2 — 2027</div>
<div class="arc-headline">External Platform + Provider Spend Growing</div>
<div class="arc-body">Full service catalog available to external customers. Self-service. Billing. Azure and GCP in the pool. Provider spend is growing rapidly — Soma's revenue is growing faster than its costs because Neuron manages operations. First data center acquisition closes. Owned compute enters the node pool for the first time. Margins begin to widen structurally.</div>
</div>
<div class="arc-item">
<div class="arc-dot mid"></div>
<div class="arc-year">Year 3 — 2028</div>
<div class="arc-headline">Material Provider Leverage</div>
<div class="arc-body">Soma is a top-10 customer for at least one major cloud provider by region. Provider account managers are calling us, not the other way around. Data center fleet has multiple facilities. The cost-per-compute-unit gap between owned infrastructure and provider rates is widening. Patents now cover the routing architecture. Dharma continues widening the capability gap.</div>
</div>
<div class="arc-item">
<div class="arc-dot mid"></div>
<div class="arc-year">Year 4 — 2029</div>
<div class="arc-headline">Acquisition Conversations Begin</div>
<div class="arc-body">Provider dependency is deep enough that losing Soma would register on earnings calls. Acquisition conversations begin — either we initiate them or we receive them. We arrive with leverage in either case: we are their largest or near-largest customer in our regions, and we can credibly threaten to redirect that spend to our owned infrastructure. The negotiating position is comfortable.</div>
</div>
<div class="arc-item">
<div class="arc-dot end"></div>
<div class="arc-year">Year 5 — 2030</div>
<div class="arc-headline">The Flywheel Is Self-Sustaining</div>
<div class="arc-body">Soma manages its own capacity planning autonomously. The flywheel — Neuron AI licenses funding Soma expansion, Soma expansion deepening provider dependency, provider dependency enabling leverage, leverage enabling acquisitions, acquisitions reducing costs, lower costs improving Neuron margins — is self-sustaining. The compound rate is structural. Neuron Technologies is an infrastructure company that happened to start with an AI product.</div>
</div>
</div>
<div class="pull-quote reveal">
<blockquote>"They see growing revenue. They see a great customer. They don't see what's happening."</blockquote>
<cite>Soma Strategic Principle · Internal</cite>
</div>
<div class="callout dark">
<p>The full play, in one paragraph: <strong>Soma runs on provider infrastructure while quietly building the leverage to acquire the providers.</strong> Neuron AI licenses fund Soma at near-zero marginal cost. Soma's operations cost approaches zero because Neuron manages it. Every dollar of growth widens the moat. The strategy is self-funding, self-reinforcing, and structurally invisible to the parties whose positions it is inverting. By the time the endgame is visible, the pieces are already on the board.</p>
</div>
</section>
<div class="footer-block">
Soma · AI-Native Cloud Platform · Neuron Technologies<br>
April 25, 2026 · Eyes Only — Confidential · Internal Use Only<br>
This document is intended solely for internal planning. Do not distribute.
</div>
</div><!-- end doc-page -->
<script>
// ── REVEAL ON SCROLL ──
// Every element that opts in to the scroll-triggered reveal.
const reveals = document.querySelectorAll('.reveal');
// One-shot observer: the first time an element intersects (threshold 0.08)
// it receives the `visible` class and is dropped from observation, so the
// class is never removed again by this code.
const io = new IntersectionObserver(batch => {
  for (const entry of batch) {
    if (!entry.isIntersecting) continue;
    const target = entry.target;
    target.classList.add('visible');
    io.unobserve(target);
  }
}, { threshold: 0.08 });
for (const node of reveals) io.observe(node);
// Mastheads are not routed through the observer: they receive `visible`
// 100 ms after this script runs, regardless of scroll position.
setTimeout(() => {
  for (const masthead of document.querySelectorAll('.masthead')) {
    masthead.classList.add('visible');
  }
}, 100);
// ── PHASE ACCORDION ──
/**
 * Accordion toggle for phase cards.
 *
 * Removes the `open` class from every `.phase-card`, then re-adds it to the
 * element with the given id only if that element was closed beforehand.
 * Calling it on an already-open card therefore just closes it.
 *
 * @param {string} id - DOM id of the card to toggle.
 * @returns {void} Nothing; an id that matches no element is a no-op.
 */
function togglePhase(id) {
  const card = document.getElementById(id);
  // getElementById returns null for an unknown id; bail out before touching
  // any card instead of throwing a TypeError on `card.classList`.
  if (!card) return;
  // Read the state first — the reset below would otherwise erase it.
  const wasOpen = card.classList.contains('open');
  document.querySelectorAll('.phase-card').forEach(other => other.classList.remove('open'));
  if (!wasOpen) card.classList.add('open');
}
// ── SPEC ACCORDION ──
/**
 * Flip the `open` class on a single spec block. Other blocks are not
 * touched, so any number of them can be open at once.
 *
 * @param {string} id - DOM id of the spec block (e.g. 'spec-operator').
 * @returns {void} Nothing; an id that matches no element is a no-op.
 */
function toggleSpec(id) {
  const block = document.getElementById(id);
  // getElementById returns null for an unknown id; skip the toggle instead
  // of throwing a TypeError from the inline onclick handler.
  if (!block) return;
  block.classList.toggle('open');
}
// ── NAV ACTIVE STATE ──
// Sections that carry an id, and the nav links that may point at them.
const sections = document.querySelectorAll('section[id]');
const navLinks = document.querySelectorAll('.nav-link');
// For each section reported as intersecting the observer's root area
// (shrunk by the rootMargin below), clear `active` from every nav link and
// set it on the link whose href is `#<section id>`, if such a link exists.
const navIO = new IntersectionObserver(batch => {
  for (const entry of batch) {
    if (!entry.isIntersecting) continue;
    for (const link of navLinks) link.classList.remove('active');
    const match = document.querySelector(`.nav-link[href="#${entry.target.id}"]`);
    if (match) match.classList.add('active');
  }
}, { rootMargin: '-30% 0px -60% 0px' });
for (const section of sections) navIO.observe(section);
</script>
</body>
</html>