> ## Documentation Index
> Fetch the complete documentation index at: https://runcrate.ai/docs/llms.txt
> Use this file to discover all available pages before exploring further.

# Home

> Inference first. Compute when you need it.

export const DocsHero = ({title, subtitle}) => {
  const CELL = 14;
  const ROW = 12;
  const BRAND = '#4B7BF5';
  const ACCENT = '#10B981';
  const L = (x, y, o, accent) => ({
    a: 'l',
    x,
    y,
    o,
    accent
  });
  const R = (x, y, o, accent) => ({
    a: 'r',
    x,
    y,
    o,
    accent
  });
  const C = (xo, y, o) => ({
    a: 'c',
    xo,
    y,
    o
  });
  const pattern = [L(0, 0, 0.50), L(1, 0, 0.42), L(2, 0, 0.30), L(3, 0, 0.20), L(4, 0, 0.14), L(5, 0, 0.10), L(6, 0, 0.07), L(8, 0, 0.05), L(10, 0, 0.04), L(13, 0, 0.03), L(0, 1, 0.40), L(1, 1, 0.32), L(2, 1, 0.22), L(3, 1, 0.13), L(4, 1, 0.08), L(6, 1, 0.05), L(9, 1, 0.03), L(0, 2, 0.32), L(1, 2, 0.24), L(2, 2, 0.15), L(4, 2, 0.06), L(0, 3, 0.26), L(1, 3, 0.16), L(2, 3, 0.55, true), L(5, 3, 0.04), L(0, 4, 0.21), L(1, 4, 0.10), L(3, 4, 0.04), L(0, 5, 0.17), L(1, 5, 0.07), L(0, 6, 0.13), L(2, 6, 0.04), L(0, 7, 0.09), L(0, 8, 0.06), L(1, 8, 0.03), L(0, 9, 0.04), L(0, 10, 0.02), C(-30, 0, 0.06), C(-29, 1, 0.04), C(-27, 0, 0.05), C(-26, 2, 0.04), C(-16, 0, 0.06), C(-15, 1, 0.04), C(-14, 0, 0.05), C(-12, 3, 0.04), C(-3, 0, 0.05), C(-2, 1, 0.04), C(0, 0, 0.06), C(1, 2, 0.04), C(2, 0, 0.05), C(14, 0, 0.05), C(15, 1, 0.04), C(17, 0, 0.06), C(19, 4, 0.04), C(28, 0, 0.05), C(29, 1, 0.04), C(31, 0, 0.05), C(32, 2, 0.04), R(0, 0, 0.46), R(1, 0, 0.38), R(2, 0, 0.28), R(3, 0, 0.20), R(4, 0, 0.14), R(5, 0, 0.10), R(7, 0, 0.06), R(9, 0, 0.04), R(12, 0, 0.03), R(0, 1, 0.36), R(1, 1, 0.28), R(2, 1, 0.18), R(3, 1, 0.12), R(5, 1, 0.07), R(8, 1, 0.04), R(0, 2, 0.28), R(1, 2, 0.20), R(3, 2, 0.50, true), R(5, 2, 0.04), R(0, 3, 0.21), R(1, 3, 0.12), R(4, 3, 0.05), R(0, 4, 0.16), R(1, 4, 0.07), R(0, 5, 0.10), R(0, 6, 0.05)];
  const cellStyle = c => {
    const s = {
      position: 'absolute',
      width: CELL + 'px',
      height: CELL + 'px',
      bottom: c.y * CELL + 'px',
      opacity: c.o,
      backgroundColor: c.accent ? ACCENT : BRAND
    };
    if (c.a === 'l') s.left = c.x * CELL + 'px'; else if (c.a === 'r') s.right = c.x * CELL + 'px'; else s.left = 'calc(50% + ' + c.xo * CELL + 'px)';
    return s;
  };
  return <div className="rc-hero" style={{
    position: 'relative',
    padding: '4rem 2rem 5rem',
    marginBottom: '2.5rem',
    overflow: 'hidden',
    borderRadius: '0.75rem'
  }}>
      <h1 style={{
    fontSize: 'clamp(2.5rem, 6vw, 4rem)',
    fontWeight: 500,
    letterSpacing: '-0.035em',
    lineHeight: 1.05,
    margin: 0,
    position: 'relative',
    zIndex: 1
  }}>{title}</h1>
      <p style={{
    marginTop: '1.5rem',
    maxWidth: '42rem',
    opacity: 0.7,
    fontSize: '1rem',
    lineHeight: 1.6,
    position: 'relative',
    zIndex: 1
  }}>{subtitle}</p>
      <div aria-hidden style={{
    position: 'absolute',
    bottom: 0,
    left: 0,
    right: 0,
    height: ROW * CELL + 'px',
    pointerEvents: 'none',
    zIndex: 0
  }}>
        {pattern.map((c, i) => <div key={i} style={cellStyle(c)} />)}
      </div>
    </div>;
};

export const RuncrateStyles = () => {
  if (typeof document !== 'undefined' && !document.getElementById('runcrate-overrides')) {
    const s = document.createElement('style');
    s.id = 'runcrate-overrides';
    s.textContent = `
      /* Match Runcrate's rounding scale (--radius: 0.75rem) */
      .rounded-sm { border-radius: 0.5rem !important; }   /* 8px */
      .rounded-md { border-radius: 0.625rem !important; } /* 10px */
      .rounded-lg { border-radius: 0.75rem !important; }  /* 12px */
      .rounded-l-sm { border-top-left-radius: 0.5rem !important; border-bottom-left-radius: 0.5rem !important; }
      .rounded-r-sm { border-top-right-radius: 0.5rem !important; border-bottom-right-radius: 0.5rem !important; }
      .rounded-l-md { border-top-left-radius: 0.625rem !important; border-bottom-left-radius: 0.625rem !important; }
      .rounded-r-md { border-top-right-radius: 0.625rem !important; border-bottom-right-radius: 0.625rem !important; }
      .rounded-l-lg { border-top-left-radius: 0.75rem !important; border-bottom-left-radius: 0.75rem !important; }
      .rounded-r-lg { border-top-right-radius: 0.75rem !important; border-bottom-right-radius: 0.75rem !important; }

      /* Cards: never pure white in light mode */
      .card { background-color: #fcfcfc !important; border-radius: 0.75rem !important; }
      html.dark .card { background-color: #141414 !important; }

      /* Docs hero box */
      .rc-hero { background-color: #fcfcfc; border: 1px solid #e0e0e0; }
      html.dark .rc-hero { background-color: #141414; border-color: #242424; }
      html.dark .rc-hero h1 { color: #f5f5f5; }

      /* Runcrate scrollbar — thin, transparent track, hide-until-hover thumb */
      ::-webkit-scrollbar { width: 6px; height: 6px; background-color: transparent; }
      ::-webkit-scrollbar-track { background-color: transparent; }
      ::-webkit-scrollbar-thumb { background-color: rgba(155, 155, 155, 0.5); border-radius: 10px; transition: opacity 0.3s ease; opacity: 0; }
      ::-webkit-scrollbar-thumb:hover { background-color: rgba(155, 155, 155, 0.7); }
      *:hover::-webkit-scrollbar-thumb,
      *:focus::-webkit-scrollbar-thumb,
      *:active::-webkit-scrollbar-thumb { opacity: 1; }
      * { scrollbar-width: thin; scrollbar-color: rgba(155, 155, 155, 0.5) transparent; }
    `;
    document.head.appendChild(s);
  }
  return null;
};

<RuncrateStyles />

<DocsHero title="Build on Runcrate" subtitle="Inference by the token. Compute by the second. Everything you need to ship." />

> ## For Agents
>
> Fetch the complete documentation index at: [https://runcrate.ai/docs/llms.txt](https://runcrate.ai/docs/llms.txt)

Runcrate is the complete platform for AI teams to access open-source models and GPU compute. One account gives you production inference for 140+ models, on-demand GPU instances, dedicated clusters, and the SDKs to build with all of it.

<Columns cols={4}>
  <Card title="Quickstart" icon="rocket" href="/getting-started/quickstart">
    Make your first API call in under 60 seconds.
  </Card>

  <Card title="Model Catalog" icon="brain" href="/models/model-catalog">
    Browse 140+ open-source models across text, image, video, and audio.
  </Card>

  <Card title="SDKs" icon="code" href="/sdks/overview">
    Python and TypeScript clients. Drop-in OpenAI SDK replacements.
  </Card>

  <Card title="API Reference" icon="book" href="/api-reference/introduction">
    Full REST API documentation for inference and infrastructure.
  </Card>
</Columns>

## The Runcrate Platform

Everything your AI team needs: production inference, GPU compute, and dedicated clusters — all under one account and one bill.

<Columns cols={5}>
  <Card title="Models API" icon="message" href="/models/overview">
    Chat, image, video, TTS, and transcription via OpenAI-compatible endpoints.
  </Card>

  <Card title="GPU Instances" icon="server" href="/instances/overview">
    Deploy containers with dedicated NVIDIA GPUs in 60 seconds.
  </Card>

  <Card title="Storage" icon="database" href="/storage/overview">
    Persistent volumes with built-in file explorer.
  </Card>

  <Card title="Dedicated Clusters" icon="server-2" href="/dedicated/overview">
    Reserved bare-metal from 16 to 128+ nodes.
  </Card>

  <Card title="MCP Server" icon="cpu" href="/mcp/overview">
    Control Runcrate from Claude, Cursor, or any AI assistant.
  </Card>
</Columns>

## Explore use cases

See how teams use Runcrate to build AI products, run inference at scale, train models, and deploy custom servers.

<Columns cols={4}>
  <Card title="AI SaaS Backend" icon="cloud" href="/examples/ai-saas-backend">
    Production AI backend with chat, image, and RAG.
  </Card>

  <Card title="RAG Pipeline" icon="search" href="/examples/rag-pipeline">
    Retrieval-augmented generation with embeddings and vector search.
  </Card>

  <Card title="Fine-tune LLMs" icon="adjustments-horizontal" href="/examples/fine-tune-llm">
    Fine-tune Llama, Mistral, or Qwen on your own data.
  </Card>

  <Card title="Video Generation" icon="video" href="/examples/ai-video-pipeline">
    Generate videos with Kling, Veo, Sora, and Seedance.
  </Card>
</Columns>

<Columns cols={4}>
  <Card title="AI Chatbot (Next.js)" icon="message" href="/examples/ai-chatbot-nextjs">
    Streaming chatbot with the Vercel AI SDK and Runcrate.
  </Card>

  <Card title="ComfyUI in the Cloud" icon="photo" href="/examples/comfyui-cloud">
    Run ComfyUI on a GPU instance with persistent model storage.
  </Card>

  <Card title="Deploy Llama" icon="server" href="/examples/deploy-llama">
    Self-host Llama 3 with vLLM for custom inference.
  </Card>

  <Card title="Voice Cloning" icon="microphone" href="/examples/voice-cloning-api">
    Clone any voice and generate speech with TTS models.
  </Card>
</Columns>

## Start building

<Columns cols={3}>
  <Card title="Python" icon="brand-python" href="/sdks/python">
    Official Python client. Drop-in replacement for the OpenAI SDK.
  </Card>

  <Card title="TypeScript" icon="brand-typescript" href="/sdks/typescript">
    Official TypeScript client for Node.js and edge runtimes.
  </Card>

  <Card title="Vercel AI SDK" icon="triangle" href="/sdks/vercel-ai">
    First-class Runcrate provider for the Vercel AI SDK.
  </Card>
</Columns>

<Card title="CLI" icon="terminal" href="/cli/overview" horizontal>
  Full terminal control. Deploy instances, SSH in, transfer files, manage volumes — all from your terminal.
</Card>
