2:I[23069,["931","static/chunks/app/page-1517abce0fd0d381.js"],"CopyInstallBlock"]
3:I[21194,["185","static/chunks/app/layout-1e3f5a8ca5a25f22.js"],"AppShellProvider"]
4:I[39275,[],""]
5:I[61343,[],""]
0:["RFys88GaisldQ2y_s-Mjq",[[["",{"children":["__PAGE__",{}]},"$undefined","$undefined",true],["",{"children":["__PAGE__",{},[["$L1",["$","div",null,{"className":"landing-page","children":[["$","div",null,{"className":"landing-glow","aria-hidden":true}],["$","div",null,{"className":"landing-inner","children":[["$","nav",null,{"className":"landing-nav","children":[["$","div",null,{"className":"landing-nav-brand","children":[["$","svg",null,{"width":"22","height":"22","viewBox":"0 0 22 22","fill":"none","aria-hidden":true,"children":[["$","rect",null,{"x":"1.5","y":"3.5","width":"19","height":"4","rx":"1.4","stroke":"#b86a2a","strokeWidth":"1.3"}],["$","rect",null,{"x":"4","y":"9.5","width":"14","height":"4","rx":"1.4","stroke":"#b86a2a","strokeWidth":"1.3","opacity":"0.65"}],["$","rect",null,{"x":"7","y":"15.5","width":"8","height":"3","rx":"1.4","stroke":"#b86a2a","strokeWidth":"1.3","opacity":"0.32"}]]}],["$","span",null,{"className":"pc-mono landing-nav-wordmark","children":"inferencache"}]]}],["$","div",null,{"className":"landing-nav-links","children":[["$","a",null,{"href":"https://github.com/lavondev/inferencache","target":"_blank","rel":"noopener noreferrer","children":"GitHub"}],["$","a",null,{"href":"https://twitter.com/jaybhatt_","target":"_blank","rel":"noopener noreferrer","children":"X"}]]}]]}],["$","section",null,{"className":"landing-hero","id":"main-content","tabIndex":-1,"children":[["$","div",null,{"className":"landing-hero-left","children":[["$","p",null,{"className":"landing-eyebrow pc-mono","children":"LLM cost infrastructure"}],["$","h1",null,{"className":"landing-headline","children":["Stop paying for the same prompt ",["$","em",null,{"children":"twice."}]]}],["$","p",null,{"className":"landing-subtext","children":["A local proxy for LLM APIs. Exact-match and semantic deduplication intercept redundant calls before they cost you a token."," ",["$","span",null,{"className":"landing-subtext-strong","children":"One env var. No gateway."}]]}],["$","div",null,{"className":"landing-cta-row","children":[["$","$L2",null,{}],["$","a",null,{"href":"https://github.com/lavondev/inferencache","target":"_blank","rel":"noopener noreferrer","className":"landing-github-btn","children":"View on GitHub"}]]}],["$","p",null,{"className":"landing-cta-note","children":"Open source. Runs on your machine."}]]}],["$","div",null,{"className":"landing-hero-right","children":["$","div",null,{"className":"landing-code-window","children":[["$","div",null,{"className":"landing-code-titlebar","children":[["$","div",null,{"className":"landing-code-dots","children":[["$","span",null,{}],["$","span",null,{}],["$","span",null,{}]]}],["$","span",null,{"className":"pc-mono landing-code-filename","children":"setup.sh"}],["$","span",null,{"className":"pc-mono landing-code-lang","children":"shell"}]]}],["$","div",null,{"className":"landing-code-body","children":[["$","div",null,{"className":"landing-code-gutter pc-mono","children":[["$","div","1",{"children":1}],["$","div","2",{"children":2}],["$","div","3",{"children":3}],["$","div","4",{"children":4}],["$","div","5",{"children":5}],["$","div","6",{"children":6}],["$","div","7",{"children":7}],["$","div","8",{"children":8}],["$","div","9",{"children":9}]]}],["$","div",null,{"className":"landing-code-content pc-mono","children":[[["$","div","1",{"children":[["$","span","0",{"className":"lc-kw","children":"pip install "}],["$","span","1",{"className":"lc-str","children":"\"inferencache[embed,serve]\""}]]}],["$","div","2",{"children":[["$","span","0",{"className":"lc-cmd","children":"inferencache serve"}]]}],["$","div","3",{"children":" "}],["$","div","4",{"children":[["$","span","0",{"className":"lc-cmt","children":"# Claude Code / Cursor"}]]}],["$","div","5",{"children":[["$","span","0",{"className":"lc-kw","children":"export "}],["$","span","1",{"className":"lc-str","children":"ANTHROPIC_BASE_URL=http://localhost:8080"}]]}],["$","div","6",{"children":" "}],["$","div","7",{"children":[["$","span","0",{"className":"lc-cmt","children":"# repeat call  → "}],["$","span","1",{"className":"lc-ok","children":"cache hit       0ms    $0.00"}]]}],["$","div","8",{"children":[["$","span","0",{"className":"lc-cmt","children":"# near-match     → "}],["$","span","1",{"className":"lc-ok","children":"semantic hit    4ms    $0.00"}]]}],["$","div","9",{"children":[["$","span","0",{"className":"lc-cmt","children":"# new prompt     → "}],["$","span","1",{"className":"lc-dim","children":"api call      820ms  $0.0031"}]]}]],["$","span",null,{"className":"lc-cursor","children":"▋"}]]}]]}]]}]}]]}],["$","div",null,{"className":"landing-divider"}],["$","section",null,{"className":"landing-proof-grid","children":[["$","div","01",{"className":"landing-proof-cell  border-b","children":[["$","p",null,{"className":"landing-proof-label pc-mono","children":[["$","span",null,{"className":"landing-proof-num","children":"01"}],["$","span",null,{"className":"landing-proof-sep"}],"how it works"]}],["$","h3",null,{"className":"landing-proof-title","children":"Two-tier cache, one check"}],["$","p",null,{"className":"landing-proof-body","children":"Every call runs an exact match in SQLite, then a semantic search in Qdrant. Hit either layer and the response returns immediately — no network, no tokens, no cost. Miss both and the real call goes through and writes back."}]]}],["$","div","02",{"className":"landing-proof-cell border-l border-b","children":[["$","p",null,{"className":"landing-proof-label pc-mono","children":[["$","span",null,{"className":"landing-proof-num","children":"02"}],["$","span",null,{"className":"landing-proof-sep"}],"integration"]}],["$","h3",null,{"className":"landing-proof-title","children":"Proxy-first, nothing to rearchitect"}],["$","p",null,{"className":"landing-proof-body","children":"Point Cursor or Claude Code at localhost:8080 with one env var. No decorator, no gateway, no changed call signatures — your existing SDK calls just get cheaper."}]]}],["$","div","03",{"className":"landing-proof-cell  ","children":[["$","p",null,{"className":"landing-proof-label pc-mono","children":[["$","span",null,{"className":"landing-proof-num","children":"03"}],["$","span",null,{"className":"landing-proof-sep"}],"vs alternatives"]}],["$","h3",null,{"className":"landing-proof-title","children":"GPTCache is abandoned. Gateways are overhead."}],["$","p",null,{"className":"landing-proof-body","children":"Every other caching layer either stopped shipping or routes traffic through infrastructure you don't own. inferencache is just a library — pip install inferencache. Your prompts stay on your machine."}]]}],["$","div","04",{"className":"landing-proof-cell border-l ","children":[["$","p",null,{"className":"landing-proof-label pc-mono","children":[["$","span",null,{"className":"landing-proof-num","children":"04"}],["$","span",null,{"className":"landing-proof-sep"}],"MCP server"]}],["$","h3",null,{"className":"landing-proof-title","children":"Your editor can see the cache too"}],["$","p",null,{"className":"landing-proof-body","children":"A read-only MCP server ships with the library. Cursor and Claude Code can inspect hit rates, cost savings, and cache state without leaving the editor."}]]}]]}],["$","footer",null,{"className":"landing-footer","children":[["$","span",null,{"className":"landing-footer-brand","children":[["$","svg",null,{"width":"14","height":"14","viewBox":"0 0 22 22","fill":"none","aria-hidden":true,"children":[["$","rect",null,{"x":"1.5","y":"3.5","width":"19","height":"4","rx":"1.4","stroke":"#b86a2a","strokeWidth":"1.3","opacity":"0.7"}],["$","rect",null,{"x":"4","y":"9.5","width":"14","height":"4","rx":"1.4","stroke":"#b86a2a","strokeWidth":"1.3","opacity":"0.4"}],["$","rect",null,{"x":"7","y":"15.5","width":"8","height":"3","rx":"1.4","stroke":"#b86a2a","strokeWidth":"1.3","opacity":"0.2"}]]}],"inferencache · built in public"]}],["$","div",null,{"className":"landing-footer-links","children":[["$","a",null,{"href":"https://twitter.com/jaybhatt_","target":"_blank","rel":"noopener noreferrer","children":"@jaybhatt_ on X"}],["$","a",null,{"href":"https://github.com/lavondev/inferencache","target":"_blank","rel":"noopener noreferrer","children":"GitHub"}]]}]]}]]}]]}]],null],null]},[["$","html",null,{"lang":"en","className":"__variable_3a0388 __variable_c1e5c9","suppressHydrationWarning":true,"data-theme":"dark","children":["$","body",null,{"className":"antialiased","style":{"fontFamily":"var(--font-geist-sans, var(--sans))"},"children":["$","$L3",null,{"children":[["$","a",null,{"href":"#main-content","className":"skip-link","children":"Skip to main content"}],["$","$L4",null,{"parallelRouterKey":"children","segmentPath":["children"],"error":"$undefined","errorStyles":"$undefined","errorScripts":"$undefined","template":["$","$L5",null,{}],"templateStyles":"$undefined","templateScripts":"$undefined","notFound":[["$","title",null,{"children":"404: This page could not be found."}],["$","div",null,{"style":{"fontFamily":"system-ui,\"Segoe UI\",Roboto,Helvetica,Arial,sans-serif,\"Apple Color Emoji\",\"Segoe UI Emoji\"","height":"100vh","textAlign":"center","display":"flex","flexDirection":"column","alignItems":"center","justifyContent":"center"},"children":["$","div",null,{"children":[["$","style",null,{"dangerouslySetInnerHTML":{"__html":"body{color:#000;background:#fff;margin:0}.next-error-h1{border-right:1px solid rgba(0,0,0,.3)}@media (prefers-color-scheme:dark){body{color:#fff;background:#000}.next-error-h1{border-right:1px solid rgba(255,255,255,.3)}}"}}],["$","h1",null,{"className":"next-error-h1","style":{"display":"inline-block","margin":"0 20px 0 0","padding":"0 23px 0 0","fontSize":24,"fontWeight":500,"verticalAlign":"top","lineHeight":"49px"},"children":"404"}],["$","div",null,{"style":{"display":"inline-block"},"children":["$","h2",null,{"style":{"fontSize":14,"fontWeight":400,"lineHeight":"49px","margin":0},"children":"This page could not be found."}]}]]}]}]],"notFoundStyles":[],"styles":null}]]}]}]}],null],null],[[["$","link","0",{"rel":"stylesheet","href":"/_next/static/css/8f48daab9b99c2c6.css","precedence":"next","crossOrigin":"$undefined"}]],[null,"$L6"]]]]]
6:[["$","meta","0",{"name":"viewport","content":"width=device-width, initial-scale=1"}],["$","meta","1",{"charSet":"utf-8"}],["$","title","2",{"children":"inferencache"}],["$","meta","3",{"name":"description","content":"Multi-tier semantic caching for LLM APIs. Stop paying for the same prompt twice."}],["$","meta","4",{"name":"next-size-adjust"}]]
1:null
