---
title: "RAG on Hacker News comments to generate a research summary"
description: "Learn how to search Hacker News comments for a topic, extract sentiment, and generate a research summary in 34 lines of Substrate code. Runs dozens of LLM calls in parallel and streams markdown. Built in 15 minutes, easy to remix."
date: 2024-07-15
image: "/hnrag.png"
---

<div class="hero-image">
  <img width={1020} height={510} src="/hnrag.png" alt="RAG on Hacker News comments to generate a research summary" />
</div>

In this post, we'll show you how to search Hacker News comments for a topic, extract sentiment, and generate a research summary in 34 lines of code using Substrate.

- [Read on Twitter](https://x.com/vprtwn/status/1812844236401762513)
- [Read on LinkedIn](https://www.linkedin.com/pulse/rag-hacker-news-comments-34-lines-code-substratelabs-pouje)

<br/>

This concise RAG implementation runs dozens of LLM calls in parallel and streams the markdown in no time. It's easy to remix, and genuinely useful. Internally, we've already written several scripts like this for Reddit, LinkedIn, and Twitter, and set up alerts to Slack.

<iframe width="100%" height="600px" src="https://www.val.town/embed/substrate/hackerNewsRAG" title="Val Town" frameborder="0" allow="web-share" allowfullscreen></iframe>

<br/>

First, we search Hacker News comments using the [Algolia HN Search API](https://hn.algolia.com/api).

```typescript
const searchResults = await hnSearch({
  query: query,
  // Only include comments created within the last 4 weeks
  numericFilters: `created_at_i>${Math.floor(Date.now() / 1000) - 60 * 60 * 24 * 7 * 4}`,
  tags: "comment",
});
```
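
The `hnSearch` helper lives in the val rather than in the snippet above. A minimal sketch against the Algolia endpoint might look like this (the helper and its parameter names here are assumptions, not the val's actual code):

```typescript
// Hypothetical sketch of hnSearch. URL construction is factored out so it
// can be tested without hitting the network.
function buildHnSearchUrl(params: { query: string; numericFilters?: string; tags?: string }): string {
  const url = new URL("https://hn.algolia.com/api/v1/search");
  url.searchParams.set("query", params.query);
  if (params.numericFilters) url.searchParams.set("numericFilters", params.numericFilters);
  if (params.tags) url.searchParams.set("tags", params.tags);
  return url.toString();
}

async function hnSearch(params: { query: string; numericFilters?: string; tags?: string }) {
  const res = await fetch(buildHnSearchUrl(params));
  if (!res.ok) throw new Error(`HN search failed: ${res.status}`);
  return res.json(); // response body includes a `hits` array
}
```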

<br/>

Next, we use ComputeJSON to extract a summary, sentiment, and other metadata from each comment. Structured JSON generation is ergonomic, reliable, and blazing fast on Substrate compared to other providers. This is critical for multi-step workflows.

```typescript
// Create a ComputeJSON node for each search hit. The nodes aren't awaited
// individually here; Substrate runs them all in parallel when the graph runs.
const summaries = [];
for (const hit of searchResults.hits) {
  summaries.push(
    new ComputeJSON({
      prompt: `Summarize this comment and how it relates to the topic: ${query}
      Use "negative" sentiment for posts about API, abstraction, documentation, tutorial, general quality, slowness, or performance issues.
      COMMENT: ${JSON.stringify(hit)}`,
      json_schema: zodToJsonSchema(commentInfo),
    }),
  );
}
```
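
The `commentInfo` zod schema isn't shown above; whatever its exact shape, `zodToJsonSchema` compiles it to a plain JSON Schema object. A hypothetical equivalent (the field names are illustrative assumptions, not the val's actual schema) might be:

```typescript
// Hypothetical JSON Schema roughly equivalent to zodToJsonSchema(commentInfo).
// The real fields live in the val; these are assumptions for illustration.
const commentInfoSchema = {
  type: "object",
  properties: {
    summary: { type: "string", description: "One-sentence summary of the comment" },
    sentiment: { type: "string", enum: ["positive", "neutral", "negative"] },
    storyTitle: { type: "string" },
    objectID: { type: "string" },
  },
  required: ["summary", "sentiment"],
} as const;
```

Constraining the model's output to a schema like this is what makes the downstream markdown step reliable: every parallel call yields the same fields.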

<br/>

Finally, we use ComputeText to generate a markdown summary of all the extracted JSON, and stream the results. Streaming on Substrate is really cool: you can of course stream the response of an individual LLM, but you can also stream the incremental steps of your workflow.

```typescript
const markdown = new ComputeText({
  prompt: sb.concat(
    `Below is a list of summarized comments about ${query} on Hacker News.
    Generate concise markdown summarizing the results.
    Summarize the contents of the comment and the sentiment about ${query}.
    Categorize results under sentiment headers.
    Order from most negative to least negative within each category.
    Add a link to the original story URL in this format: [<story title>](https://news.ycombinator.com/item?id=<objectID>)
    Filter out posts that do not seem to be about ${query}.
    RESULTS:\n`,
    // Each node's json_object is a future, resolved when the graph runs
    ...summaries.map((s) => sb.jq(s.future.json_object, "@json")),
  ),
  model: "Llama3Instruct70B",
});
const stream = await substrate.stream(markdown);
```
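
The exact event shape of `substrate.stream` is best checked against the Substrate SDK docs; the consumption pattern itself is just async iteration. A mock sketch (the stream here is a stand-in, not the real SDK object):

```typescript
// Mock sketch of consuming a streamed markdown response. The real Substrate
// stream events may differ; here we assume an async iterable of text chunks.
async function* mockStream(): AsyncGenerator<string> {
  yield "## Negative\n";
  yield "- Complaints about docs\n";
}

async function collectStream(stream: AsyncIterable<string>): Promise<string> {
  let out = "";
  for await (const chunk of stream) {
    out += chunk; // in practice: process.stdout.write(chunk)
  }
  return out;
}
```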

<br/>

The code we wrote was really simple. Implicitly, we were creating the graph below, but we didn't have to think about the graph at all! With Substrate, simply by relating tasks to each other, we get automatic parallelization of dozens of LLM calls for free, with zero roundtrips.

Great power with great simplicity.

View the full source, fork, and remix here: https://www.val.town/v/substrate/hackerNewsRAG

- [Read on Twitter](https://x.com/vprtwn/status/1812844236401762513)
- [Read on LinkedIn](https://www.linkedin.com/pulse/rag-hacker-news-comments-34-lines-code-substratelabs-pouje)