<?xml version="1.0" encoding="UTF-8"?><urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9" xmlns:news="http://www.google.com/schemas/sitemap-news/0.9"><url><loc>https://dreaming.press/posts/sglang-spec-v2-speculative-decoding-default.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-03</news:publication_date><news:title>SGLang Makes Spec V2 the Default: Speculative Decoding Grows Up in v0.5.13</news:title></news:news></url><url><loc>https://dreaming.press/posts/programmatic-tool-calling-claude-explained.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-03</news:publication_date><news:title>Programmatic Tool Calling, Explained: When to Let Claude Orchestrate Your Tools in Code</news:title></news:news></url><url><loc>https://dreaming.press/posts/openai-agent-builder-evals-deprecation-migration.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-03</news:publication_date><news:title>OpenAI Is Retiring Agent Builder and Evals: Shutdown Dates and the Migration Path</news:title></news:news></url><url><loc>https://dreaming.press/posts/mcp-enterprise-managed-authorization.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-03</news:publication_date><news:title>MCP Enterprise-Managed Authorization: Zero-Touch OAuth Without the Consent Screens</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-evaluate-a-multi-agent-system.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-03</news:publication_date><news:title>How 
to Evaluate a Multi-Agent System</news:title></news:news></url><url><loc>https://dreaming.press/posts/gemini-3-flash-vs-pro-for-agents.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-03</news:publication_date><news:title>Gemini 3 Flash vs Pro for Agents: The Tier Inverted</news:title></news:news></url><url><loc>https://dreaming.press/posts/deepseek-v4-pro-vs-flash-for-agents.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-03</news:publication_date><news:title>DeepSeek V4 Pro vs Flash: Which One Goes in Your Agent Loop</news:title></news:news></url><url><loc>https://dreaming.press/posts/claude-sonnet-5-tokenizer-tax.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-03</news:publication_date><news:title>Claude Sonnet 5's Tokenizer Tax: Why the Same Rate Card Costs More Per Task</news:title></news:news></url><url><loc>https://dreaming.press/posts/agent-registry-vs-mcp-registry-discovery.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-03</news:publication_date><news:title>Agent Registry vs MCP Registry: The New Discovery Layer, and Why It's Already Fragmenting</news:title></news:news></url><url><loc>https://dreaming.press/posts/zero-trust-for-ai-agents.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Zero Trust for AI Agents: Why the New Frameworks Treat Your Agent as an Insider 
Threat</news:title></news:news></url><url><loc>https://dreaming.press/posts/vllm-vs-sglang-vs-lmdeploy.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>vLLM vs SGLang vs LMDeploy: Picking a Self-Hosted Inference Engine in 2026</news:title></news:news></url><url><loc>https://dreaming.press/posts/text-to-sql-accuracy-spider-vs-bird.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Text-to-SQL Accuracy in 2026: Why the Benchmark Says 90% and Your Warehouse Says 40%</news:title></news:news></url><url><loc>https://dreaming.press/posts/stainless-alternatives-sdk-mcp-generators.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Stainless Is Winding Down: Where to Generate SDKs and MCP Servers Now</news:title></news:news></url><url><loc>https://dreaming.press/posts/rag-faithfulness-vs-groundedness-vs-correctness.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Faithfulness vs Groundedness vs Correctness: Which RAG Hallucination Check Catches a Wrong Answer</news:title></news:news></url><url><loc>https://dreaming.press/posts/qwen3-vs-nemotron-nano-vs-phi-vs-gemma-for-agents.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>The Best Small Model for Your Agent Isn't the Smallest — or the 
Smartest</news:title></news:news></url><url><loc>https://dreaming.press/posts/pydantic-ai-v2-capabilities-harness.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Pydantic AI V2 Is Out: What 'Capabilities' and the Harness Actually Change</news:title></news:news></url><url><loc>https://dreaming.press/posts/pi-minimal-coding-agent-harness.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Pi's System Prompt Is Under 1,000 Tokens: The Case Against Heavy Coding-Agent Harnesses</news:title></news:news></url><url><loc>https://dreaming.press/posts/nsa-mcp-security-guidance.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>The NSA's MCP Security Guidance: The First Advice That Defends Against Your Own Agent</news:title></news:news></url><url><loc>https://dreaming.press/posts/minimax-m3-open-weight-1m-context.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>MiniMax M3: Frontier Coding and 1M Context on Open Weights — Read the Latency, Not the Leaderboard</news:title></news:news></url><url><loc>https://dreaming.press/posts/mcp-deprecates-sampling-roots-logging.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>MCP Is Deprecating Sampling, Roots, and Logging: What the 2026-07-28 Spec Cuts and 
Why</news:title></news:news></url><url><loc>https://dreaming.press/posts/mcp-2026-spec-security-new-attack-surfaces.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>MCP's Stateless Spec Fixes Session Hijacking — and Hands You Three New Attack Surfaces</news:title></news:news></url><url><loc>https://dreaming.press/posts/mastra-npm-supply-chain-attack.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>The Mastra npm Attack: AI Agent Frameworks Are the New Supply-Chain Target</news:title></news:news></url><url><loc>https://dreaming.press/posts/llm-cascade-vs-router.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>LLM Cascade vs Router: Escalate to a Bigger Model, or Route Around It?</news:title></news:news></url><url><loc>https://dreaming.press/posts/langmem-vs-mem0.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>LangMem vs Mem0: Memory You Program vs Memory You Call</news:title></news:news></url><url><loc>https://dreaming.press/posts/interleaved-thinking-agents-reason-between-tool-calls.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Interleaved Thinking: When Should an AI Agent Reason Between Tool 
Calls?</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-enforce-a-token-budget-on-an-ai-agent.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>How to Enforce a Token Budget on an AI Agent (Not Just Measure It)</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-distribute-an-mcp-server-oci-vs-registry.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>How MCP Servers Actually Ship: The Registry Is a Phone Book, OCI Is the Supply Chain</news:title></news:news></url><url><loc>https://dreaming.press/posts/google-always-on-memory-agent.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Google Open-Sourced an Agent Memory System With No Vector Database. Read the Design.</news:title></news:news></url><url><loc>https://dreaming.press/posts/does-structured-output-hurt-llm-accuracy.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Does Structured Output Hurt LLM Accuracy? 
The Format Tax, Measured</news:title></news:news></url><url><loc>https://dreaming.press/posts/claude-sonnet-5-vs-opus-4-8-for-agents.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Claude Sonnet 5 vs Opus 4.8 for Agents: The Cheaper Model and the Tokenizer Catch</news:title></news:news></url><url><loc>https://dreaming.press/posts/claude-dreaming-agent-memory-consolidation.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>What Anthropic's 'Dreaming' Does to Agent Memory — and Why a Bad Dream Doesn't Wash Out</news:title></news:news></url><url><loc>https://dreaming.press/posts/batch-api-vs-real-time-llm-inference.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Batch API vs Real-Time Inference: The 50% Discount Isn't Why You Should Use It</news:title></news:news></url><url><loc>https://dreaming.press/posts/aws-cloudfront-x402-charge-ai-agents-per-request.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>AWS Will Now Let You Charge AI Agents Per Request: How x402 Metering at the CDN Edge Works</news:title></news:news></url><url><loc>https://dreaming.press/posts/agent-skills-open-standard-portability.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Agent Skills Are an Open Standard: What Portability Buys — and What It Can't 
Enforce</news:title></news:news></url><url><loc>https://dreaming.press/posts/agent-handoffs-langgraph-openai-adk.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Agent Handoffs in LangGraph, OpenAI Agents SDK, and Google ADK: What Actually Transfers With Control</news:title></news:news></url><url><loc>https://dreaming.press/posts/tool-choice-auto-vs-required-vs-forced.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Tool Choice: auto vs required vs Forcing One Tool</news:title></news:news></url><url><loc>https://dreaming.press/posts/telemem-vs-mem0.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>TeleMem vs Mem0: When a Drop-In Memory Layer Is Really a Different Bet</news:title></news:news></url><url><loc>https://dreaming.press/posts/right-to-be-forgotten-vector-database.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Right to Be Forgotten in RAG: How to Actually Delete a User From a Vector Database</news:title></news:news></url><url><loc>https://dreaming.press/posts/qdrant-vs-milvus-vs-weaviate.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Qdrant vs Milvus vs Weaviate: Filtered Search Is the Question That Separates 
Them</news:title></news:news></url><url><loc>https://dreaming.press/posts/prompt-injection-to-rce-agent-allowlist-bypass.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>When Prompt Injection Becomes Remote Code Execution: Why Agent Command Allowlists Keep Failing</news:title></news:news></url><url><loc>https://dreaming.press/posts/mcp-server-cards-well-known-discovery.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>MCP Server Cards: How an Agent Will Vet a Server Before It Connects</news:title></news:news></url><url><loc>https://dreaming.press/posts/mcp-confused-deputy-problem.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>The Confused Deputy Problem in MCP: Why Agent Auth Keeps Failing the Same Way</news:title></news:news></url><url><loc>https://dreaming.press/posts/mcp-bench-vs-mcptoolbench-vs-mcpagentbench.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>MCP-Bench vs MCPToolBench++ vs MCPAgentBench: How to Benchmark an Agent's MCP Tool Use</news:title></news:news></url><url><loc>https://dreaming.press/posts/llm-cost-attribution-per-agent-and-tenant.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How to Attribute LLM Costs Per Agent, Tenant, and 
Feature</news:title></news:news></url><url><loc>https://dreaming.press/posts/hyperlight-vs-firecracker.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Hyperlight vs Firecracker: The Micro-VM That Deleted the Guest Kernel to Sandbox Agent Code</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-vulnerable-are-mcp-servers.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How Vulnerable Are MCP Servers? A Scan of 39,884 Repos Found 106 Zero-Days</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-tune-hnsw-vector-search.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How to Tune HNSW: The Three Knobs Behind Vector Search Recall</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-summarize-a-document-too-long-for-the-context-window.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How to Summarize a Document That Doesn't Fit in the Context Window: Map-Reduce vs Refine vs Not at All</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-handle-a-truncated-llm-response.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How to Handle a Truncated LLM Response: finish_reason, max_tokens, and the Reasoning-Token 
Trap</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-evaluate-an-ai-coding-agent.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How to Evaluate an AI Coding Agent</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-deploy-a-long-running-ai-agent-without-losing-in-flight-work.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How to Deploy a Long-Running AI Agent Without Losing In-Flight Work</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-ai-agents-forget-memory-consolidation.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How AI Agents Decide What to Forget: Memory Consolidation in Mem0, Zep, and the Memory Tool</news:title></news:news></url><url><loc>https://dreaming.press/posts/gpt-5-5-vs-claude-opus-4-8-vs-gemini-for-coding.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>The Best AI Model for Coding Agents in 2026 Is Half a Harness</news:title></news:news></url><url><loc>https://dreaming.press/posts/gateway-api-inference-extension.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Kubernetes' Gateway API Inference Extension: When the Load Balancer Starts Reading GPU 
Metrics</news:title></news:news></url><url><loc>https://dreaming.press/posts/every-ai-agent-framework-became-a-graph.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Every AI Agent Framework Became a Graph in 2026 — and the Hard Part Is Still Unsolved</news:title></news:news></url><url><loc>https://dreaming.press/posts/declarative-agents-yaml-vs-code.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Declarative Agents: When a YAML File Should Define Your Agent — and When It Can't</news:title></news:news></url><url><loc>https://dreaming.press/posts/cross-cluster-llm-serving.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Cross-Cluster LLM Serving: Why KServe, llm-d, and Dynamo Stop at the Cluster Line</news:title></news:news></url><url><loc>https://dreaming.press/posts/context-compaction-erases-agent-guardrails.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Context Compaction Is Quietly Deleting Your Agent's Guardrails</news:title></news:news></url><url><loc>https://dreaming.press/posts/brute-force-vs-approximate-vector-search.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Brute-Force vs Approximate Vector Search: Do You Even Need a Vector 
Database?</news:title></news:news></url><url><loc>https://dreaming.press/posts/amazon-q-rce-coding-agent-folder-trust.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>When &quot;Trust This Folder&quot; Means Remote Code Execution: The Amazon Q Flaw Every Coding Agent Shipped</news:title></news:news></url><url><loc>https://dreaming.press/posts/ai-browser-prompt-injection.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Why AI Browsers Still Can't Stop Prompt Injection</news:title></news:news></url><url><loc>https://dreaming.press/posts/ai-agents-finding-zero-days.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>AI Agents Are Finding Real Zero-Days at Scale — and Drowning Maintainers in Fake Ones</news:title></news:news></url><url><loc>https://dreaming.press/posts/ai-agent-goal-drift.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>AI Agent Goal Drift: Why Long-Running Agents Quietly Abandon the Task You Gave Them</news:title></news:news></url><url><loc>https://dreaming.press/posts/agent-memory-token-cost-read-vs-write.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How Many Tokens Does an Agent Memory Layer Use? From 7K to 3.26M per Query</news:title></news:news></url></urlset>