<?xml version="1.0" encoding="UTF-8"?><urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9" xmlns:news="http://www.google.com/schemas/sitemap-news/0.9"><url><loc>https://dreaming.press/posts/vllm-vs-sglang-vs-lmdeploy.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>vLLM vs SGLang vs LMDeploy: Picking a Self-Hosted Inference Engine in 2026</news:title></news:news></url><url><loc>https://dreaming.press/posts/stainless-alternatives-sdk-mcp-generators.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Stainless Is Winding Down: Where to Generate SDKs and MCP Servers Now</news:title></news:news></url><url><loc>https://dreaming.press/posts/mastra-npm-supply-chain-attack.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>The Mastra npm Attack: AI Agent Frameworks Are the New Supply-Chain Target</news:title></news:news></url><url><loc>https://dreaming.press/posts/google-always-on-memory-agent.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Google Open-Sourced an Agent Memory System With No Vector Database. 
Read the Design.</news:title></news:news></url><url><loc>https://dreaming.press/posts/claude-sonnet-5-vs-opus-4-8-for-agents.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-02</news:publication_date><news:title>Claude Sonnet 5 vs Opus 4.8 for Agents: The Cheaper Model and the Tokenizer Catch</news:title></news:news></url><url><loc>https://dreaming.press/posts/tool-choice-auto-vs-required-vs-forced.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Tool Choice: auto vs required vs Forcing One Tool</news:title></news:news></url><url><loc>https://dreaming.press/posts/telemem-vs-mem0.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>TeleMem vs Mem0: When a Drop-In Memory Layer Is Really a Different Bet</news:title></news:news></url><url><loc>https://dreaming.press/posts/right-to-be-forgotten-vector-database.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Right to Be Forgotten in RAG: How to Actually Delete a User From a Vector Database</news:title></news:news></url><url><loc>https://dreaming.press/posts/qdrant-vs-milvus-vs-weaviate.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Qdrant vs Milvus vs Weaviate: Filtered Search Is the Question That Separates 
Them</news:title></news:news></url><url><loc>https://dreaming.press/posts/prompt-injection-to-rce-agent-allowlist-bypass.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>When Prompt Injection Becomes Remote Code Execution: Why Agent Command Allowlists Keep Failing</news:title></news:news></url><url><loc>https://dreaming.press/posts/mcp-server-cards-well-known-discovery.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>MCP Server Cards: How an Agent Will Vet a Server Before It Connects</news:title></news:news></url><url><loc>https://dreaming.press/posts/mcp-confused-deputy-problem.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>The Confused Deputy Problem in MCP: Why Agent Auth Keeps Failing the Same Way</news:title></news:news></url><url><loc>https://dreaming.press/posts/mcp-bench-vs-mcptoolbench-vs-mcpagentbench.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>MCP-Bench vs MCPToolBench++ vs MCPAgentBench: How to Benchmark an Agent's MCP Tool Use</news:title></news:news></url><url><loc>https://dreaming.press/posts/llm-cost-attribution-per-agent-and-tenant.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How to Attribute LLM Costs Per Agent, Tenant, and 
Feature</news:title></news:news></url><url><loc>https://dreaming.press/posts/hyperlight-vs-firecracker.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Hyperlight vs Firecracker: The Micro-VM That Deleted the Guest Kernel to Sandbox Agent Code</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-vulnerable-are-mcp-servers.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How Vulnerable Are MCP Servers? A Scan of 39,884 Repos Found 106 Zero-Days</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-tune-hnsw-vector-search.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How to Tune HNSW: The Three Knobs Behind Vector Search Recall</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-summarize-a-document-too-long-for-the-context-window.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How to Summarize a Document That Doesn't Fit in the Context Window: Map-Reduce vs Refine vs Not at All</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-handle-a-truncated-llm-response.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How to Handle a Truncated LLM Response: finish_reason, max_tokens, and the Reasoning-Token 
Trap</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-evaluate-an-ai-coding-agent.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How to Evaluate an AI Coding Agent</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-deploy-a-long-running-ai-agent-without-losing-in-flight-work.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How to Deploy a Long-Running AI Agent Without Losing In-Flight Work</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-ai-agents-forget-memory-consolidation.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How AI Agents Decide What to Forget: Memory Consolidation in Mem0, Zep, and the Memory Tool</news:title></news:news></url><url><loc>https://dreaming.press/posts/gpt-5-5-vs-claude-opus-4-8-vs-gemini-for-coding.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>The Best AI Model for Coding Agents in 2026 Is Half a Harness</news:title></news:news></url><url><loc>https://dreaming.press/posts/gateway-api-inference-extension.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Kubernetes' Gateway API Inference Extension: When the Load Balancer Starts Reading GPU 
Metrics</news:title></news:news></url><url><loc>https://dreaming.press/posts/every-ai-agent-framework-became-a-graph.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Every AI Agent Framework Became a Graph in 2026 — and the Hard Part Is Still Unsolved</news:title></news:news></url><url><loc>https://dreaming.press/posts/declarative-agents-yaml-vs-code.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Declarative Agents: When a YAML File Should Define Your Agent — and When It Can't</news:title></news:news></url><url><loc>https://dreaming.press/posts/cross-cluster-llm-serving.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Cross-Cluster LLM Serving: Why KServe, llm-d, and Dynamo Stop at the Cluster Line</news:title></news:news></url><url><loc>https://dreaming.press/posts/context-compaction-erases-agent-guardrails.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Context Compaction Is Quietly Deleting Your Agent's Guardrails</news:title></news:news></url><url><loc>https://dreaming.press/posts/brute-force-vs-approximate-vector-search.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Brute-Force vs Approximate Vector Search: Do You Even Need a Vector 
Database?</news:title></news:news></url><url><loc>https://dreaming.press/posts/amazon-q-rce-coding-agent-folder-trust.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>When &quot;Trust This Folder&quot; Means Remote Code Execution: The Amazon Q Flaw Every Coding Agent Shipped</news:title></news:news></url><url><loc>https://dreaming.press/posts/ai-browser-prompt-injection.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>Why AI Browsers Still Can't Stop Prompt Injection</news:title></news:news></url><url><loc>https://dreaming.press/posts/ai-agents-finding-zero-days.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>AI Agents Are Finding Real Zero-Days at Scale — and Drowning Maintainers in Fake Ones</news:title></news:news></url><url><loc>https://dreaming.press/posts/ai-agent-goal-drift.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>AI Agent Goal Drift: Why Long-Running Agents Quietly Abandon the Task You Gave Them</news:title></news:news></url><url><loc>https://dreaming.press/posts/agent-memory-token-cost-read-vs-write.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-07-01</news:publication_date><news:title>How Many Tokens Does an Agent Memory Layer Use? 
From 7K to 3.26M per Query</news:title></news:news></url><url><loc>https://dreaming.press/posts/web-bot-auth-explained-ai-agents.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Web Bot Auth, Explained: How a Site Will Tell Your AI Agent From a Scraper</news:title></news:news></url><url><loc>https://dreaming.press/posts/vercel-eve-vs-microsoft-agent-framework.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Vercel eve vs Microsoft Agent Framework: Portable Agent, or Portable Runtime?</news:title></news:news></url><url><loc>https://dreaming.press/posts/unisound-u2-native-agentic-model.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Unisound U2 and the Bet on 'Native Agentic' Models: When the Loop Moves Into the Weights</news:title></news:news></url><url><loc>https://dreaming.press/posts/spot-gpus-for-llm-inference.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Spot GPUs for LLM Inference: How to Cut Serving Cost Without Dropping Requests</news:title></news:news></url><url><loc>https://dreaming.press/posts/skyvern-vs-browser-use.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Skyvern vs Browser Use: You're Not Picking a Browser Agent, You're Picking How It Sees the 
Page</news:title></news:news></url><url><loc>https://dreaming.press/posts/provider-agnostic-ai-agents.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Provider-Agnostic AI Agents: The Lock-In Isn't Where You Think</news:title></news:news></url><url><loc>https://dreaming.press/posts/open-source-deep-research-agents.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Open-Source Deep Research Agents: 7 Repos to Build (or Run) Your Own</news:title></news:news></url><url><loc>https://dreaming.press/posts/mcp-vs-rest-api-for-agents.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>MCP vs REST: Do Your Agents Need a Protocol, or Just Your API?</news:title></news:news></url><url><loc>https://dreaming.press/posts/mcp-goes-stateless-2026-07-28-spec.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>MCP Goes Stateless: What the 2026-07-28 Spec Changes for Agent Builders</news:title></news:news></url><url><loc>https://dreaming.press/posts/locomo-vs-longmemeval-vs-beam-agent-memory.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Agent Memory Benchmarks: LoCoMo vs LongMemEval vs 
BEAM</news:title></news:news></url><url><loc>https://dreaming.press/posts/llm-judge-bias.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Your LLM Judge Is Biased: Position, Verbosity, and Self-Preference — and Which Ones You Can Fix</news:title></news:news></url><url><loc>https://dreaming.press/posts/langchain-1-0-and-langgraph-1-0-whats-new.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>LangChain 1.0 and LangGraph 1.0: What Actually Changed for Agent Builders</news:title></news:news></url><url><loc>https://dreaming.press/posts/kafka-vs-nats-vs-redis-streams-ai-agents.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Kafka vs NATS vs Redis Streams: Choosing the Event Backbone for AI Agent Systems</news:title></news:news></url><url><loc>https://dreaming.press/posts/jailbreak-vs-prompt-injection.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Jailbreak vs Prompt Injection: Two Attacks That Live in Different Layers</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-write-a-system-prompt-for-an-ai-agent.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>How to Write a System Prompt for an AI 
Agent</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-ship-ai-agent-changes-safely.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>How to Ship an AI Agent Change Without Breaking It: Eval Gates, Shadow Replay, and Why Canaries Lie</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-read-an-agent-memory-benchmark.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>How to Read an Agent-Memory Benchmark: The LoCoMo and LongMemEval Number Wars</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-evaluate-an-embedding-model-on-your-own-data.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>How to Evaluate an Embedding Model on Your Own Data</news:title></news:news></url><url><loc>https://dreaming.press/posts/how-to-evaluate-a-deep-research-agent.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>How to Evaluate a Deep Research Agent: Report Quality vs. 
Citation Accuracy</news:title></news:news></url><url><loc>https://dreaming.press/posts/glm-5-2-open-weight-agentic-coding.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>GLM-5.2 Matched the Closed Models on Agentic Coding — for a Sixth of the Cost</news:title></news:news></url><url><loc>https://dreaming.press/posts/expose-agent-as-mcp-server.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Your Agent Is Now an MCP Server: What Exposing an Agent as a Tool Quietly Throws Away</news:title></news:news></url><url><loc>https://dreaming.press/posts/eval-driven-development-for-ai-agents.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Eval-Driven Development: How to Ship an AI Agent Without Guessing</news:title></news:news></url><url><loc>https://dreaming.press/posts/eu-ai-act-for-ai-agents.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>The EU AI Act Deadline Didn't Really Move: What Still Hits AI Agents on August 2</news:title></news:news></url><url><loc>https://dreaming.press/posts/claude-agent-sdk-vs-openai-agents-sdk.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Claude Agent SDK vs OpenAI Agents SDK: A Harness vs an Orchestration 
Library</news:title></news:news></url><url><loc>https://dreaming.press/posts/bedrock-agentcore-vs-vertex-agent-engine-vs-foundry-hosted-agents.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Bedrock AgentCore vs Vertex Agent Engine vs Foundry Hosted Agents: The Managed Agent Runtime, Compared</news:title></news:news></url><url><loc>https://dreaming.press/posts/autoscaling-llm-inference-on-kubernetes.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Autoscaling LLM Inference on Kubernetes: Scale on the Queue, Not the GPU</news:title></news:news></url><url><loc>https://dreaming.press/posts/any-llm-vs-litellm.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Any-LLM vs LiteLLM: You're Comparing a Library to a Building</news:title></news:news></url><url><loc>https://dreaming.press/posts/ai-agent-sprawl-governance-registry.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>Agent Sprawl: Why AI Agent Governance Now Starts With a Registry</news:title></news:news></url><url><loc>https://dreaming.press/posts/ai-agent-act-warner-bill-explained.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>The AI AGENT Act, Explained: Warner's Bill Treats Blocking Your Agent as the 
Harm</news:title></news:news></url><url><loc>https://dreaming.press/posts/a2a-protocol-at-one-year-adoption-reality.html</loc><news:news><news:publication><news:name>dreaming.press</news:name><news:language>en</news:language></news:publication><news:publication_date>2026-06-30</news:publication_date><news:title>A2A at One Year: Is Agent-to-Agent Interoperability Actually Happening?</news:title></news:news></url></urlset>