<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:dc="http://purl.org/dc/elements/1.1/" version="2.0">
  <channel>
    <title>InfoQ - Observability</title>
    <link>https://www.infoq.com</link>
    <description>InfoQ Observability feed</description>
    <item>
      <title>Article: Kernel-Level Ground Truth: Why eBPF is Replacing User-Space Agents for Security Observability</title>
      <link>https://www.infoq.com/articles/ebpf-for-security-observability/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Observability</link>
      <description>&lt;img src="https://res.infoq.com/articles/ebpf-for-security-observability/en/headerimage/ebpf-for-security-observability-header-1778674557176.jpg"/&gt;&lt;p&gt;eBPF is emerging as a preferred method for security observability over traditional user-space agents. By attaching probes directly to the Linux kernel's syscall interface, it provides consistent visibility even during container-level compromises. eBPF reduces security-related CPU consumption and limits data volume by performing filtering at the kernel level, enhancing operational efficiency.&lt;/p&gt; &lt;i&gt;By Niranjan Sharma&lt;/i&gt;</description>
      <category>Application Security</category>
      <category>eBPF</category>
      <category>Observability</category>
      <category>DevOps</category>
      <category>article</category>
      <pubDate>Tue, 19 May 2026 09:00:00 GMT</pubDate>
      <guid>https://www.infoq.com/articles/ebpf-for-security-observability/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Observability</guid>
      <dc:creator>Niranjan Sharma</dc:creator>
      <dc:date>2026-05-19T09:00:00Z</dc:date>
      <dc:identifier>/articles/ebpf-for-security-observability/en</dc:identifier>
    </item>
    <item>
      <title>Cloudflare Introduces Workflows V2 with Deterministic Execution and 50K Concurrent Workflows</title>
      <link>https://www.infoq.com/news/2026/05/cloudflare-workflows-v2-release/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Observability</link>
      <description>&lt;img src="https://res.infoq.com/news/2026/05/cloudflare-workflows-v2-release/en/headerimage/generatedHeaderImage-1777438019188.jpg"/&gt;&lt;p&gt;Cloudflare introduces Workflows V2, a redesigned distributed workflow orchestration system with deterministic replayable execution, improved observability, and major scaling upgrades, including 50,000 concurrent instances and 2M queued workflows. It supports AI agents, data pipelines, and background processing with improved reliability across distributed systems.&lt;/p&gt; &lt;i&gt;By Leela Kumili&lt;/i&gt;</description>
      <category>Event Driven Architecture</category>
      <category>Microservices</category>
      <category>Serverless</category>
      <category>Scalability</category>
      <category>Orchestration</category>
      <category>Observability</category>
      <category>AI Architecture</category>
      <category>Data Pipelines</category>
      <category>Cloud Computing</category>
      <category>Agents</category>
      <category>Concurrency</category>
      <category>Cloudflare</category>
      <category>Windows Workflow Foundation</category>
      <category>Development</category>
      <category>Architecture &amp; Design</category>
      <category>news</category>
      <pubDate>Fri, 15 May 2026 14:04:00 GMT</pubDate>
      <guid>https://www.infoq.com/news/2026/05/cloudflare-workflows-v2-release/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Observability</guid>
      <dc:creator>Leela Kumili</dc:creator>
      <dc:date>2026-05-15T14:04:00Z</dc:date>
      <dc:identifier>/news/2026/05/cloudflare-workflows-v2-release/en</dc:identifier>
    </item>
    <item>
      <title>Pinterest Engineers Eliminate CPU Zombies to Resolve Production Bottlenecks</title>
      <link>https://www.infoq.com/news/2026/05/pinterest-cpu-zombies-bottleneck/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Observability</link>
      <description>&lt;img src="https://res.infoq.com/news/2026/05/pinterest-cpu-zombies-bottleneck/en/headerimage/header-1778308038640.jpeg"/&gt;&lt;p&gt;Pinterest identified and resolved CPU starvation issues that affected machine learning training jobs on its Kubernetes-based platform, PinCompute. The engineers traced the problem to an unused Amazon ECS agent, which caused memory cgroup leaks. By disabling the agent, they stabilised performance. This case illustrates the importance of understanding system defaults for effective troubleshooting.&lt;/p&gt; &lt;i&gt;By Mark Silvester&lt;/i&gt;</description>
      <category>Performance</category>
      <category>Debugging</category>
      <category>Performance Tuning</category>
      <category>Observability</category>
      <category>DevOps</category>
      <category>Development</category>
      <category>Architecture &amp; Design</category>
      <category>news</category>
      <pubDate>Thu, 14 May 2026 10:00:00 GMT</pubDate>
      <guid>https://www.infoq.com/news/2026/05/pinterest-cpu-zombies-bottleneck/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Observability</guid>
      <dc:creator>Mark Silvester</dc:creator>
      <dc:date>2026-05-14T10:00:00Z</dc:date>
      <dc:identifier>/news/2026/05/pinterest-cpu-zombies-bottleneck/en</dc:identifier>
    </item>
    <item>
      <title>Grafana's Pyroscope 2.0 Makes Continuous Profiling Practical at Scale</title>
      <link>https://www.infoq.com/news/2026/05/pyroscope-2-profiling/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Observability</link>
      <description>&lt;img src="https://res.infoq.com/news/2026/05/pyroscope-2-profiling/en/headerimage/generatedHeaderImage-1778539051167.jpg"/&gt;&lt;p&gt;Grafana Labs has launched Pyroscope 2.0, a rearchitected open-source continuous profiling database. This version improves storage costs, query performance, and operational complexity. Key changes include single write paths for profiles, stateless query processing, and enhanced capabilities for profiling data. It supports the OpenTelemetry Protocol, aligning with current trends in observability.&lt;/p&gt; &lt;i&gt;By Matt Saunders&lt;/i&gt;</description>
      <category>Grafana</category>
      <category>Observability</category>
      <category>DevOps</category>
      <category>news</category>
      <pubDate>Wed, 13 May 2026 08:00:00 GMT</pubDate>
      <guid>https://www.infoq.com/news/2026/05/pyroscope-2-profiling/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Observability</guid>
      <dc:creator>Matt Saunders</dc:creator>
      <dc:date>2026-05-13T08:00:00Z</dc:date>
      <dc:identifier>/news/2026/05/pyroscope-2-profiling/en</dc:identifier>
    </item>
    <item>
      <title>Netflix Serves 84% of Query Results from Cache with Interval-Aware Caching in Apache Druid</title>
      <link>https://www.infoq.com/news/2026/05/netflix-druid-interval-cache/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Observability</link>
      <description>&lt;img src="https://res.infoq.com/news/2026/05/netflix-druid-interval-cache/en/headerimage/generatedHeaderImage-1777092326529.jpg"/&gt;&lt;p&gt;Netflix improves Apache Druid performance with interval aware caching, serving 84% of analytics results from cache and reducing query load by 33%. The system decomposes rolling window queries into reusable time segments, enabling partial cache reuse and recomputation only for recent data. At scale, it reduces scan volume, improves P90 latency, and optimizes real time analytics workloads.&lt;/p&gt; &lt;i&gt;By Leela Kumili&lt;/i&gt;</description>
      <category>Time Series Data</category>
      <category>Data Analytics</category>
      <category>Caching</category>
      <category>Apache</category>
      <category>Observability</category>
      <category>Distributed Systems</category>
      <category>Optimization</category>
      <category>Development</category>
      <category>Architecture &amp; Design</category>
      <category>news</category>
      <pubDate>Mon, 11 May 2026 14:36:00 GMT</pubDate>
      <guid>https://www.infoq.com/news/2026/05/netflix-druid-interval-cache/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Observability</guid>
      <dc:creator>Leela Kumili</dc:creator>
      <dc:date>2026-05-11T14:36:00Z</dc:date>
      <dc:identifier>/news/2026/05/netflix-druid-interval-cache/en</dc:identifier>
    </item>
    <item>
      <title>Article: Local-First AI Inference: a Cloud Architecture Pattern for Cost-Effective Document Processing</title>
      <link>https://www.infoq.com/articles/local-first-ai-inference-cloud/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Observability</link>
      <description>&lt;img src="https://res.infoq.com/articles/local-first-ai-inference-cloud/en/headerimage/Local-First-AI-Inference-A-Cloud-Architecture-Pattern-for-Cost-Effective-Document-Processing-header-1778141518292.jpg"/&gt;&lt;p&gt;The Local-First AI Inference pattern routes 70–80% of documents to deterministic local extraction at zero API cost, reserving Azure OpenAI calls for edge cases and flagging low-confidence results for human review. Deployed on 4,700 engineering drawing PDFs, it cut API costs by 75% and processing time by 55%, while bounding errors through a human review tier.&lt;/p&gt; &lt;i&gt;By Obinna Iheanachor&lt;/i&gt;</description>
      <category>Generative AI</category>
      <category>Cost Optimization</category>
      <category>Model Inference</category>
      <category>Cloud</category>
      <category>GPT-4</category>
      <category>Artificial Intelligence</category>
      <category>Observability</category>
      <category>Azure</category>
      <category>Microsoft Azure</category>
      <category>AI, ML &amp; Data Engineering</category>
      <category>DevOps</category>
      <category>Development</category>
      <category>article</category>
      <pubDate>Mon, 11 May 2026 11:00:00 GMT</pubDate>
      <guid>https://www.infoq.com/articles/local-first-ai-inference-cloud/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Observability</guid>
      <dc:creator>Obinna Iheanachor</dc:creator>
      <dc:date>2026-05-11T11:00:00Z</dc:date>
      <dc:identifier>/articles/local-first-ai-inference-cloud/en</dc:identifier>
    </item>
  </channel>
</rss>
