<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:dc="http://purl.org/dc/elements/1.1/" version="2.0">
  <channel>
    <title>InfoQ - Site Reliability Engineering - News</title>
    <link>https://www.infoq.com</link>
    <description>InfoQ Site Reliability Engineering News feed</description>
    <item>
      <title>How a Culture of Data-Driven Conversations Can Support Platform Engineering</title>
      <link>https://www.infoq.com/news/2026/06/data-driven-platform-engineering/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Site+Reliability+Engineering-news</link>
      <description>&lt;img src="https://res.infoq.com/news/2026/06/data-driven-platform-engineering/en/headerimage/generatedHeaderImage-1780255652688.jpg"/&gt;&lt;p&gt;To provide SRE as a service, a team built a center of excellence, introducing Federated SREs and roles like production manager and technical tribe lead. They created a culture of data-driven conversations where SLOs and SLAs were democratised. Surviving growing cognitive load meant continuously simplifying architecture and embedding sovereignty and resilience into platform design decisions.&lt;/p&gt; &lt;i&gt;By Ben Linders&lt;/i&gt;</description>
      <category>Value &amp; Metrics</category>
      <category>Platform Engineering</category>
      <category>InfoQ Dev Summit Munich 2025</category>
      <category>QCon Software Development Conference</category>
      <category>Resilience</category>
      <category>Platforms</category>
      <category>Cloud</category>
      <category>Metrics</category>
      <category>Site Reliability Engineering</category>
      <category>Culture &amp; Methods</category>
      <category>news</category>
      <pubDate>Thu, 04 Jun 2026 11:54:00 GMT</pubDate>
      <guid>https://www.infoq.com/news/2026/06/data-driven-platform-engineering/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Site+Reliability+Engineering-news</guid>
      <dc:creator>Ben Linders</dc:creator>
      <dc:date>2026-06-04T11:54:00Z</dc:date>
      <dc:identifier>/news/2026/06/data-driven-platform-engineering/en</dc:identifier>
    </item>
    <item>
      <title>Google Cloud Suspends Railway's Production Account, Causing Eight-Hour Platform-Wide Outage</title>
      <link>https://www.infoq.com/news/2026/05/railway-gcp-account-outage/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Site+Reliability+Engineering-news</link>
      <description>&lt;img src="https://res.infoq.com/news/2026/05/railway-gcp-account-outage/en/headerimage/generatedHeaderImage-1779878225205.jpg"/&gt;&lt;p&gt;Google Cloud's automated systems suspended Railway's production account without notice, triggering an eight-hour platform-wide outage affecting 3 million users. The cascade took down workloads across all providers including AWS and bare metal because Railway's control plane was hosted on GCP. Railway is demoting GCP to backup-only status.&lt;/p&gt; &lt;i&gt;By Steef-Jan Wiggers&lt;/i&gt;</description>
      <category>Cloud Architecture</category>
      <category>Google</category>
      <category>Google Cloud Platform</category>
      <category>Google Cloud</category>
      <category>Cloud</category>
      <category>Site Reliability Engineering</category>
      <category>DevOps</category>
      <category>Development</category>
      <category>Architecture &amp; Design</category>
      <category>news</category>
      <pubDate>Sat, 30 May 2026 10:03:00 GMT</pubDate>
      <guid>https://www.infoq.com/news/2026/05/railway-gcp-account-outage/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Site+Reliability+Engineering-news</guid>
      <dc:creator>Steef-Jan Wiggers</dc:creator>
      <dc:date>2026-05-30T10:03:00Z</dc:date>
      <dc:identifier>/news/2026/05/railway-gcp-account-outage/en</dc:identifier>
    </item>
  </channel>
</rss>
