<?xml version="1.0" encoding="UTF-8"?>
<!--
  RSS 2.0 feed document containing a single channel with a single item.
  The "dc" prefix is bound to the Dublin Core elements namespace and is used
  by the per-item dc:creator, dc:date and dc:identifier elements below.
-->
<rss xmlns:dc="http://purl.org/dc/elements/1.1/" version="2.0">
  <channel>
    <!-- Channel-level metadata: display title, site link, short description. -->
    <title>InfoQ - Data Warehouse - News</title>
    <link>https://www.infoq.com</link>
    <description>InfoQ Data Warehouse News feed</description>
    <!-- The only entry in this channel. -->
    <item>
      <title>350PB, Millions of Events, One System: inside Uber’s Cross-Region Data Lake and Disaster Recovery</title>
      <!-- Article URL; the query string carries utm_* parameters (campaign, source, medium, term). -->
      <link>https://www.infoq.com/news/2026/01/uber-hivesync-data-lake/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Data+Warehouse-news</link>
      <!-- Entity-escaped HTML payload: a header img, a summary paragraph, and an italic byline. -->
      <description>&lt;img src="https://res.infoq.com/news/2026/01/uber-hivesync-data-lake/en/headerimage/generatedHeaderImage-1768281800202.jpg"/&gt;&lt;p&gt;Uber’s HiveSync is a sharded, cross-region batch replication system keeping Hive/HDFS data consistent across multiple regions. Handling 5M daily Hive events and 8PB of data replication, it uses event-driven jobs, hybrid RPC and DistCp strategies, DAG-based orchestration, and dynamic sharding, enabling disaster recovery, horizontal scaling, and 99.99% cross-region data accuracy.&lt;/p&gt; &lt;i&gt;By Leela Kumili&lt;/i&gt;</description>
      <!--
        Flat list of category labels, one element per label.
        Some labels overlap (Hive / Apache Hive, Hadoop / Apache Hadoop);
        the final entry, "news", is lowercase unlike the others.
      -->
      <category>Event Driven Architecture</category>
      <category>Hive</category>
      <category>Hadoop</category>
      <category>ETL</category>
      <category>Sharding</category>
      <category>MySQL</category>
      <category>Apache Hive</category>
      <category>Deployment / Datacenter</category>
      <category>State-machine</category>
      <category>Apache Hadoop</category>
      <category>Orchestration</category>
      <category>RPC</category>
      <category>Data Warehouse</category>
      <category>Database Replication</category>
      <category>Open Source</category>
      <category>Data Lake</category>
      <category>Architecture &amp; Design</category>
      <category>Development</category>
      <category>news</category>
      <!-- Publication time in RFC 822 style; same instant as dc:date below. -->
      <pubDate>Fri, 16 Jan 2026 15:00:00 GMT</pubDate>
      <!--
        Same URL as the link element above, tracking parameters included.
        NOTE(review): there is no isPermaLink attribute, so RSS 2.0 readers
        treat this value as a permalink by default. Confirm that keeping the
        utm_* parameters inside the identifier is intended.
      -->
      <guid>https://www.infoq.com/news/2026/01/uber-hivesync-data-lake/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Data+Warehouse-news</guid>
      <!-- Dublin Core extras: author name (matches the byline in the description), -->
      <!-- ISO 8601 UTC timestamp, and a site-relative article path. -->
      <!-- NOTE(review): the trailing "/en" segment is presumably a language code; confirm. -->
      <dc:creator>Leela Kumili</dc:creator>
      <dc:date>2026-01-16T15:00:00Z</dc:date>
      <dc:identifier>/news/2026/01/uber-hivesync-data-lake/en</dc:identifier>
    </item>
  </channel>
</rss>
