<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<!--
  RSS 2.0 feed for the "Apache" tag listing on marsettler.com.
  The <generator> element below names Hugo, so this file is presumably build output.
  NOTE(review): make lasting changes in the site's content or feed template rather than here (confirm).
  The atom prefix is declared on the root and is used only by the <atom:link> self link.
-->
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <!-- Channel metadata: display title, URL of the tag page, and a short summary. -->
    <title>Apache on Marsettler</title>
    <link>https://marsettler.com/tags/apache/</link>
    <description>Recent content in Apache on Marsettler</description>
    <generator>Hugo</generator>
    <language>en-us</language>
    <!-- Written with a +0900 offset, whereas the item pubDate below is written at +0000. -->
    <lastBuildDate>Tue, 07 Oct 2025 06:45:55 +0900</lastBuildDate>
    <!-- Self link: rel="self" gives the URL of this feed document, typed as application/rss+xml. -->
    <atom:link href="https://marsettler.com/tags/apache/index.xml" rel="self" type="application/rss+xml" />
    <!-- The only entry in this feed. Its <guid> repeats the <link> URL. -->
    <item>
      <title>Apache DataFusion</title>
      <link>https://marsettler.com/apache-datafusion/</link>
      <pubDate>Sun, 05 Oct 2025 00:00:00 +0000</pubDate>
      <guid>https://marsettler.com/apache-datafusion/</guid>
      <!--
        The description carries HTML as escaped text: angle brackets are written as &lt; and &gt;,
        double quotes as &#34;, and line breaks as &#xA;. After XML parsing the value is an HTML
        fragment made of three linked h2 headings, one paragraph, and a three-item list.
        Do not re-indent or wrap the element: whitespace inside it becomes part of the value.
      -->
      <description>&lt;h2 id=&#34;using-external-indexes-metadata-stores-catalogs-and-caches-to-accelerate-queries-on-apache-parquet-by-andrew-lamb-influxdata&#34;&gt;&lt;a href=&#34;https://datafusion.apache.org/blog/2025/08/15/external-parquet-indexes/&#34;&gt;Using External Indexes, Metadata Stores, Catalogs and Caches to Accelerate Queries on Apache Parquet by Andrew Lamb (InfluxData)&lt;/a&gt;&lt;/h2&gt;&#xA;&lt;h2 id=&#34;embedding-user-defined-indexes-in-apache-parquet-files-by-qi-zhu-cloudera-jigao-luo-systems-group-at-tu-darmstadt-and-andrew-lamb-influxdata&#34;&gt;&lt;a href=&#34;https://datafusion.apache.org/blog/2025/07/14/user-defined-parquet-indexes/&#34;&gt;Embedding User-Defined Indexes in Apache Parquet Files by Qi Zhu (Cloudera), Jigao Luo (Systems Group at TU Darmstadt), and Andrew Lamb (InfluxData)&lt;/a&gt;&lt;/h2&gt;&#xA;&lt;h2 id=&#34;apache-datafusion-4900-released&#34;&gt;&lt;a href=&#34;https://datafusion.apache.org/blog/2025/07/28/datafusion-49.0.0/&#34;&gt;Apache DataFusion 49.0.0 Released&lt;/a&gt;&lt;/h2&gt;&#xA;&lt;p&gt;Highlights I found impressive&lt;/p&gt;&#xA;&lt;ul&gt;&#xA;&lt;li&gt;Dynamic Filters and TopK pushdown&lt;/li&gt;&#xA;&lt;li&gt;Async User-Defined Functions (ask_llm?!)&lt;/li&gt;&#xA;&lt;li&gt;Better Cancellation for Certain Long-Running Queries&lt;/li&gt;&#xA;&lt;/ul&gt;</description>
    </item>
  </channel>
</rss>
