adbc-drivers
diff --git a/‎csharp/Benchmarks/CloudFetchBenchmarkRunner.cs‎
Lines changed: 7 additions & 0 deletions b/‎csharp/Benchmarks/CloudFetchBenchmarkRunner.cs‎
Lines changed: 7 additions & 0 deletions
diff --git a/‎csharp/Benchmarks/QuickValidation.cs‎
Lines changed: 90 additions & 0 deletions b/‎csharp/Benchmarks/QuickValidation.cs‎
Lines changed: 90 additions & 0 deletions
diff --git a/‎csharp/Benchmarks/benchmark-queries.json‎
Lines changed: 8 additions & 0 deletions b/‎csharp/Benchmarks/benchmark-queries.json‎
Lines changed: 8 additions & 0 deletions
diff --git a/‎csharp/src/DatabricksParameters.cs‎
Lines changed: 8 additions & 0 deletions b/‎csharp/src/DatabricksParameters.cs‎
Lines changed: 8 additions & 0 deletions
diff --git a/‎csharp/src/Http/HttpClientFactory.cs‎
Lines changed: 15 additions & 0 deletions b/‎csharp/src/Http/HttpClientFactory.cs‎
Lines changed: 15 additions & 0 deletions
diff --git a/‎csharp/src/Lz4Utilities.cs‎
Lines changed: 40 additions & 0 deletions b/‎csharp/src/Lz4Utilities.cs‎
Lines changed: 40 additions & 0 deletions
diff --git a/‎csharp/src/Reader/CloudFetch/CloudFetchConfiguration.cs‎
Lines changed: 21 additions & 6 deletions b/‎csharp/src/Reader/CloudFetch/CloudFetchConfiguration.cs‎
Lines changed: 21 additions & 6 deletions
@@ -43,6 +43,13 @@ public static void Main(string[] args)
             // Enable TLS 1.2/1.3 for .NET Framework 4.7.2 (required for modern HTTPS endpoints)
             ServicePointManager.SecurityProtocol = SecurityProtocolType.Tls12 | SecurityProtocolType.Tls11 | (SecurityProtocolType)3072; // 3072 = Tls13
 #endif
+            // Quick validation mode: run a single query to verify CloudFetch correctness
+            if (args.Length > 0 && args[0] == "--validate")
+            {
+                QuickValidation.RunValidation();
+                return;
+            }
+
             // Configure with custom columns for CloudFetch-specific metrics + built-in GC columns
             var config = DefaultConfig.Instance
                 .AddColumn(new ColumnsColumn())
 
@@ -0,0 +1,90 @@
+/*
+* Quick validation script for CloudFetch parity changes.
+* Runs catalog_returns SF10 query and reports row count + timing.
+*/
+
+using System;
+using System.Collections.Generic;
+using System.Diagnostics;
+using AdbcDrivers.Databricks;
+using AdbcDrivers.HiveServer2.Spark;
+
+namespace Apache.Arrow.Adbc.Benchmarks
+{
+    public class QuickValidation
+    {
+        public static void RunValidation()
+        {
+            string uri = Environment.GetEnvironmentVariable("DATABRICKS_URI")
+                ?? throw new InvalidOperationException("Set DATABRICKS_URI env var (e.g. https://host/sql/1.0/warehouses/id)");
+            string token = Environment.GetEnvironmentVariable("DATABRICKS_TOKEN")
+                ?? throw new InvalidOperationException("Set DATABRICKS_TOKEN env var");
+            string query = Environment.GetEnvironmentVariable("DATABRICKS_QUERY")
+                ?? "SELECT * FROM main.tpcds_sf10_delta.catalog_sales";
+            long expectedRows = long.Parse(
+                Environment.GetEnvironmentVariable("DATABRICKS_EXPECTED_ROWS") ?? "14400425");
+
+            Console.WriteLine("=== ADBC CloudFetch Validation ===");
+            Console.WriteLine($"Query: {query}");
+            Console.WriteLine($"Expected rows: {expectedRows}");
+
+            var parameters = new Dictionary<string, string>
+            {
+                [AdbcOptions.Uri] = uri,
+                [SparkParameters.Token] = token,
+                [DatabricksParameters.UseCloudFetch] = "true",
+                [DatabricksParameters.EnableDirectResults] = "true",
+                [DatabricksParameters.CanDecompressLz4] = "true",
+            };
+
+            var driver = new DatabricksDriver();
+            using var database = driver.Open(parameters);
+            using var connection = database.Connect(parameters);
+            using var statement = connection.CreateStatement();
+
+            statement.SqlQuery = query;
+
+            var sw = Stopwatch.StartNew();
+            var queryResult = statement.ExecuteQuery();
+
+            long totalRows = 0;
+            int totalBatches = 0;
+            long ttfrMs = 0;
+
+            using (var reader = queryResult.Stream)
+            {
+                while (true)
+                {
+                    var batch = reader.ReadNextRecordBatchAsync().Result;
+                    if (batch == null) break;
+
+                    totalBatches++;
+                    totalRows += batch.Length;
+
+                    if (totalBatches == 1)
+                    {
+                        ttfrMs = sw.ElapsedMilliseconds;
+                        Console.WriteLine($"TTFR_MS={ttfrMs}");
+                    }
+
+                    batch.Dispose();
+                }
+            }
+
+            sw.Stop();
+
+            Console.WriteLine($"TOTAL_ROWS={totalRows}");
+            Console.WriteLine($"TOTAL_BATCHES={totalBatches}");
+            Console.WriteLine($"TOTAL_TIME_MS={sw.ElapsedMilliseconds}");
+            Console.WriteLine($"ROWS_PER_SEC={totalRows / (sw.ElapsedMilliseconds / 1000.0):F0}");
+
+            if (totalRows != expectedRows)
+            {
+                Console.Error.WriteLine($"ROW COUNT MISMATCH! Expected {expectedRows}, got {totalRows}");
+                Environment.Exit(1);
+            }
+
+            Console.WriteLine("Row count verified OK.");
+        }
+    }
+}
@@ -7,6 +7,14 @@
     "columns": 23,
     "category": "large-wide"
   },
+  {
+    "name": "catalog_sales_sf10",
+    "description": "Catalog sales SF10 - 14.4M rows, 34 columns (CloudFetch parity benchmark with JDBC)",
+    "query": "select * from main.tpcds_sf10_delta.catalog_sales",
+    "expected_rows": 14400425,
+    "columns": 34,
+    "category": "large-wide"
+  },
   {
     "name": "catalog_sales",
     "description": "Catalog sales - 1.4M rows, 34 columns (current default)",
 
@@ -182,6 +182,14 @@ public class DatabricksParameters : SparkParameters
         /// </summary>
         public const string CloudFetchPrefetchEnabled = "adbc.databricks.cloudfetch.prefetch_enabled";
 
+        /// <summary>
+        /// Size of the link prefetch window — how many chunk links to fetch ahead of downloads.
+        /// Links are lightweight metadata, so a large window uses minimal memory while ensuring
+        /// the download pipeline never starves. Matches JDBC's LinkPrefetchWindow=128 default.
+        /// Default value is 128.
+        /// </summary>
+        public const string CloudFetchLinkPrefetchWindowSize = "adbc.databricks.cloudfetch.link_prefetch_window_size";
+
         /// <summary>
         /// Maximum bytes per fetch request when retrieving query results from servers.
         /// The value can be specified with unit suffixes: B (bytes), KB (kilobytes), MB (megabytes), GB (gigabytes).
 
@@ -17,6 +17,7 @@
 using System;
 using System.Collections.Generic;
 using System.Net.Http;
+using AdbcDrivers.Databricks.Reader.CloudFetch;
 using AdbcDrivers.HiveServer2;
 using AdbcDrivers.HiveServer2.Hive2;
 using AdbcDrivers.HiveServer2.Spark;
@@ -66,6 +67,8 @@ public static HttpClient CreateBasicHttpClient(IReadOnlyDictionary<string, strin
         /// <summary>
         /// Creates an HttpClient for CloudFetch downloads.
         /// Includes TLS and proxy settings but no auth headers (CloudFetch uses pre-signed URLs).
+        /// On .NET Framework 4.7.2, increases ServicePointManager.DefaultConnectionLimit to
+        /// support parallel downloads (default is 2 per server, which throttles CloudFetch).
         /// </summary>
         /// <param name="properties">Connection properties containing TLS and proxy configuration.</param>
         /// <returns>Configured HttpClient for CloudFetch.</returns>
@@ -76,6 +79,18 @@ public static HttpClient CreateCloudFetchHttpClient(IReadOnlyDictionary<string,
                 DatabricksParameters.CloudFetchTimeoutMinutes,
                 DatabricksConstants.DefaultCloudFetchTimeoutMinutes);
 
+#if NETFRAMEWORK || NETSTANDARD2_0
+            // .NET Framework defaults to 2 connections per server via ServicePointManager.
+            // CloudFetch uses 16 parallel downloads to cloud storage — the 2-connection limit
+            // throttles throughput to ~1/8th of what's possible. Raise to match ParallelDownloads.
+            int parallelDownloads = PropertyHelper.GetPositiveIntPropertyWithValidation(
+                properties,
+                DatabricksParameters.CloudFetchParallelDownloads,
+                CloudFetchConfiguration.DefaultParallelDownloads);
+            System.Net.ServicePointManager.DefaultConnectionLimit =
+                Math.Max(System.Net.ServicePointManager.DefaultConnectionLimit, parallelDownloads);
+#endif
+
             return CreateBasicHttpClient(properties, TimeSpan.FromMinutes(timeoutMinutes));
         }
 
 
@@ -170,5 +170,45 @@ public static async Task<RecyclableMemoryStream> DecompressLz4Async(
                 throw new AdbcException($"Failed to decompress LZ4 data: {ex.Message}", ex);
             }
         }
+        /// <summary>
+        /// Decompresses LZ4 data from a stream (e.g., HTTP response stream) without
+        /// buffering the compressed data as a byte[]. This saves one memory copy vs
+        /// DecompressLz4Async(byte[]) when the caller already has a stream.
+        /// </summary>
+        public static async Task<RecyclableMemoryStream> DecompressLz4FromStreamAsync(
+            Stream compressedStream,
+            RecyclableMemoryStreamManager memoryStreamManager,
+            ArrayPool<byte> bufferPool,
+            CancellationToken cancellationToken = default)
+        {
+            try
+            {
+                var outputStream = memoryStreamManager.GetStream();
+                try
+                {
+                    using (var decompressor = new CustomLZ4DecoderStream(
+                        compressedStream,
+                        descriptor => descriptor.CreateDecoder(),
+                        bufferPool,
+                        leaveOpen: false,
+                        interactive: false))
+                    {
+                        await decompressor.CopyToAsync(outputStream, DefaultBufferSize, cancellationToken).ConfigureAwait(false);
+                    }
+
+                    outputStream.Position = 0;
+                    return outputStream;
+                }
+                catch
+                {
+                    outputStream?.Dispose();
+                    throw;
+                }
+            }
+            catch (Exception ex)
+            {
+                throw new AdbcException($"Failed to decompress LZ4 stream: {ex.Message}", ex);
+            }
+        }
     }
 }
@@ -28,10 +28,16 @@ namespace AdbcDrivers.Databricks.Reader.CloudFetch
     /// </summary>
     internal sealed class CloudFetchConfiguration
     {
-        // Default values
-        internal const int DefaultParallelDownloads = 3;
-        internal const int DefaultPrefetchCount = 2;
-        internal const int DefaultMemoryBufferSizeMB = 200;
+        // Default values — tuned for CloudFetch parity with JDBC driver.
+        // ParallelDownloads: HTTP concurrency. 5 is a conservative bump from 3 that
+        // improves network utilization without excessive TCP/TLS overhead.
+        // PrefetchCount: controls resultQueue capacity (PrefetchCount * 2). This is
+        // the implicit sliding window — when full, downloader blocks until reader consumes.
+        // MemoryBufferSizeMB: byte-level cap on in-flight compressed data.
+        internal const int DefaultParallelDownloads = 16;
+        internal const int DefaultPrefetchCount = 16;
+        internal const int DefaultMemoryBufferSizeMB = 400;
+        internal const int DefaultLinkPrefetchWindowSize = 128;
         internal const int DefaultTimeoutMinutes = 5;
         internal const int DefaultMaxRetries = 0; // 0 = no limit (use timeout only)
         internal const int DefaultRetryTimeoutSeconds = 300; // 5 minutes
@@ -45,10 +51,18 @@ internal sealed class CloudFetchConfiguration
         public int ParallelDownloads { get; set; } = DefaultParallelDownloads;
 
         /// <summary>
-        /// Number of files to prefetch ahead of the reader.
+        /// Number of files to prefetch ahead of the reader (controls download window / result queue size).
         /// </summary>
         public int PrefetchCount { get; set; } = DefaultPrefetchCount;
 
+        /// <summary>
+        /// Size of the link prefetch window — how many chunk links to fetch ahead of downloads.
+        /// The fetcher runs on a background task and can fetch links far ahead while downloads
+        /// are paced by memory and download slots. This matches JDBC's LinkPrefetchWindow=128.
+        /// Links are lightweight metadata (URL + offsets), so a large window uses minimal memory.
+        /// </summary>
+        public int LinkPrefetchWindowSize { get; set; } = DefaultLinkPrefetchWindowSize;
+
         /// <summary>
         /// Memory buffer size limit in MB for buffered files.
         /// </summary>
@@ -151,7 +165,8 @@ public static CloudFetchConfiguration FromProperties(
                 RetryTimeoutSeconds = PropertyHelper.GetPositiveIntPropertyWithValidation(properties, DatabricksParameters.CloudFetchRetryTimeoutSeconds, DefaultRetryTimeoutSeconds),
                 RetryDelayMs = PropertyHelper.GetPositiveIntPropertyWithValidation(properties, DatabricksParameters.CloudFetchRetryDelayMs, DefaultRetryDelayMs),
                 MaxUrlRefreshAttempts = PropertyHelper.GetPositiveIntPropertyWithValidation(properties, DatabricksParameters.CloudFetchMaxUrlRefreshAttempts, DefaultMaxUrlRefreshAttempts),
-                UrlExpirationBufferSeconds = PropertyHelper.GetPositiveIntPropertyWithValidation(properties, DatabricksParameters.CloudFetchUrlExpirationBufferSeconds, DefaultUrlExpirationBufferSeconds)
+                UrlExpirationBufferSeconds = PropertyHelper.GetPositiveIntPropertyWithValidation(properties, DatabricksParameters.CloudFetchUrlExpirationBufferSeconds, DefaultUrlExpirationBufferSeconds),
+                LinkPrefetchWindowSize = PropertyHelper.GetPositiveIntPropertyWithValidation(properties, DatabricksParameters.CloudFetchLinkPrefetchWindowSize, DefaultLinkPrefetchWindowSize)
             };
 
             return config;