Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
20 commits
Select commit Hold shift + click to select a range
b4e3218
Arrow row-by-row processing: ColumnDispatcher, RecordBatchRowProcessor
arhamchopra Apr 27, 2026
63565bc
Remove old C++ reader classes and file wrappers
arhamchopra Apr 27, 2026
364b392
Rewrite ParquetInputAdapterManager for RecordBatch input
arhamchopra Apr 27, 2026
efd9217
Python adapter: RecordBatch stream factories and C Stream Interface
arhamchopra Apr 27, 2026
468bd2a
Tests for parquet input adapter rewrite
arhamchopra Apr 27, 2026
2ac4688
Qualify arrow:: as ::arrow:: in writer headers to avoid namespace amb…
arhamchopra Apr 28, 2026
f89e359
Fix Arrow 21 compatibility: use out-parameter FileReader::Make
arhamchopra Apr 29, 2026
bb19d88
Add comprehensive test coverage for parquet input adapter
arhamchopra Apr 29, 2026
366f76f
Remove dead m_rbSources member from DictBasketReaderRecord, and format
arhamchopra Apr 29, 2026
483950d
Optimize hot path: InlineReader for zero-overhead value extraction
arhamchopra Apr 29, 2026
ff982c7
Add comprehensive tests for all Arrow types and edge cases
arhamchopra Apr 30, 2026
d039d0d
Address review: remove dead code, hoist loop invariant, deduplicate s…
arhamchopra May 13, 2026
c3332f6
Address review: private SourceEntry, const fields, deduplicate batch …
arhamchopra May 13, 2026
c72a9d8
Address review: static lambda, remove tz member, remove redundant ove…
arhamchopra May 13, 2026
662da22
perf: add prefetch and parallel column decode for parquet reading
arhamchopra May 18, 2026
9eeb2f7
Address comments
arhamchopra Jun 8, 2026
1873f03
Address review: fix bugs, remove dead code, clean up test scaffolding
arhamchopra Jun 8, 2026
b0855cc
Clean up tests
arhamchopra Jun 8, 2026
14b8fbc
Replace PrefetchingRecordBatchReader with async generator API
arhamchopra Jun 9, 2026
66decbd
Fix allow_missing_files not honored in split-columns native path
arhamchopra Jun 9, 2026
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
6 changes: 6 additions & 0 deletions CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -74,6 +74,12 @@ option(CSP_ENABLE_UBSAN "Build with undefined behavior sanitizer" OFF)
# Optional adapters; each one is built unless explicitly switched off.
option(CSP_BUILD_KAFKA_ADAPTER "Build kafka adapter" ON)
option(CSP_BUILD_ARROW_ADAPTER "Build arrow adapter" ON)
option(CSP_BUILD_PARQUET_ADAPTER "Build parquet adapter" ON)

# The parquet adapter depends on the arrow adapter, so requesting parquet
# while arrow is disabled turns the arrow adapter back on in the cache.
if(CSP_BUILD_PARQUET_ADAPTER)
  if(NOT CSP_BUILD_ARROW_ADAPTER)
    message(STATUS "Enabling arrow adapter (required by parquet adapter)")
    set(CSP_BUILD_ARROW_ADAPTER ON CACHE BOOL "Build arrow adapter" FORCE)
  endif()
endif()

option(CSP_BUILD_WS_CLIENT_ADAPTER "Build ws client adapter" ON)

# Normalize build type for downstream comparisons
Expand Down
22 changes: 19 additions & 3 deletions cpp/cmake/modules/FindDepsParquetAdapter.cmake
Original file line number Diff line number Diff line change
@@ -1,13 +1,29 @@
# Dependency lookup for the parquet adapter: locates Arrow and Parquet and
# adds their include directories at directory scope.
cmake_minimum_required(VERSION 3.7.2)

# ARROW
# NOTE(review): Arrow is looked up directly here and again through
# DepsArrowAdapter just below; the direct lookup looks redundant — confirm
# whether these three lines are meant to stay.
find_package(Arrow REQUIRED)
include_directories(${ARROW_INCLUDE_DIR})
# ARROW (reuse FindDepsArrowAdapter for find_package + link target resolution)
find_package(DepsArrowAdapter REQUIRED)

# PARQUET
# REQUIRED makes configuration stop with an error if Parquet is not found.
find_package(Parquet REQUIRED)
include_directories(${PARQUET_INCLUDE_DIR})

# Choose the Parquet library name to link against and store it in
# CSP_PARQUET_LINK_LIBS (intended for target_link_libraries()).
# The choice depends on two inputs: the platform (WIN32 or not) and
# whether CSP_USE_VCPKG is set.
if(WIN32 AND CSP_USE_VCPKG)
  # Windows + vcpkg: static Parquet, which also adds the PARQUET_STATIC
  # compile definition.
  set(CSP_PARQUET_LINK_LIBS Parquet::parquet_static)
  add_compile_definitions(PARQUET_STATIC)
elseif(WIN32)
  # Windows without vcpkg: shared Parquet.
  set(CSP_PARQUET_LINK_LIBS parquet_shared)
elseif(CSP_USE_VCPKG)
  # Non-Windows + vcpkg: static Parquet.
  set(CSP_PARQUET_LINK_LIBS parquet_static)
else()
  # Non-Windows without vcpkg: plain "parquet".
  set(CSP_PARQUET_LINK_LIBS parquet)
endif()

# Other deps
find_package(Thrift REQUIRED)
find_package(Brotli REQUIRED)
Expand Down
Loading
Loading