Skip to content

Instantly share code, notes, and snippets.

tf <- tempfile()
table <- Table$create(
some_datetime = as.POSIXct("2001-01-01 12:34:56.789")
)
write_parquet(
table,
tf,
use_deprecated_int96_timestamps = TRUE
└ Testing wheel
=========================================================== test session starts ============================================================
platform linux -- Python 3.12.7, pytest-8.3.3, pluggy-1.5.0 -- /tmp/nanoarrow-0.6.0.UP7Lid/venv/bin/python
cachedir: .pytest_cache
rootdir: /tmp/nanoarrow-0.6.0.UP7Lid/apache-arrow-nanoarrow-0.6.0/python
configfile: pyproject.toml
collected 230 items / 2 skipped
tests/test_array.py::test_array_construct PASSED [ 0%]
tests/test_array.py::test_array_alias_constructor PASSED [ 0%]
(lldb) bt all
* thread #1, queue = 'com.apple.main-thread', stop reason = signal SIGSTOP
* frame #0: 0x000000019213bee8 libsystem_kernel.dylib`__select + 8
frame #1: 0x00000001a9c3cc64 libcurl.4.dylib`Curl_poll + 516
frame #2: 0x00000001a9c3501c libcurl.4.dylib`multi_wait + 640
frame #3: 0x00000001a9c0eda8 libcurl.4.dylib`curl_easy_perform + 268
frame #4: 0x0000000105b7f720 libaws-cpp-sdk-core.dylib`Aws::Http::CurlHttpClient::MakeRequest(std::__1::shared_ptr<Aws::Http::HttpRequest> const&, Aws::Utils::RateLimits::RateLimiterInterface*, Aws::Utils::RateLimits::RateLimiterInterface*) const + 3524
frame #5: 0x0000000105b425a8 libaws-cpp-sdk-core.dylib`std::__1::shared_ptr<Aws::Http::HttpResponse> smithy::components::tracing::TracingUtils::MakeCallWithTiming<std::__1::shared_ptr<Aws::Http::HttpResponse>>(std::__1::function<std::__1::shared_ptr<Aws::Http::HttpResponse> ()>, std::__1::basic_string<char, std::__1::char_traits<char>, std::__1::allocator<char>> const&, smithy::components::tracing
$ cd ~/src/apache/arrow
$ arrow rebase
Current branch main is up to date.
$ cd cpp
$ mkdir build
$ cd build
$ arrow cmake
+ cmake .. -GNinja -DARROW_ACERO=ON -DARROW_COMPUTE=ON -DARROW_CSV=ON -DARROW_DATASET=ON -DARROW_FILESYSTEM=ON -DARROW_FLIGHT=ON -DARROW_JSON=ON -DARROW_PARQUET=ON -DARROW_AZURE=ON -DARROW_S3=ON -DARROW_GCS=ON -DARROW_SUBSTRAIT=ON -DARROW_BUILD_TESTS=ON -DARROW_MIMALLOC=OFF -DARROW_WITH_BROTLI=ON -DARROW_WITH_BZ2=ON -DARROW_WITH_LZ4=ON -DARROW_WITH_SNAPPY=ON -DARROW_WITH_ZLIB=ON -DARROW_WITH_ZSTD=ON -DARROW_INSTALL_NAME_RPATH=OFF -DARROW_EXTRA_ERROR_CONTEXT=ON -DCMAKE_INSTALL_PREFIX=/home/bryce/builds/arrow-x86_64 -DCMAKE_INSTALL_LIBDIR=lib -DCMAKE_BUILD_TYPE=Debug -DCMAKE_EXPORT_COMPILE_COMMANDS=ON
-- Building using CMake version: 3.25.1
-- The C compiler identification is GNU 12.2.0
``` r "repero.R" #> [1] "repero.R" ``` <sup>Created on 2024-09-05 with [reprex v2.1.1](https://reprex.tidyverse.org)</sup>
diff --git forkSrcPrefix/cpp/src/parquet/arrow/reader_writer_benchmark.cc forkDstPrefix/cpp/src/parquet/arrow/reader_writer_benchmark.cc
index 95c4a659297d93f0927a8f36bb25607b15e5a0fa..d450431eae5133daf24066f8d01701cd34af63c9 100644
--- forkSrcPrefix/cpp/src/parquet/arrow/reader_writer_benchmark.cc
+++ forkDstPrefix/cpp/src/parquet/arrow/reader_writer_benchmark.cc
@@ -15,6 +15,8 @@
// specific language governing permissions and limitations
// under the License.
+#include <sys/_types/_int64_t.h>
+#include "arrow/io/file.h"
library(dplyr)
library(readr)
library(rvest)
library(glue)
years <- 1984:2023
get_one <- function(year) {
url <- glue::glue("https://registration.klondikeroadrelay.com/results?year={year}&leg=Any&gender=Any&name=&team_type=Adult+Running+-+Skagway+Start&division=Any&category=Any&commit=Reload")
doc <- rvest::read_html(url)
❯ arrow cmake
+ cmake .. -GNinja -DARROW_ACERO=ON -DARROW_COMPUTE=ON -DARROW_CSV=ON -DARROW_DATASET=ON -DARROW_FILESYSTEM=ON -DARROW_FLIGHT=ON -DARROW_JSON=ON -DARROW_PARQUET=ON -DARROW_AZURE=ON -DARROW_S3=ON -DARROW_GCS=ON -DARROW_SUBSTRAIT=ON -DARROW_BUILD_TESTS=ON -DARROW_MIMALLOC=OFF -DARROW_WITH_BROTLI=ON -DARROW_WITH_BZ2=ON -DARROW_WITH_LZ4=ON -DARROW_WITH_SNAPPY=ON -DARROW_WITH_ZLIB=ON -DARROW_WITH_ZSTD=ON -DARROW_INSTALL_NAME_RPATH=OFF -DARROW_EXTRA_ERROR_CONTEXT=ON -DCMAKE_INSTALL_PREFIX=/Users/bryce/builds/arrow-arm64 -DCMAKE_BUILD_TYPE=Debug -DGTest_SOURCE=BUNDLED -DCMAKE_EXPORT_COMPILE_COMMANDS=ON
-- Building using CMake version: 3.30.2
-- The C compiler identification is AppleClang 15.0.0.15000309
-- The CXX compiler identification is AppleClang 15.0.0.15000309
-- Detecting C compiler ABI info
-- Detecting C compiler ABI info - done
-- Check for working C compiler: /Applications/Xcode.app/Contents/Developer/Toolchains/XcodeDefault.xctoolchain/usr/bin/cc - skipped
-- Detecting C compile features
-

From main:

Benchmark Time CPU Iterations items_per_second
AllocateDeallocate/size:4096/real_time/threads:1 40.6 ns 40.5 ns 17256246 24.6592M/s
AllocateDeallocate/size:4096/real_time/threads:2 37.1 ns 74.3 ns 18816032 26.9313M/s
AllocateDeallocate/size:4096/real_time/threads:4 68.5 ns 274 ns 10096888 14.5911M/s
AllocateDeallocate/size:4096/real_time/threads:8 85.2 ns 682 ns 8969680 11.733M/s
AllocateDeallocate/size:4096/real_time/threads:16 64.1 ns 1022 ns 10904176 15.5995M/s
AllocateDeallocate/size:4096/real_time/threads:32 57.1 ns 1033 ns 13711680 17.5085M/s
require 'net/http'
require "arrow"
url = URI('http://localhost:9292')
Net::HTTP.start("localhost", 9292) do |http|
req = Net::HTTP::Get.new(url)
http.request(req) do |res|
res.read_body do |chunk|
Gio::RubyInputStream.open(chunk)