Skip to content

Instantly share code, notes, and snippets.

@wesm
Created May 18, 2017 13:10
Show Gist options
  • Save wesm/fef0fd1c442bd7789b2fa9665c48cc24 to your computer and use it in GitHub Desktop.
Save wesm/fef0fd1c442bd7789b2fa9665c48cc24 to your computer and use it in GitHub Desktop.
==22942== Invalid write of size 8
==22942== at 0xBAF4362: int parquet::RleDecoder::GetBatchWithDictSpaced<parquet::Int96>(parquet::Vector<parquet::Int96> const&, parquet::Int96*, int, int, unsigned char const*, long) (rle-encoding.h:398)
==22942== by 0xBAF19CC: parquet::DictionaryDecoder<parquet::DataType<(parquet::Type::type)3> >::DecodeSpaced(parquet::Int96*, int, int, unsigned char const*, long) (encoding-internal.h:341)
==22942== by 0xBACB9C3: parquet::TypedColumnReader<parquet::DataType<(parquet::Type::type)3> >::ReadValuesSpaced(long, parquet::Int96*, int, unsigned char*, long) (reader.h:216)
==22942== by 0xBACAFB7: parquet::TypedColumnReader<parquet::DataType<(parquet::Type::type)3> >::ReadBatchSpaced(int, short*, short*, parquet::Int96*, unsigned char*, long, long*, long*, long*) (reader.h:341)
==22942== by 0xBFE0644: arrow::Status parquet::arrow::ColumnReader::Impl::ReadNullableBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(parquet::TypedColumnReader<parquet::DataType<(parquet::Type::type)3> >*, short*, short*, long, long*, long*) (reader.cc:637)
==22942== by 0xBFF5F2C: arrow::Status parquet::arrow::ColumnReader::Impl::TypedReadBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(int, std::shared_ptr<arrow::Array>*) (reader.cc:869)
==22942== by 0xBFE3A5B: parquet::arrow::ColumnReader::Impl::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1139)
==22942== by 0xBFE3DBA: parquet::arrow::ColumnReader::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1164)
==22942== by 0xBFDCCED: parquet::arrow::FileReader::Impl::ReadColumn(int, std::shared_ptr<arrow::Array>*) (reader.cc:303)
==22942== by 0xBFDD6C3: parquet::arrow::FileReader::Impl::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*)::{lambda(int)#1}::operator()(int) const (reader.cc:367)
==22942== by 0xBFDD954: parquet::arrow::FileReader::Impl::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*) (reader.cc:374)
==22942== by 0xBFDE341: parquet::arrow::FileReader::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*) (reader.cc:443)
==22942== Address 0x13ecb17c is 60 bytes inside a block of size 64 alloc'd
==22942== at 0x4C2BB84: memalign (vg_replace_malloc.c:857)
==22942== by 0x4C2BC4C: posix_memalign (vg_replace_malloc.c:1020)
==22942== by 0xB37AF8C: arrow::(anonymous namespace)::AllocateAligned(long, unsigned char**) (memory_pool.cc:49)
==22942== by 0xB37B295: arrow::DefaultMemoryPool::Allocate(long, unsigned char**) (memory_pool.cc:79)
==22942== by 0xB331F62: arrow::PoolBuffer::Reserve(long) (buffer.cc:80)
==22942== by 0xB33206D: arrow::PoolBuffer::Resize(long, bool) (buffer.cc:91)
==22942== by 0xBFE059E: arrow::Status parquet::arrow::ColumnReader::Impl::ReadNullableBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(parquet::TypedColumnReader<parquet::DataType<(parquet::Type::type)3> >*, short*, short*, long, long*, long*) (reader.cc:634)
==22942== by 0xBFF5F2C: arrow::Status parquet::arrow::ColumnReader::Impl::TypedReadBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(int, std::shared_ptr<arrow::Array>*) (reader.cc:869)
==22942== by 0xBFE3A5B: parquet::arrow::ColumnReader::Impl::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1139)
==22942== by 0xBFE3DBA: parquet::arrow::ColumnReader::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1164)
==22942== by 0xBFDCCED: parquet::arrow::FileReader::Impl::ReadColumn(int, std::shared_ptr<arrow::Array>*) (reader.cc:303)
==22942== by 0xBFDD6C3: parquet::arrow::FileReader::Impl::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*)::{lambda(int)#1}::operator()(int) const (reader.cc:367)
==22942==
==22942== Invalid write of size 4
==22942== at 0xBAF4368: int parquet::RleDecoder::GetBatchWithDictSpaced<parquet::Int96>(parquet::Vector<parquet::Int96> const&, parquet::Int96*, int, int, unsigned char const*, long) (rle-encoding.h:398)
==22942== by 0xBAF19CC: parquet::DictionaryDecoder<parquet::DataType<(parquet::Type::type)3> >::DecodeSpaced(parquet::Int96*, int, int, unsigned char const*, long) (encoding-internal.h:341)
==22942== by 0xBACB9C3: parquet::TypedColumnReader<parquet::DataType<(parquet::Type::type)3> >::ReadValuesSpaced(long, parquet::Int96*, int, unsigned char*, long) (reader.h:216)
==22942== by 0xBACAFB7: parquet::TypedColumnReader<parquet::DataType<(parquet::Type::type)3> >::ReadBatchSpaced(int, short*, short*, parquet::Int96*, unsigned char*, long, long*, long*, long*) (reader.h:341)
==22942== by 0xBFE0644: arrow::Status parquet::arrow::ColumnReader::Impl::ReadNullableBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(parquet::TypedColumnReader<parquet::DataType<(parquet::Type::type)3> >*, short*, short*, long, long*, long*) (reader.cc:637)
==22942== by 0xBFF5F2C: arrow::Status parquet::arrow::ColumnReader::Impl::TypedReadBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(int, std::shared_ptr<arrow::Array>*) (reader.cc:869)
==22942== by 0xBFE3A5B: parquet::arrow::ColumnReader::Impl::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1139)
==22942== by 0xBFE3DBA: parquet::arrow::ColumnReader::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1164)
==22942== by 0xBFDCCED: parquet::arrow::FileReader::Impl::ReadColumn(int, std::shared_ptr<arrow::Array>*) (reader.cc:303)
==22942== by 0xBFDD6C3: parquet::arrow::FileReader::Impl::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*)::{lambda(int)#1}::operator()(int) const (reader.cc:367)
==22942== by 0xBFDD954: parquet::arrow::FileReader::Impl::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*) (reader.cc:374)
==22942== by 0xBFDE341: parquet::arrow::FileReader::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*) (reader.cc:443)
==22942== Address 0x13ecb184 is 4 bytes after a block of size 64 alloc'd
==22942== at 0x4C2BB84: memalign (vg_replace_malloc.c:857)
==22942== by 0x4C2BC4C: posix_memalign (vg_replace_malloc.c:1020)
==22942== by 0xB37AF8C: arrow::(anonymous namespace)::AllocateAligned(long, unsigned char**) (memory_pool.cc:49)
==22942== by 0xB37B295: arrow::DefaultMemoryPool::Allocate(long, unsigned char**) (memory_pool.cc:79)
==22942== by 0xB331F62: arrow::PoolBuffer::Reserve(long) (buffer.cc:80)
==22942== by 0xB33206D: arrow::PoolBuffer::Resize(long, bool) (buffer.cc:91)
==22942== by 0xBFE059E: arrow::Status parquet::arrow::ColumnReader::Impl::ReadNullableBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(parquet::TypedColumnReader<parquet::DataType<(parquet::Type::type)3> >*, short*, short*, long, long*, long*) (reader.cc:634)
==22942== by 0xBFF5F2C: arrow::Status parquet::arrow::ColumnReader::Impl::TypedReadBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(int, std::shared_ptr<arrow::Array>*) (reader.cc:869)
==22942== by 0xBFE3A5B: parquet::arrow::ColumnReader::Impl::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1139)
==22942== by 0xBFE3DBA: parquet::arrow::ColumnReader::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1164)
==22942== by 0xBFDCCED: parquet::arrow::FileReader::Impl::ReadColumn(int, std::shared_ptr<arrow::Array>*) (reader.cc:303)
==22942== by 0xBFDD6C3: parquet::arrow::FileReader::Impl::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*)::{lambda(int)#1}::operator()(int) const (reader.cc:367)
==22942==
==22942== Invalid read of size 4
==22942== at 0xBFDC7ED: parquet::arrow::impala_timestamp_to_nanoseconds(parquet::Int96 const&) (reader.cc:55)
==22942== by 0xBFE0710: arrow::Status parquet::arrow::ColumnReader::Impl::ReadNullableBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(parquet::TypedColumnReader<parquet::DataType<(parquet::Type::type)3> >*, short*, short*, long, long*, long*) (reader.cc:644)
==22942== by 0xBFF5F2C: arrow::Status parquet::arrow::ColumnReader::Impl::TypedReadBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(int, std::shared_ptr<arrow::Array>*) (reader.cc:869)
==22942== by 0xBFE3A5B: parquet::arrow::ColumnReader::Impl::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1139)
==22942== by 0xBFE3DBA: parquet::arrow::ColumnReader::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1164)
==22942== by 0xBFDCCED: parquet::arrow::FileReader::Impl::ReadColumn(int, std::shared_ptr<arrow::Array>*) (reader.cc:303)
==22942== by 0xBFDD6C3: parquet::arrow::FileReader::Impl::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*)::{lambda(int)#1}::operator()(int) const (reader.cc:367)
==22942== by 0xBFDD954: parquet::arrow::FileReader::Impl::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*) (reader.cc:374)
==22942== by 0xBFDE341: parquet::arrow::FileReader::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*) (reader.cc:443)
==22942== by 0x3BA9B673: __pyx_pw_7pyarrow_8_parquet_13ParquetReader_9read_all(_object*, _object*, _object*) (in /home/wesm/code/arrow/python/pyarrow/_parquet.cpython-35m-x86_64-linux-gnu.so)
==22942== by 0x4EF11E0: PyCFunction_Call (methodobject.c:98)
==22942== by 0x4F773EA: do_call (ceval.c:4884)
==22942== by 0x4F773EA: call_function (ceval.c:4683)
==22942== by 0x4F773EA: PyEval_EvalFrameEx (ceval.c:3185)
==22942== Address 0x13ecb184 is 4 bytes after a block of size 64 alloc'd
==22942== at 0x4C2BB84: memalign (vg_replace_malloc.c:857)
==22942== by 0x4C2BC4C: posix_memalign (vg_replace_malloc.c:1020)
==22942== by 0xB37AF8C: arrow::(anonymous namespace)::AllocateAligned(long, unsigned char**) (memory_pool.cc:49)
==22942== by 0xB37B295: arrow::DefaultMemoryPool::Allocate(long, unsigned char**) (memory_pool.cc:79)
==22942== by 0xB331F62: arrow::PoolBuffer::Reserve(long) (buffer.cc:80)
==22942== by 0xB33206D: arrow::PoolBuffer::Resize(long, bool) (buffer.cc:91)
==22942== by 0xBFE059E: arrow::Status parquet::arrow::ColumnReader::Impl::ReadNullableBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(parquet::TypedColumnReader<parquet::DataType<(parquet::Type::type)3> >*, short*, short*, long, long*, long*) (reader.cc:634)
==22942== by 0xBFF5F2C: arrow::Status parquet::arrow::ColumnReader::Impl::TypedReadBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(int, std::shared_ptr<arrow::Array>*) (reader.cc:869)
==22942== by 0xBFE3A5B: parquet::arrow::ColumnReader::Impl::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1139)
==22942== by 0xBFE3DBA: parquet::arrow::ColumnReader::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1164)
==22942== by 0xBFDCCED: parquet::arrow::FileReader::Impl::ReadColumn(int, std::shared_ptr<arrow::Array>*) (reader.cc:303)
==22942== by 0xBFDD6C3: parquet::arrow::FileReader::Impl::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*)::{lambda(int)#1}::operator()(int) const (reader.cc:367)
==22942==
==22942== Invalid read of size 8
==22942== at 0xBFDC800: parquet::arrow::impala_timestamp_to_nanoseconds(parquet::Int96 const&) (reader.cc:56)
==22942== by 0xBFE0710: arrow::Status parquet::arrow::ColumnReader::Impl::ReadNullableBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(parquet::TypedColumnReader<parquet::DataType<(parquet::Type::type)3> >*, short*, short*, long, long*, long*) (reader.cc:644)
==22942== by 0xBFF5F2C: arrow::Status parquet::arrow::ColumnReader::Impl::TypedReadBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(int, std::shared_ptr<arrow::Array>*) (reader.cc:869)
==22942== by 0xBFE3A5B: parquet::arrow::ColumnReader::Impl::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1139)
==22942== by 0xBFE3DBA: parquet::arrow::ColumnReader::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1164)
==22942== by 0xBFDCCED: parquet::arrow::FileReader::Impl::ReadColumn(int, std::shared_ptr<arrow::Array>*) (reader.cc:303)
==22942== by 0xBFDD6C3: parquet::arrow::FileReader::Impl::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*)::{lambda(int)#1}::operator()(int) const (reader.cc:367)
==22942== by 0xBFDD954: parquet::arrow::FileReader::Impl::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*) (reader.cc:374)
==22942== by 0xBFDE341: parquet::arrow::FileReader::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*) (reader.cc:443)
==22942== by 0x3BA9B673: __pyx_pw_7pyarrow_8_parquet_13ParquetReader_9read_all(_object*, _object*, _object*) (in /home/wesm/code/arrow/python/pyarrow/_parquet.cpython-35m-x86_64-linux-gnu.so)
==22942== by 0x4EF11E0: PyCFunction_Call (methodobject.c:98)
==22942== by 0x4F773EA: do_call (ceval.c:4884)
==22942== by 0x4F773EA: call_function (ceval.c:4683)
==22942== by 0x4F773EA: PyEval_EvalFrameEx (ceval.c:3185)
==22942== Address 0x13ecb17c is 60 bytes inside a block of size 64 alloc'd
==22942== at 0x4C2BB84: memalign (vg_replace_malloc.c:857)
==22942== by 0x4C2BC4C: posix_memalign (vg_replace_malloc.c:1020)
==22942== by 0xB37AF8C: arrow::(anonymous namespace)::AllocateAligned(long, unsigned char**) (memory_pool.cc:49)
==22942== by 0xB37B295: arrow::DefaultMemoryPool::Allocate(long, unsigned char**) (memory_pool.cc:79)
==22942== by 0xB331F62: arrow::PoolBuffer::Reserve(long) (buffer.cc:80)
==22942== by 0xB33206D: arrow::PoolBuffer::Resize(long, bool) (buffer.cc:91)
==22942== by 0xBFE059E: arrow::Status parquet::arrow::ColumnReader::Impl::ReadNullableBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(parquet::TypedColumnReader<parquet::DataType<(parquet::Type::type)3> >*, short*, short*, long, long*, long*) (reader.cc:634)
==22942== by 0xBFF5F2C: arrow::Status parquet::arrow::ColumnReader::Impl::TypedReadBatch<arrow::TimestampType, parquet::DataType<(parquet::Type::type)3> >(int, std::shared_ptr<arrow::Array>*) (reader.cc:869)
==22942== by 0xBFE3A5B: parquet::arrow::ColumnReader::Impl::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1139)
==22942== by 0xBFE3DBA: parquet::arrow::ColumnReader::NextBatch(int, std::shared_ptr<arrow::Array>*) (reader.cc:1164)
==22942== by 0xBFDCCED: parquet::arrow::FileReader::Impl::ReadColumn(int, std::shared_ptr<arrow::Array>*) (reader.cc:303)
==22942== by 0xBFDD6C3: parquet::arrow::FileReader::Impl::ReadTable(std::vector<int, std::allocator<int> > const&, std::shared_ptr<arrow::Table>*)::{lambda(int)#1}::operator()(int) const (reader.cc:367)
==22942==
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment