You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@arrow.apache.org by we...@apache.org on 2018/09/08 14:27:43 UTC
[arrow] branch master updated (17999a8 -> 9b4cd9c)
This is an automated email from the ASF dual-hosted git repository.
wesm pushed a change to branch master
in repository https://gitbox.apache.org/repos/asf/arrow.git.
omit 17999a8 [R] Add link to R folder in README.md
omit 03e9bb9 ARROW-3171: [Java] Enable checkstyle for line length and indentation
omit f3247e8 ARROW-3127: [Doc] Add Tutorial for Sending Tensor from C++ to Python
omit e7b269d ARROW-1325: [R] Initial R package that builds against the arrow C++ library
omit fbba3be ARROW-3061: [JAVA] Fix BufferAllocator#getHeadroom (#2434)
omit 4007aff ARROW-2948: [Packaging] Generate changelog with crossbow
omit 5d4d6ba ARROW-3177: [Rust] Update expected error messages for tests that 'should panic'
omit c1f528c ARROW-2974: [Python] Replace usages of "source activate" with "conda activate" in CI scripts
omit e0c07f4 ARROW-3172: [Rust] Update documentation for datatypes.rs
omit 21ef18b ARROW-3160: [Python] Improve pathlib.Path support in parquet and filesystem modules
omit 3eaf46e ARROW-3090: [Rust] Accompany error messages with assertions
omit ad7e6c3 ARROW-2989: [C++/Python] Remove API deprecations in 0.10
omit ea728c7 ARROW-3167: [CI] Limit clcache cache size
omit f209645 ARROW-3163: [Python] Add missing Cython dependency to source package
omit 7483331 ARROW-3158: [C++] Handle float truncation during casting
omit a712165 ARROW-1949: [Python/C++] Add option to Array.from_pandas and pyarrow.array to perform unsafe casts
omit 20c0405 ARROW-3153: [Packaging] Fix broken nightly package builds introduced with recent cmake changes and orc tests
omit c282a14 ARROW-3115: [JAVA] Style checks - fix import ordering
omit 84fcb82 ARROW-3142: [C++] Fetch all libs from toolchain environment
omit 927bd34 ARROW-3018: [Plasma][FOLLOWUP] Update plasma documentation
omit 5829f10 ARROW-3147: [C++] Improve MSVC version detection
omit b79b869 ARROW-3148: [C++] Remove needless U+00A0 NO-BREAK SPACE (#2500)
omit 658087e ARROW-3140: [Plasma] Fix Plasma build with GPU support
omit 44c2fa7 [Python] [DOC] Fix a typo in doc/source/ipc.rst
omit 56b50f6 ARROW-3119: [Packaging] Nightly packaging script fails
omit ef21ec9 ARROW-3130: [Go] add initial support for Go modules
omit 0311f63 ARROW-2734: [Python] Cython api example doesn't work by default on macOS
omit 3e61e63 ARROW-3129: [Packaging] Stop to use deprecated BuildRoot and Group in .spec
omit 498215f ARROW-3049: [C++/Python] Fix reading empty ORC file
omit d20147e ARROW-3125: [Python] Update ASV instructions
omit f841b90 ARROW-3017: [C++] Don't throw exception in arrow/util/thread-pool.h
omit a5c8a02 ARROW-3117: [GLib] Add garrow_chunked_array_to_string()
omit 628b74b ARROW-3116: [Plasma] Add "ls" to object store
omit b73aa20 ARROW-1563: [C++][FOLLOWUP] Use std::function instead of declaring auxiliary helper classes
omit 5a01af8 ARROW-3114: [Website] Add information about user@ mailing list to website / Community page
omit 588c1fa ARROW-1563: [C++] Implement logical unary and binary kernels for boolean arrays
omit 06e7a1b ARROW-3018: [Plasma] Remove Mersenne twister
omit 65a391a ARROW-3111: [Java] Adding logback config file to allow running tests with different log level
omit 6cf8ea7 ARROW-1661: [Python] Build Python 3.7 in manylinux container
omit fda4b3d ARROW-3105: [Plasma] Improve flushing error message
omit f3542c2 ARROW-2705: [JS] CombinationPredicates should take list of predicates
omit 23045d2 ARROW-2965: [Python] Guard against overflow when serializing Numpy uint64 scalar
omit 12a5755 ARROW-3110: [C++] Fix warnings with gcc 7.3.0
omit 4969da7 ARROW-3109: [Python] Add Python 3.7 virtualenvs to manylinux1 container
omit 8602509 ARROW-3099: [C++] Add benchmark for number parsing
omit 47f831b ARROW-3106: [Website] Update committers and PMC roster on website
omit 9f04fc2 ARROW-3100: [GLib] Follow Homebrew change that lua splits luarocks
omit 53e7594 ARROW-3095: [Plasma] Move plasma store
omit 27f990a ARROW-3098: [C++/Python] Allow seeking at end of BufferReader and FixedSizeBufferWriter
omit e8e82d0 ARROW-3094: [Python] Easier construction of schemas and struct types
omit dbf531b ARROW-3050: [C++] Adopt HiveServer2 client codebase from cloudera/hs2client. Add Thrift to thirdparty toolchain
omit 94e8196 ARROW-3088: [Rust] Use internal `Result<T>` type instead of `Result<T, ArrowError>`
omit a43e670 ARROW-3083: [CI] Use higher clone depth to pick up tags [skip appveyor]
omit c453a7a ARROW-1968: [C++/Python] Add basic unit tests for ORC reader
omit 349e6b0 ARROW-2971: [Python] Give some modules in arrow/python more descriptive names
omit da73971 ARROW-3053: [Python] Add unit test for strided object conversion that was failing in 0.9.0
omit 8db4e10 ARROW-3060: [C++] Factor out string-to-X conversion routines
omit 16bbec8 ARROW-3068: [Packaging] Bump version to 0.11.0-SNAPSHOT
omit c82dfcd ARROW-3067: [Packaging] Support dev/rc/release .deb/.rpm builds
omit 1209a80 ARROW-2583: [Rust] Buffer should be typeless
omit 170dc75 ARROW-1799: [Plasma C++] Make unittest does not create plasma store executable
omit 9428b86 ARROW-3064: [C++] Add option to ADD_ARROW_TEST to indicate additional dependencies for particular unit test executables
omit 719c954 ARROW-3059: [C++] Remove namespace arrow::test
omit 51410bc ARROW-3062: [Python] Fix python package finder to also work in Python 2.7
omit f62e07a ARROW-2687: [JS] Example usage in README is outdated
omit 3214e99 ARROW-2925: [JS] Documentation failing in docker container
omit 3edfd7c ARROW-3057: [INTEGRATION] Fix spark and hdfs dockerfiles
omit 8c42737 ARROW-3035 [Rust] Examples in README.md do not run
omit 08fa38b ARROW-3037: [Go] implement Null array
omit 1810db2 ARROW-3036: [Go] implement array.NewSlice
omit 72e4470 ARROW-3031: [Go] streamline Release of Arrays and Builders
omit ef4622b ARROW-3044: [Python] Remove all occurrences of cython's legacy property definition syntax
omit b99d8f3 ARROW-3045: [Python] Remove nullcheck from ipc Message and MessageReader
omit 7c93d0a ARROW-3034: [Packaging] Resolve symbolic link in tar.gz
omit f708c63 ARROW-3043: [C++] pthread doesn't exist on MinGW
omit 7031a86 ARROW-3047: [C++/Python] Better build instructions with ORC
omit affd6d7 ARROW-2952: [C++] Dockerized include-what-you-use
omit 21c3a18 ARROW-3042: [Go] add godoc badge to README
omit 2dfb01f ARROW-3022: [Go] add support for Struct arrays
omit ed3306b ARROW-3046: [GLib] Use rubyish method
omit baff6d8 ARROW-2979: [GLib] Add operator functions in GArrowDecimal128
omit b5a97cb ARROW-2998: [C++] Add unique_ptr versions of Allocate[Resizable]Buffer
omit 0c38a21 ARROW-3029: [Python] Generate version file when building
omit 78a4d65 ARROW-2814: [Python] Unify conversion paths for sequences of Python objects
omit aff1dca ARROW-3015: [Python] Fix typo in uint8() docstring
omit 216f3e4 ARROW-3028: [Python] Do less work to test Python documentation build
omit 699b0d2 ARROW-3000: [C++] Add option to label test groups then only build those unit tests
omit 18edb97 ARROW-3012: [Python] Fix setuptools_scm usage
omit 6e5bfe2 ARROW-3026: [Python] [Plasma] Only run Plasma unit tests with valgrind under Python 3.6
omit 2359de4 ARROW-3027: [Ruby] Stop "git tag" by "rake release"
omit 89120f0 ARROW-3023: [C++] Add gold linker enabling logic from Apache Kudu
omit 7b611f7 [C++] Fix a typo in `FindClangTools.cmake`. (#2404)
omit 67aae05 ARROW-3021: [Go] add support for List arrays
omit 9b24c3e ARROW-3024: [C++] Remove mutex in MemoryPool implementations
omit 4660833 ARROW-2975: [Plasma] Fix TensorFlow operator compilation with pip package
omit 5c97cd6 ARROW-2994: [Python] Only include Python and NumPy include directories for libarrow_python targets
omit e9c52f2 ARROW-2986: [C++] Use /EHsc flag for exception handling on MSVC, disable C4772 compiler warning in arrow/util/logging.h
omit 479c011 ARROW-2950: [C++] Clean up util/bit-util.h
omit c114783 ARROW-3019: [Packaging] Use Bundler to verify Arrow GLib
omit 0cef55a ARROW-2976: [Python] Fix pyarrow.get_library_dirs
omit d247c5b ARROW-3002: [Python] Hash more parts of pyarrow.Field
omit 5fda431 ARROW-3010: [GLib] Update README to use Bundler
omit 91ffc00 ARROW-3009: [Python] Fix pyarrow ORC reader
omit 25cc0d7 ARROW-3006: [GLib] Fix a bug that .gir/.typelib for GPU aren't installed
omit 1ad11fd ARROW-3008: [Packaging] Verify GPU related modules if available
omit 568f1cb ARROW-3011: [CI] Remove Slack notification
omit 29c4f76 ARROW-3007: [Packaging] Remove needless dependencies
omit e4f2713 ARROW-2992: [Python] Fix Parquet benchmark
omit 9f0a63d ARROW-3005: [Release] Update website, draft simple release blog post for 0.10.0
omit b6e5653 ARROW-2999: [Python] Disable ASV runs in Travis CI for now
omit bfe5eb3 ARROW-2992: [CI] Remove some AppVeyor build configurations
omit 632b8ce ARROW-3003: [Doc] Enable Java doc generation
omit 6a5d6c9 ARROW-2220: Only suggest default fix version that is a mainline release in merge tool
omit 7bead55 ARROW-3001: [Packaging] Don't modify PATH during rust release verification
omit a51d81e ARROW-1491: [C++] Add casting from strings to numbers and booleans
omit 34d383b ARROW-2996: [C++] Fix typo in cpp/.clang-tidy
omit edfbf84 ARROW-2964: [Go] wire all primitive arrays into array.MakeFromArray
omit 551e9ce ARROW-2813: [CI] [Followup] Disable gcov output in Travis-CI logs
omit 71145cd ARROW-2988: Improve Windows release verification script to be more automated
omit d3c9c1d ARROW-2061: [C++] Make tests a bit faster with Valgrind
omit e10f2b3 ARROW-2815: [CI] Skip Java tests and style checks on C++ job [skip appveyor]
omit ea9157a ARROW-2982: Ensure release verification script works with wget < 1.16, build ORC in C++ libraries
omit 91eab98 ARROW-2951: [CI] Don't skip AppVeyor build on format-only changes
omit 00aed05 ARROW-2990: [GLib] Support building with rpath-ed Arrow C++ on macOS
omit 072fa77 ARROW-2985: [Ruby] Add support for verifying RC
omit de50744 ARROW-2869: [Python] Add documentation for Array.to_numpy
omit 7c953a0 ARROW-2977: [Packaging] Release verification script should check rust too
omit 1b2a42e ARROW-2978: [Rust] Change argument to rust fmt to fix build
omit 495bf36 ARROW-2480: [C++] Enable casting the value of a decimal to int32_t or int64_t
omit 0c29673 ARROW-2962: [Packaging] Bintray descriptor files are no longer needed
omit ef933a6 ARROW-2666: [Python] Add __array__ method to Array, ChunkedArray, Column
omit 0f5fb20 ARROW-2813: [CI] Mute uninformative lcov warnings
omit 07f142d [maven-release-plugin] prepare release apache-arrow-0.10.0
omit d38bc66 [Release] Update .deb/.rpm changelogs for 0.10.0
omit 446dd45 [Release] Update CHANGELOG.md for 0.10.0
omit 7afa4af ARROW-2963: [C++] Make thread pool fork-safe
omit d48dce2 ARROW-2953: [Plasma] Reduce plasma memory usage
omit cf79192 ARROW-2911: [Python] Parquet binary statistics that end in '\0' truncate last byte
omit 567e33b ARROW-2960: [Packaging] Fix verify-release-candidate for binary packages and fix release cutting script for lib64 cmake issue
omit 0fc224b ARROW-2930: [C++] migrated MacOS specific code for shared library target
omit 3b24bc2 ARROW-2954: [Plasma] Reduce plasma store memory usage
omit f0cbfc3 ARROW-2955: Fix typo in pyarrow's HDFS API result
omit beefaca ARROW-2949: [CI] Add retry logic when downloading miniconda to reduce flakiness
omit f61d739 ARROW-2944: [Format] Synchronize some metadata changes to columnar format Markdown documents
omit c7175c4 ARROW-2943: [C++] Implement BufferedOutputStream::Flush
omit 29408fd ARROW-2946: [Packaging] Stop to use $PWD
omit f0de121 ARROW-2947: [Packaging] Remove Ubuntu Artful
omit 8c964a7 ARROW-2945: [Packaging] Update argument check
omit 4c0d49f ARROW-2875: [Packaging] Don't attempt to download arrow archive in linux builds
omit 300d914 ARROW-2935: [Packaging] Add verify_binary_artifacts function to verify-release-candidate.sh
omit 26affd7 ARROW-2940: [Python] Fix OSError when trying to load libcaffe2.so in pytorch 0.3.0
omit 734828d ARROW-2937: [Java] Followup to ARROW-2704. Make MessageReader classes immutable and clarify docs
omit 2422d9c ARROW-2660: [Python] Experimental zero-copy pickling
omit 161d1f0 ARROW-2926: [Python] Do not attempt to write tables with invalid schemas in ParquetWriter.write_table
omit 7ffb6c5 ARROW-2934: [Packaging] Add checksums creation to sign subcommand
omit cd162f5 ARROW-2704: [Java] Change MessageReader API to improve custom message handling for streams
omit bbf2e0f ARROW-2929: [C++] ARROW-2826 Breaks parquet-cpp 1.4.0 builds
omit b56d269 ARROW-2700: [Python] Add simple examples to Array.cast docstring
omit 0707b16 ARROW-2927: [Packaging] AppVeyor wheel task is failing on initial checkout
omit c6e33d8 ARROW-2924: [Java] mvn release fails when an older maven javadoc plugin is installed
omit 432dd93 ARROW-2923: [DOC] Adding Apache Spark integration test instructions
omit a18f362 ARROW-2922: [Release] Make python command name customizable
omit 537e7f7 ARROW-2920: [Python] Fix pytorch segfault
omit 4ba2d19 ARROW-2921: [Release] Update .deb/.rpm changelogs in preparation
omit 49ccf6a ARROW-2760: [Python] Remove legacy property definition syntax from parquet module and test them
omit 76033f4 ARROW-2918: [C++] Improve formatting of Struct pretty prints
omit fdc8e6a ARROW-2917: [Python] Use detach() to avoid PyTorch gradient errors
omit 47e462f ARROW-2915: [Packaging] Remove artifact form ubuntu-trusty build
omit 8e6af29 ARROW-2914: [Integration] Add WindowPandasUDFTests to Spark integration script
omit 16bbdd4 ARROW-2777: [JS] Friendlier onboarding readme
omit 5033f6e ARROW-2826: [C++] Remove ArrayBuilder::Init method, clean up Resize, remove PoolBuffer from public API
omit 3642e81 ARROW-2881: [Website] Add community tab to header, add link and callout to dev wiki
omit f019601 ARROW-2908: [Rust] Update version to 0.10.0
omit 2657f9d ARROW-2701: [C++] Make MemoryMappedFile resizable redux
omit 752d20c ARROW-2907: [GitHub] Improve the first paragraph of "How to contribute patches"
omit 9b85118 ARROW-2852: [Rust] Make Array sync and send
omit 6d0747a ARROW-2906: [Website] Remove the link to slack channel
omit a8a48c2 ARROW-2901: [Java] Build is failing on Java9
omit 4bed3bc ARROW-2864: [Plasma] Add deletion cache to delete objects later when they are not in use.
omit 0269203 ARROW-2756: [Python] Remove redundant imports and minor fixes in parquet tests
omit 2a0128d ARROW-2859: [Python] Accept buffer-like objects as sources in open_file, open_stream APIs
omit 078b806 ARROW-2656: [Python] Improve creation time of ParquetManifest for partitioned datasets using thread pool
omit aaf8d5d ARROW-2575: [Python] Exclude hidden files starting with . in ParquetManifest
omit b0ac721 ARROW-2902: [Python] Clean up after build artifacts created by root docker user in HDFS integration test
omit 566e398 ARROW-2586: [C++] Changing the type of ListBuilder's and StructBuilder's children from unique_ptr to shared_ptr so that it can support deserialization from Parquet to Arrow with arbitrary nesting
omit eaa6053 ARROW-2300: [C++/Python] Integration test for HDFS
omit 491114b ARROW-2744: [C++] Avoid creating list arrays with a null values buffer
omit a495885 ARROW-2514: [Python] Speed up inferring nested Numpy array
omit c8728de ARROW-2897: [Packaging] Organize supported Ubuntu versions
omit 141b2c3 ARROW-2711: [Python] Fix inference from Pandas column with first empty list
omit 0ecf88d ARROW-2891: [Python] Preserve schema in write_to_dataset
omit 13c103a ARROW-2876: [Packaging] Replace ssh-URLs with https://
omit 355ff08 ARROW-2816: [Python] Make NativeFile BufferedIOBase-compliant
omit d42a7d7 ARROW-2895: [CI] Add missing Ruby dependency on C++
omit 26cf346 ARROW-2896: [GLib] Add missing exports
omit a8ec080 ARROW-2894: [Glib] Adjust tests to format refactor
omit 0b838f9 ARROW-2845: [Packaging] Upload additional debian artifacts
omit 3c10ed2 ARROW-2884: [Packaging] Support RC
omit 2ff8708 ARROW-2878: [Packaging] README.md does not mention setting GitHub API token in user's crossbow repo settings
omit 0172169 ARROW-2886: [Release] Remove an unused variable
omit 73aee8c ARROW-889: [Python/C++] Unify PrettyPrints between Python and C++
omit 4b74592 ARROW-2877: [Packaging] crossbow submit results in duplicate Travis CI build
omit 89d92dd ARROW-2890: [Plasma] Make python client release method private
omit 87c976a ARROW-2855: [C++] Blog post that outlines the benefits of using jemalloc
omit 35c541a ARROW-2883: [C++] Fix Clang warnings in code built with -DARROW_GPU=ON
omit 7d2fbeb ARROW-2822: [C++] Remove the unneeded const qualifier and clarify the comments
omit ec9b72a ARROW-1715: [Python] Implement pickling for Column, ChunkedArray, RecordBatch, Table
omit aedba2c ARROW-2822: [C++] Zero padding bytes in PoolBuffer
omit f8cd36a ARROW-2326: [Python] Use @loader_path/ as rpath instead of @loader_path when bundling C++ libraries in wheels on macOS
omit 35ef303 ARROW-2810: [Plasma] Remove flatbuffers from public API
omit 277365a [Packaging] Make OSX wheel build verbose
omit 401c8df ARROW-2874: [Packaging] Pass job prefix when putting on Queue
omit 8443759 ARROW-2871: [Python] Raise when calling to_numpy() on boolean array
omit 31a9d38 ARROW-2868: [Packaging] Fix Apache Arrow ORC GLib related problems
omit 4ba8769 ARROW-2872: [Python] Add tensorflow mark to opt-in to TF-related unit tests
omit 5063b33 ARROW-2690: [Plasma] Use uniform function names in public APIs in Plasma. Add namespace around Flatbuffers
omit 3d5b4d8 ARROW-2847: [Packaging] Fix artifact name matching for conda forge packages
omit 8d8645c ARROW-564: [Python] Add Array.to_numpy()
omit faf16be ARROW-2787: [Python] Fix Cython usage instructions
omit 3419058 ARROW-2806: [C++/Python] More consistent null/nan handling
omit c49a57d ARROW-2663: [Python] Make dictionary_encode and unique accesible on Column / ChunkedArray
omit cecbcf7 ARROW-1744: [Plasma] Provide TensorFlow operator to transfer Tensors between Plasma and TensorFlow
omit 3fd913e ARROW-2861: [Python] Add note about how to not write DataFrame index to Parquet
omit ebc8dab ARROW-2771: [JS] Add row proxy object accessor
omit 56497ba ARROW-2844: [Packaging] Test OSX wheels after build
omit dea6ced ARROW-2841: [Go] support building in forks
omit d6aa492 ARROW-2850: [C++/Python] Correctly set RPATHs on all binaries
omit 6a2d4e8 ARROW-2846: [Packaging] Update nightly build in crossbow as well as the sample configuration
omit cbb13ea ARROW-2851: [C++] Update RAT excludes for new install file names
omit 4e8165c ARROW-2825: [C++] Add AllocateBuffer / AllocateResizableBuffer variants with default memory pool
omit 59ec2b1 ARROW-2849: [Ruby] Arrow::Table#load supports ORC
omit 82f2843 ARROW-2848: [Packaging] Use lib*10.deb instead of lib*0.deb
omit b4e3017 ARROW-2836: [Packaging] Expand build matrices to multiple tasks
omit 2c90eff ARROW-2829: [GLib] Add GArrowORCFileReader
omit 5ee8ed7 ARROW-2830: [deb] Enable parallel build again
omit fa4f2aa ARROW-2838: [Python] Speed up PandasObjectIsNull
omit e147057 ARROW-2834: [GLib] Remove "enable_" prefix from Meson options
omit e366604 ARROW-2824: [GLib] Add garrow_decimal128_array_get_value()
omit 35e85b8 ARROW-2820: [Python] Check that array lengths in RecordBatch.from_arrays are all the same
omit 7a413fe ARROW-2827: [C++] Stop to use -jN in sub make
omit 113430a ARROW-2383: [deb] Use system Protocol Buffers
omit bce0ca4 [Packaging] Fix fallback value code in Ruby
omit bd1c332 ARROW-2724: [Packaging] Determine whether all the expected artifacts are uploaded
omit a096eb1 ARROW-2821: [C++] Remove redundant memsets in BooleanBuilder
omit d130a00 ARROW-2812: [Ruby] Fix Arrow::Array#[] interface for Arrow::StructArray
omit e515ba3 ARROW-2823: [C++] Search for flatbuffers in <root>/lib64
omit fa08ddf [CI] Add missing quote for omittable variable (#2235)
omit b926574 ARROW-2722: [Python] Sanitize dtype number to handle edge cases
omit 8cfa51a ARROW-2790: [C++] Minor style changes from the review
omit 1a419fe ARROW-2790: [C++] Buffers can contain uninitialized memory
omit ddcb8f5 ARROW-2789: [JS] Add iterator to DataFrame
omit fbfddfd ARROW-1722: [C++] Add linting script to find C++/CLI incompatibilities
omit ae5e4b8 ARROW-2809: [C++] Only print cpplint and clang-format output for failures by default
omit 735e38b ARROW-2784: [C++] MemoryMappedFile::WriteAt allow writing past the end
omit 528cb7d ARROW-1454: [Python] Also match ArrowNotImplementedError in unsupported type conversions from pandas
omit 0933b4f ARROW-2601: [Python] Prevent user from calling *MemoryPool constructors directly
omit d7ad70d ARROW-2802: [Docs] Move all release management instructions to Confluence
omit 836afac ARROW-2634: [Go] Add Go license details to LICENSE.txt
omit 010c874 ARROW-2805: [Python] Use official way to find TensorFlow module
omit 148c05c ARROW-2754: [Python] Change Python setup.py to make release builds by default
omit 9d1432e ARROW-2798: [Plasma] Use hashing function that takes into account all UniqueID bytes
omit d5d39f7 ARROW-2779: [JS] stream reader fixes
omit 0175167 ARROW-2795: [Python] Run TensorFlow import workaround only on Linux platforms
omit 037c156 ARROW-2794: [Plasma] Add the RPC of a list of Delete Objects in Plasma
omit e7aaf7b ARROW-2657: [Python] Import TensorFlow python extension before pyarrow to avoid segfault
omit c8d97fa ARROW-2650: [JS] Implement Unions
omit 782c5a5 ARROW-2773: [Python] corrected partition_cols parameter name
omit 42c2101 ARROW-2780: [Go] Run code coverage analysis
omit 7deb141 ARROW-1954: [Python] Add metadata accessor to pyarrow.Field
omit 18f31e2 ARROW-2782: [Plasma] xfail plasma hugepage test
omit ceae13d ARROW-2344: [Go] Run Go unit tests in Travis CI
omit 35b1f9a [Python] MNT: Switch manylinux1 image back to latest tag (#2204)
omit c9613cc ARROW-2781: [Python] Download boost using curl in manylinux1 image
omit 4b2e52c ARROW-2335: [Go] move README one directory higher
omit 88f6794 ARROW-2763: [Python] Make _metadata file accessible in ParquetDataset
omit c56d881 ARROW-2761: [Python] Add support for set operations in hive partition filtering
omit c9ce215 ARROW-2747: [Python] Fix huge pages Plasma test
omit 6cf5809 ARROW-2755: [Python] Allow using Ninja to build extension
omit cac2c07 ARROW-2749: [GLib] Rename *garrow_decimal128_array_get_value to *garrow_decimal128_array_format_value
omit d38e862 ARROW-2758: [Plasma] Use Scope enum in Plasma
omit 4a20fc7 ARROW-2683: [Python] Resource Warning (Unclosed File) when using pyarrow.parquet.read_table()
omit 32de512 ARROW-2751: [GLib] Add garrow_table_replace_column()
omit 9979729 [Python] Fix typo in ipc.rst
omit 5e6c773 ARROW-2752: [GLib] Document garrow_decimal_data_type_new()
omit 6a70680 ARROW-2753: [GLib] Add garrow_schema_*_field()
omit 66c017e [GLib] Fix a typo
omit 9a9445a ARROW-2748: [GLib] Add garrow_decimal_data_type_get_scale() (and _precision())
omit 8c9890c ARROW-2742: [Python] Allow Table.from_batches to use iterator of record batches
omit 7e6dd60 ARROW-2662: [Python] Add to_pandas to ChunkedArray
omit 98253f3 [C++] Fix typo in README.md
omit 061aa5e [JS] Add NPM shield, add yarn installation (#2124)
omit ae69a78 [JS] Add example to load data via fetch (#2125)
omit c4d1001 ARROW-2740: [Python] Add address property to Buffer
omit c73a88d ARROW-2745: [C++] ORC ExternalProject needs to declare dependency on vendored protobuf
omit 4481b07 ARROW-2608: [Java/Python] Add pyarrow.{Array,Field}.from_jvm / jvm_buffer
omit e757e7e ARROW-2739: [GLib] Use G_DECLARE_DERIVABLE_TYPE
omit 2484278 ARROW-2738: [GLib] Use Brewfile on installation process
omit 27ddd3f ARROW-2741: [Python] pa.array from np.datetime[D] and type=pa.date64 produces invalid results
omit b165c86 ARROW-2727: [Java] Fix POM file issue causing build failure in java/adapters/jdbc
omit ac0e521 ARROW-2725: [Java] make Accountant.AllocationOutcome publicly visible (#2149)
omit 4db8a36 ARROW-2731 Add external Orc capability
omit 58a2366 ARROW-2676: [Packaging] Deploy build artifacts to github releases
omit 6ef9888 ARROW-2733: [GLib] Cast garrow_decimal128 to gint64
omit df327f6 ARROW-2732: [GLib] Update brew packages for macOS
omit 5cd1df6 ARROW-902: [C++] Script for downloading all thirdparty build dependencies and configuration for offline builds
omit 1ab2abc ARROW-2729: [GLib] Add decimal128 array builder
omit 87cb95c ARROW-2716: [Python] Make manylinux1 base image independent of Python patch releases
omit 1442816 ARROW-2400: [C++] Fix Status destructor performance
omit 884474c ARROW-2699: [C++/Python] Add Table method that replaces a column with a new supplied column
omit 97c24d7 ARROW-2726: [C++] Fix the latest Boost version
omit 7c81bd6 ARROW-2723: [C++] Add .pc for arrow orc
omit e17f95d ARROW-1780 - JDBC Adapter to convert Relational Data objects to Arrow Data Format Vector Objects (#1759)
omit a82a027 ARROW-2721: [C++] Fix ORC and Protocol Buffers link error
omit 392fd02 ARROW-2696: [JAVA] enhance AllocationListener with an onFailedAllocation() call (#2133)
omit c15eee7 ARROW-2395: [Python] Fix flake8 warnings outside of pyarrow/ directory. Check in CI
omit d4755e4 ARROW-2677: [Python] Expose Parquet ZSTD compression
omit 2b00b8a ARROW-2488: [C++] Add Boost 1.67 and 1.68 as recognized versions
omit 8d296cc ARROW-2554: [Python] fix timestamp unit detection from python lists
omit df44691 ARROW-2694 - [Python] ArrayValue string conversion returns the representation instead of the converted python object string
omit 53cc09e ARROW-2626: [Python] Add column name to exception message when writing pandas df fails
omit 6b80fa8 ARROW-2693: [Python] pa.chunked_array causes a segmentation fault on empty input
omit 9a76caa ARROW-2692: [Python] Add test for writing dictionary encoded columns to chunked Parquet files
omit 34890cc ARROW-2689: [Python] Remove parameter timestamps_to_ms
omit dc80a76 ARROW-2695: [Python] Prevent calling scalar constructors directly
omit 6df28d3 ARROW-2691: [Rust] Update code formatting with latest Rust stable
omit 1e4f8dd Add Ruby to README.md
omit 8156e25 ARROW-2551: [Plasma] Improve notification logic
omit d5c5f39 [JS] Add note about IPC format to readme (#2122)
omit 3155291 ARROW-2680: [Python] Add documentation about type inference in Table.from_pandas
omit 5b4728b ARROW-2635: [Ruby] Add LICENSE.txt and NOTICE.txt for Apache Arrow Ruby
omit 27b869a ARROW-2649: [C++] Add GenerateBits() function to improve bitmap writing performance
omit f0a8811 ARROW-2682: [CI] Notify in Slack about broken builds
omit dffd193 ARROW-2672: [Python] Build ORC extension in manylinux1 wheels
omit e82a34a ARROW-530: [C++/Python] Provide subpools for better memory allocation …
omit b165e46 ARROW-2675: Fix build error with clang-10 (Apple Clang / LLVM)
omit 0a3bdba ARROW-2287: [Python] chunked array not iterable, not indexable
omit 88fe5d7 ARROW-2678: [GLib] Add more common problems compiling c_glib on OSX
omit b1d1633 ARROW-2661: [Python] Adding the ability to programmatically pass hdfs configration key/value pairs via pyarrow
omit b9b4376 ARROW-2664: [Python] Implement __getitem__ / slicing on Buffer
omit 2fdacde ARROW-2603: [Python] Allow date and datetime subclassing
omit 9aa7c52 ARROW-2640: [JS] Write schema metadata
omit 44bfd0d ARROW-2638: [Python] Prevent calling extension class constructors directly
omit 5eaa3ab ARROW-2655: [C++] Fix compiler warnings with gcc 7
omit 3960db9 ARROW-2668: [C++] Suppress -Wnull-pointer-arithmetic when compiling plasma/malloc.cc on clang
omit 79a2207 ARROW-2430: [Packaging] MVP for branch based packaging automation
omit 0894d97 ARROW-2645: [Java] Refactor ArrowWriter to remove all ArrowFileWriter specifc logic
omit 94409a6 ARROW-906: [C++/Python] Read and write field metadata in IPC
omit d19089e ARROW-2641: [C++] Avoid spurious memset() calls, improve bitmap write performance
omit cdacb09 ARROW-2644: [Python] Fix prototype declaration in Parquet binding
omit d8bce06 ARROW-2632: [Java] ArrowStreamWriter accumulates ArrowBlock but does not use them
omit 1a922fd ARROW-2593: [Python] TypeError: data type "mixed-integer" not understood
omit 6646864 ARROW-2636: [Ruby] Add missing "unofficial" notes
omit ce23c06 ARROW-1163: [Java] Java client support for plasma
omit 01202cc ARROW-2568: [Python] Expose thread pool size setting to Python, and deprecate "nthreads" where possible
omit 338e597 ARROW-2537: [Ruby] Import
omit 5c5e95a ARROW-2604: [Java] Add convenience method to VarCharVector to set Text
omit d9f0cca ARROW-2630: [JAVA] typo fix
omit fc7a382 ARROW-2116: [JS] implement IPC writers
omit 1d9d893 ARROW-2629: [Plasma] Iterator invalidation for pending_notifications_
omit fcc13f5 ARROW-2585: [C++] Add Decimal::FromBigEndian, which was formerly a static method in parquet-cpp/src/parquet/arrow/reader.cc
omit 0374adb ARROW-2613: [Docs] Update the gen_apidocs docker script
omit 15e416e ARROW-2614: Remove 'group: deprecated' in Travis
omit 6132fd3 ARROW-2615: [Rust] Post refactor cleanup
omit f319bca ARROW-2597: [Plasma] remove UniqueIDHasher
omit bd25a65 ARROW-2612: [Plasma] Fix deprecated PLASMA_DEFAULT_RELEASE_DELAY
omit 3d41978 ARROW-2611: [Python] Fix Python 2 integer serialization
omit bd54041 [GLib] Use the default directory of GTK-Doc (#2058)
omit 936115c ARROW-2594: [Java] When realloc Vectors, zero out all unfilled bytes of new buffer
omit 635ee1f ARROW-2521: [Rust] Refactor Rust API to use traits and generic to represent Array instead of enum
omit 7764bc8 ARROW-2574: [Python] Add Cython and Python code coverage
omit 941a1b7 ARROW-2486: [C++/Python] Provide a Docker image that contains all dependencies for development
omit df20683 ARROW-2595: [Plasma] Use map.find instead of operator[] to avoid producing garbage data
omit e237918 ARROW-2561: [C++] Fix double free in cuda-test under code coverage
omit 5bb3d85 ARROW-2589: [Python] Workaround regression in Pandas 0.23.0
omit 6ca246a ARROW-2582: [GLib] Add negate functions for Decimal128
omit 38db8ed ARROW-2558: [Plasma] avoid walk through all the objects when a client disconnects
omit 71d487a ARROW-2584: [JS] Fixes for node v10
omit 48eee79 Removing extraneous debug print statement from run_clang_format.py (#2045)
omit 27fc25c ARROW-2332: Add Feather Dataset class
omit df9bdc1 Serialize tensors in PyTorch 0.4 (#2033)
omit 75acaba ARROW-2577: [Plasma] Add asv benchmarks for plasma
omit 63da09a ARROW-2580: [GLib] Fix abs functions for Decimal128
omit 5a29ab8 ARROW-2563: [Rust] Poor caching in Travis-CI
omit 4b8511f ARROW-2578: [Plasma] Use mersenne twister to generate random number
omit 19af862 ARROW-2576: [GLib] Add abs functions for Decimal128
omit 90fb5a3 ARROW-2571: [C++] Lz4Codec doesn't properly handle empty data
omit da3f843 ARROW-2569: [C++] Improve thread pool size heuristic
omit 321773c ARROW-2567: [C++] Not only compare type ids on Array equality
omit e1c3d4b ARROW-2517: [Java] Add list<decimal> writer (#1965)
omit 6a7ccd2 ARROW-2207: [GLib] Support GArrowDecimal128
omit 1d42efa ARROW-2500: [Java] IPC Writers/readers are not always setting validity bits correctly
omit 1c1c187 ARROW-2570: [Python] Add support for writing parquet files with LZ4 compression
omit bb47c36 ARROW-2565: [Plasma] new subscriber cannot receive notifications about existing objects
omit 2093f6e ARROW-2479: [C++] Add ThreadPool class
omit 414268b ARROW-1964: [Python] Expose StringBuilder to Python
omit b93faac ARROW-2566: [CI] Add codecov.io badge
omit 777e6b5 ARROW-2562: [CI] C++ and Rust code coverage using codecov.io
omit a0299bf ARROW-2564: [C++] Replace deprecated method in documentation
omit 35da703 ARROW-2557: [Rust] Add badge for code coverage in README
omit ac91d72 ARROW-2552: [Plasma] Fix memory error
omit bb67939 ARROW-2491: [Python] raise NotImplementedError on from_buffers with nested types
omit a426c1b ARROW-2549: [GLib] Apply arrow::StatusCode changes to GArrowError
omit 64923d5 ARROW-2550: [C++] Add missing status codes into arrow::Status::CodeAsString()
omit 488a8c0 ARROW-2546: [JS] Update to npm>=5.7.1 to fight EINTEGRITY problems
omit 0f07171 ARROW-2540: [Plasma] Create constructors & destructors for ObjectTableEntry
omit 9c31eec ARROW-2545: [Python] Link against required system libraries
omit c46f625 ARROW-2477: [Rust] Set up code coverage in CI
omit 0ecbbf4 ARROW-2285: [C++/Python] Can't convert Numpy string arrays
omit 0ef8ce3 ARROW-2548: Clarify `List<Char>` Array example
omit 0cb992a ARROW-2547: Fix off-by-one in `List<List<byte>>` example
omit a28a198 ARROW-2389: [C++] Add CapacityError
omit 2f453a0 ARROW-2544: [CI] Run the C++ tests with two jobs
omit 1b78ac2 ARROW-2543: [Rust] Cache dependencies when building our rust library
omit bcd5967 [Website] Update SciDB in "Powered By" (#2004)
omit 3d594bc ARROW-2273: [Python] Raise NotImplementedError when pandas Sparse types serializing
omit 5bdfff8 ARROW-2541: [Plasma] Replace macros with constexpr
omit b916c79 ARROW-2539: [Plasma] Use unique_ptr instead of raw pointer
omit 73f0d8e ARROW-2478: [C++] Introduce a checked_cast function that performs a dynamic_cast in debug mode
omit 8428c51 ARROW-2516: [CI] Filter changes in AppVeyor builds
omit 26c6805 ARROW-1886: [C++/Python] Flatten struct columns in table
omit 8797390 ARROW-2522: [C++] Version shared library files
omit f75bbc0 [C++] Fix a typo in cpplint (#1986)
omit c884f32 ARROW-2536: [Rust] optimize capacity allocation for ListBuilder
omit fbce08d ARROW-2511: [Java] Fix BaseVariableWidthVector.allocateNew to not swallow exception (#1947)
omit 6bf1c66 ARROW-2505: [C++] Disable MSVC warning C4800
omit 7323b60 ARROW-2493: [Python] Add support for pickling to buffers and arrays
omit 15e4811 ARROW-2531: [C++] Update clang bits to 6.0
omit 4cc9157 ARROW-2466: [C++] Fix "append" flag to FileOutputStream
omit 5bef985 ARROW-2332: Feather Reader option to return Table
omit 9b76ee4 ARROW-2533: [CI] Fast finish failing AppVeyor builds
omit 6f9c4db ARROW-2534: [C++] Hide all zlib symbols from libarrow.so
omit 2bc110d ARROW-2499: [C++] Factor out Python iteration routines
omit 0562d3b ARROW-2417: [Rust] Fix API safety issues
omit eda5ca8 ARROW-2509: Build for node 9.8
omit a3aaff5 ARROW-2503: [Python] Prevent trailing space character for string statistics
omit ea76265 ARROW-2484: [C++] Document ABI compliance checking
omit f056ef0 ARROW-2485: Re-write of run_clang_format.py, such that it outputs the diffs of th…
omit 113835a ARROW-2530: [GLib] Support out-of-source directory build again
omit 138c491 ARROW-2422: Support more operators for partition filtering
omit 4ac7b29 ARROW-2507: [Rust] Don't take a reference when not needed.
omit 3c8cb4d ARROW-2482: [Format] Clarify struct field alignment
omit 03be2a0 ARROW-2525: [GLib] Add garrow_struct_array_flatten()
omit 109942c ARROW-2527: [GLib] Enable GPU document
omit 1c5f06e ARROW-2474: [Rust] Add windows support for memory pool abstraction
omit af5bd80 ARROW-2526: [GLib] Update .gitignore
omit 07e0778 ARROW-2302: [GLib] Unify GNU Autotools build and Meson build into one Travis CI job
omit 101b319 ARROW-2462: [C++] Fix Segfault in UnpackBinaryDictionary
omit a2aba52 ARROW-2436: [Rust] Add windows CI
omit bdd5cad ARROW-2529: [C++] Update mention of clang-format to 5.0 in the docs
omit e3fafae ARROW-2513: [Python] DictionaryType should give access to index type and dictionary array
omit e8d45eb ARROW-2515: [Python] Add DictionaryValue class, fixing bugs with nested dictionaries
omit 3f5819a [GLib] Fix a typo
omit 16820a2 ARROW-2452: [TEST] Spark integration test fails with permission error
omit c8f17dd ARROW-2518: [Java] Re-instate JDK tests in matrix, but with JDK 8 instead of JDK 7
omit c574006 ARROW-2498: [Java] Use java 1.8 instead of java 1.7
omit c8a3ed8 ARROW-2286: [C++/Python] Allow subscripting pyarrow.lib.StructValue
omit 5f9cf9c ARROW-2448: [Plasma] Reference counting for PlasmaClient::Impl
omit 3d7a5a6 ARROW-2074: [Python] Infer lists of dicts as struct arrays
omit 2d278ab ARROW-2508: [Python] Fix pytest.raises msg to message
omit a609309 ARROW-2502: [Rust] Restore Windows Compatibility
omit 2abc889 ARROW-2489: [Plasma] Fix PlasmaClient ABI variation
omit b65205e ARROW-2470: [C++] Avoid seeking in GetFileSize
omit 7545e3e ARROW-2492: [Python] Prevent segfault on accidental call of pyarrow.Array
omit 77a5c59 ARROW-2494: [C++] Return status codes from PlasmaClient::Seal instead of crashing
omit 03251e9 ARROW-2427: [C++] Implement ReadAt properly
omit a5ae134 ARROW-1731: [Python] Add columns selector in Table.from_array
omit a6c9d30 ARROW-2453: [Python] Improve Table column access
omit 138717a ARROW-1858: [Python] Added documentation for pq.write_dataset
omit 5381295 ARROW-2314: [C++/Python] Fix union array slicing
omit 1ba7d51 ARROW-2222: handle untrusted inputs
omit 3b69c5a ARROW-2450: [Python] Test for Parquet roundtrip of null lists
omit 2452a46 ARROW-2393: [C++] Moving ARROW_CHECK_OK_[PREPEND] macros from status.h into util/logging.h since they use the logging infrastructure and shouldn't be in the public API.
omit 54df19d ARROW-1018: [C++] Create FileOutputStream, ReadableFile from file descriptor
omit c9ad33e ARROW-2457: [GLib] Support large is_valids in builder's append_values()
omit 4c71f30 ARROW-2390: [C++/Python] Map Python exceptions to Arrow status codes
omit 249e039 ARROW-1928: [C++] Add BitmapReader/BitmapWriter benchmarks
omit c19b1f0 ARROW-2481: [Rust] Move all calls to free() into memory.rs
omit 46fe09a ARROW-2471: [Rust] Builder zero capacity fix
omit 09be7b4 ARROW-2472: [Rust] Remove public attributes from Schema and Field and add accessors
omit 7eeca3a ARROW-2458: [Plasma] Use one thread pool per PlasmaClient
omit 1299931 ARROW-2443: [Python] Allow creation of empty Dictionary indices
omit 18999bb ARROW-2469: [C++] Make out arguments last in ReadMessage.
omit c2e0d42 ARROW-2423: [Python] Enable DataType, Field and plasma ObjectID equality checks against no…
omit d58057b ARROW-2473: [Rust] List empty slice assertion
omit 25eff99 ARROW-2468: [Rust] Builder::slice_mut() should take mut self.
omit 4c31b37 ARROW-2147: [Python] Fix type inference of numpy arrays
omit 72df18c ARROW-2465: [Plasma/GPU] Preserve plasma_store rpath
omit d7d3196 ARROW-2442: [C++] Disambiguate builder Append() overloads
omit f1ef708 ARROW-2319: [C++] Add BufferedOutputStream class
omit 2876a3f ARROW-2463: [C++] Update flatbuffers to 1.9.0
omit 66d0ad1 ARROW-2315: [C++/Python] Flatten struct array
omit 72c7f5d ARROW-2454: [C++] Allow zero-array chunked arrays
omit 2d0fbf1 ARROW-2464: [Python] Use a python_version marker instead of a condition
omit 3eee3e4 ARROW-2101: [Python/C++] Correctly convert numpy arrays of bytes to arrow arrays of strings when user specifies arrow type of string
omit b2167e4 ARROW-2435: [Rust] Add memory pool abstraction.
omit 98d250e ARROW-2397: [Documentation] Update format documentation to describe tensor alignment.
omit 7de1264 ARROW-2387: [Python] Flip test for rescale loss if value < 0
omit c96747b ARROW-2455: [C++] Initialize the atomic bytes_allocated_ properly
omit 0f87c12 ARROW-2437: [C++] Add ReadMessage without aligned argument.
omit 685147c ARROW-2451: [Python] Handle non-object arrays more efficiently in custom serializer.
omit f177404 ARROW-2369: [Python] Fix reading large Parquet files (> 4 GB)
omit 9ad8602 ARROW-2432: [Python] Fix Pandas decimal type conversion with None values
omit db03663 ARROW-2182: [Python] Build C++ libraries in benchmarks build step
omit 6e8ecb5 ARROW-2445: [Rust] Add documentation and make some fields private
omit 4009b62 ARROW-2224: [C++] Remove boost-regex dependency
omit ed7db7c ARROW-2097: [CI, Python] Reduce Travis-CI verbosity
omit 1ee7d11 ARROW-2407: [GLib] Add garrow_string_array_builder_append_values()
omit 42e195b ARROW-2440: [Rust] Implement ListBuilder<T>
omit 265142b ARROW-2441: [Rust] Builder<T>::slice_mut assertions are too strict
omit 91ec792 ARROW-2411: [C++] Add StringBuilder::Append(const char **values)
omit 6633cc9 ARROW-2433: [Rust] Add Builder.push_slice(&[T])
omit c5574f4 ARROW-2426: [GLib] Follow python -> python@3 change in Homebrew
omit ca277ae ARROW-2425: [Rust] BUG FIX: Add u8 mappings for Array::from
omit 33d92a0 ARROW-2434: [Rust] Add windows support
omit e941af8 ARROW-2391: [C++/Python] Segmentation fault from PyArrow when mapping Pandas datetime column to pyarrow.date64
omit 27417b2 ARROW-2328: [C++] Fixed and unit tested feather writing with slice
omit f56d765 ARROW-2305: [Python] Bump Cython requirement to 0.27+
omit 1bb7fba ARROW-2100: [Python] Drop Python 3.4 support
omit ad39d1f ARROW-2424: [Rust] Fix build - add missing import
omit 5030e23 ARROW-2420: [Rust] Fix major memory bug and add benches
omit abf4ed2 ARROW-2408: [Rust] Ability to get `&mut [T]` from `Buffer<T>`
omit ca3dbbb ARROW-2415: [Rust] Fix clippy ref-match-pats warnings.
omit 7376aab ARROW-2413: [Rust] Remove useless calls to format!().
omit 57db8b5 ARROW-2419: [Site] Hard-code timezone
omit b095994 ARROW-2408: [Rust] Remove build warnings
omit 55c1075 ARROW-2353: [CI] Check correctness of built wheel on AppVeyor
omit b4dafa5 ARROW-2414: Fix a variety of typos.
omit 408aa5a ARROW-2416: [C++] Support system libprotobuf
omit f88949b ARROW-2418: [Rust] BUG FIX: reserve memory when building list
omit 87284a5 [Site] Add Antoine to committers list (#1853)
omit f9c0701 ARROW-2402: [C++] Avoid spurious copies with FixedSizeBinaryBuilder
omit e3f7edc ARROW-2401: Support filters on Hive partitioned Parquet files
omit 946517d ARROW-2405: [C++] <function> is required for std::function
omit 83bfb39 ARROW-2404: [C++] Fix "declaration of 'type_id' hides class member" w…
omit 29c376d ARROW-2398: [Rust] Create Builder<T> for building buffers directly in aligned memory
omit 9515fe9 ARROW-2380: [Python] Streamline conversions
omit 045470c ARROW-2396: [Rust] Unify Rust Errors
omit 02b0c72 ARROW-2325: [Python] Update setup.py to use Markdown project description
omit 486d592 ARROW-2384: [Rust] Additional test & Trait standardization
omit 76edf43 ARROW-1463: [Java] Cleanup usage of Types.MinorType to MinorType
omit 640fc83 ARROW-2276: [Python] Expose buffer protocol on Tensor
omit 26bc4ab ARROW-2308: [Python] Make deserialized numpy arrays 64-byte aligned.
omit cf39686 ARROW-2195: [Plasma] Return auto-releasing buffers
omit 7081752 ARROW-2385: [Rust] implement to_json for DataType and Field
omit 806979b ARROW-2382: [Rust] Bug fix: List was not using aligned mem
omit 933b32b ARROW-2388: [C++] Use valid_bytes API for StringBuilder::Append
omit 82d4555 ARROW-2141: [Python] Support variable length binary conversion from Pandas
omit b0f376a Fix broken build on master (remove duplicate Drop impl for Buffer) (#1828)
omit 9fc4d89 DOC: Fix a tiny typo in parquet documentation (#1824)
omit 65493a6 ARROW-2014: [Python] Document read_pandas method in pyarrow.parquet
omit 65d2558 ARROW-2351: [C++] StringBuilder::append(vector<string>...) not impleme…
omit 4c68eca ARROW-2375: [Rust] Implement Drop for Buffer so memory is released
omit fce183c ARROW-2378: [Rust] Rustfmt
omit b6e8b4b ARROW-2381: [Rust] Adds iterator support to Buffer<T>
omit fff992a ARROW-2122: [Python] Pyarrow fails to serialize dataframe with timestamp.
omit 11b15a5 ARROW-2357: [Python] Add microbenchmark for PandasObjectIsNull()
omit 8fdad18 ARROW-2377: [GLib] Support old GObject Introspection
omit 7e27cf5 ARROW-2376: [Rust] Travis builds the Rust library
omit d2d4cc7 ARROW-2371: [GLib] Update "Requires" in .pc on GNU Autotools build
omit be049fa ARROW-2370: [GLib] Fix include path in .pc on Meson build
omit 00b334f [Rust] Update READMEs to add Rust libraries link and to remove out-of-date comment about memory alignment (#1817)
omit 3975de5 Update README.md to include new components
omit 3f72d14 ARROW-2361: [Rust] Starting point for a native Rust implementation of Arrow
omit ba0cea3 ARROW-2140: [Python] Improve float16 support
omit 97f5ec0 [C++] Fix documentation typo in arrow/array.h
omit 866e9b8 ARROW-2327: [JS] Table.fromStruct missing from externs
omit f29e5a1 ARROW-2368: [JAVA] Correctly pad negative values in DecimalVector#setBigEndian (#1809)
omit 3d4b6c1 ARROW-2356: [JS] Fix JSON Reader FixedSizeBinary Vectors
omit f9f8320 ARROW-2354: [C++] Make PyDecimal_Check() faster
omit 27f5a42 ARROW-2301: [Python] Build source distribution inside the manylinux1 docker
omit 6156b1d ARROW-640: [Python] Implement __hash__ and equality for Arrow Array scalar values
omit 9c7e06b ARROW-2348: [GLib] Remove GLib + Go example
omit 29f744f ARROW-2350: Consolidated RUN step in spark_integration Dockerfile
omit af6e3ec ARROW-1913: [Java] Disable Javadoc doclint with Java 8
omit 7b2c797 ARROW-2349: [Python] Opt in to bundling Boost shared libraries separately
omit 777f986 ARROW-2331: [Python] Fix indexing for negative or out-of-bounds indices
omit a0ca9b4 ARROW-2346: [Python] Fix PYARROW_CXX_FLAGS with multiple options
omit e6d8eed ARROW-2322: [Java] Document dev environment requirements for publishing Java release artifacts
omit 0c8d164 ARROW-2345: [Documentation] Fix bundle exec and set sphinx nosidebar to True
omit 29268ec ARROW-2342: [Python] Allow pickling more types
omit f50d858 ARROW-2343: [Java/Packaging] Run mvn clean in API doc builds
omit eecb1bc ARROW-2281: [Python] Add Array.from_buffers()
omit d623567 ARROW-2341: [Python] Improve pa.union() mode argument behaviour
omit 47fcef3 ARROW-2334: [C++] Update boost to 1.66.0
omit 07beb51 ARROW-2333: [Python] Fix bundling boost with default namespace
omit f45abf0 [Website] Add link to press release
omit 948cb4a ARROW-2336: [Website] Add 0.9.0 release blog post
omit 607c7fa ARROW-2340: [Website] Add blog post about Go code donation
omit 60848c0 ARROW-2299: [Go] Import Go arrow implementation from influxdata/arrow
omit a50ef9f ARROW-2329: [Website] 0.9.0 release update
omit bb17a0d [maven-release-plugin] prepare for next development iteration
omit c695a5d [maven-release-plugin] prepare release apache-arrow-0.9.0
omit 7be8d37 [Release] Update CHANGELOG.md for 0.9.0
omit 95ba6ef ARROW-2321: [C++] Release verification script fails if CMAKE_INSTALL_LIBDIR is not $ARROW_HOME/lib
omit 82c8b6f ARROW-2318: [Plasma] Run plasma store tests with unique socket
omit 79e19c3 [JS] Small fixes to source release workflow and e-mail template (#1750)
omit e29df7d ARROW-2320: [C++] Vendored Boost build does not build regex library
omit 20ea781 [Python] Pin Cython to 0.27.3 in verify-release-candidate.sh (#1758)
omit 60749b2 ARROW-2316: [C++] Revert Buffer::mutable_data to inline so that linkers do not have to remember to define NDEBUG for release builds
omit 019a560 ARROW-2309: [C++] Use std::make_unsigned
omit 630ce5e ARROW-2311: [Python/C++] Fix struct array slicing
omit b185951 ARROW-2313: [C++] Add -NDEBUG flag to arrow.pc
omit 98012cb ARROW-2312: [JS] run test_js before test_integration
omit e25e3ef ARROW-2307: [Python] Allow reading record batch streams with zero record batches
omit 385656c ARROW-2304: [C++] Fix HDFS MultipleClients unit test
omit a430758 ARROW-2306: [Python] Fix partitioned Parquet test against HDFS
omit 33d1091 ARROW-2227: [Python] Fix off-by-one error in chunked binary conversions
omit 7c7b09f ARROW-1643: [Python] Accept hdfs:// prefixes in parquet.read_table and attempt to connect to HDFS
omit 0b28dc5 ARROW-2142: [Python] Allow conversion from Numpy struct array
omit 171340f ARROW-2135: [Python] Fix NaN conversion when casting from Numpy array
omit 6fc9922 ARROW-2118: [C++] Fix misleading error when memory mapping a zero-length file
omit 317b543 ARROW-2293: [JS] Print release vote e-mail template when making source release
omit 58fa873 ARROW-2282: [Python] Create StringArray from buffers
omit 3917e85 ARROW-2292: [Python] Rename frombuffer() to py_buffer()
omit 8f2ff30 ARROW-2240: [Python] Array initialization with leading numpy nan fails with exception
omit c7b3c05 ARROW-2297: [JS] babel-jest is not listed as a dev dependency
omit dc45a1a ARROW-2099: [Python] Add safe option to DictionaryArray.from_arrays to do boundschecking of indices by default
omit d64a231 ARROW-2181: [PYTHON][DOC] Add doc on usage of concat_tables
omit 2f718d7 ARROW-2262: [Python] Support slicing on pyarrow.ChunkedArray
omit 907a27d ARROW-2288: [Python] Fix slicing logic
omit 412bb91 ARROW-2291: [C++] Add additional libboost-regex-dev to build instructions in README
omit d0284cb ARROW-2236: [JS] Add more complete set of predicates
omit fc9f89a ARROW-2250: [Python] Do not create a subprocess for plasma but just use existing process
omit c7c2393 ARROW-2269: [Python] Make boost namespace selectable in wheels
omit 3511c65 ARROW-2268: Drop usage of md5 checksums for source releases, verification scripts
omit 8167472 ARROW-2275: [C++] Guard against bad use of Buffer.mutable_data()
omit 7354a19 ARROW-2284: [Python] Fix error display on test_plasma error
omit 23d08b7 ARROW-2150: [Python] Raise NotImplementedError when comparing with pyarrow.Array for now
omit 40a0008 [Python] Adding more missing Linux dependencies to developer docs
omit f56fdc9 ARROW-2270: [Python] Fix lifetime of ForeignBuffer base object
omit 04f4e6b ARROW-2289: [GLib] Add Numeric, Integer, FloatingPoint data types
omit 34b18f7 ARROW-1940: [Python] Extra metadata gets added after multiple conversions between pd.DataFrame and pa.Table
omit f3f91b0 ARROW-2263: [Python] Prepend local pyarrow/ path to PYTHONPATH in test_cython.py
omit 5e945a3 ARROW-2239: [C++] Update Windows build docs
omit c372dfb ARROW-2280: [Python] Return the offset for the buffers in pyarrow.Array
omit fb2316c ARROW-2238: [C++] Detect and use clcache in cmake configuration
omit 9effbed ARROW-2283: [C++] Support Arrow C++ installed in /usr detection by pkg-config
omit 60c8081 ARROW-2261: [GLib] Improve memory management for GArrowBuffer data
omit 5f8a793 ARROW-2279: [Python] Better error message if lib cannot be found
omit a58bd72 ARROW-2272: [Python] Clean up leftovers in test_plasma.py
omit cde18a6 ARROW-2234: [JS] Read timestamp low bits as Uint32s
omit 51e117d ARROW-2154: [Python] Implement equality on buffers
omit 57e4dd8 ARROW-2265: [Python] Use CheckExact when serializing lists and numpy arrays.
omit 06e9fb4 [Python] Add missing dependency to development.rst
omit 01a099c ARROW-2199: [JAVA] Control the memory allocated for inner vectors in containers. (#1646)
omit 45f5da2 ARROW-1982: [Python] Coerce Parquet statistics as bytes to more useful Python scalar types
omit c6359cb ARROW-1929: [C++] Copy over testing utility code from PARQUET-1092
omit 55bdae5 ARROW-2254: [Python] Ignore JS tags in local dev versions
omit 49f1d00 ARROW-2258: [Python] Add additional information to find Boost on windows
omit b89c124 ARROW-2253: [Python] Support __eq__ on scalar values
omit 9ceda35 ARROW-2244: [C++] Add unit test to explicitly check that NullArray internal data set correctly in Slice operations
omit 03db8a3 ARROW-2251: [GLib] Keep GArrowBuffer alive while GArrowTensor for the buffer is live
omit 6e699d7 ARROW-2252: [Python] Create buffer from address, size and base
omit 8b1c811 ARROW-2245: ARROW-2246: [Python] Revert static linkage of parquet-cpp in manylinux1 wheel
omit 34c33f1 [Python] Document serialization parameter as "string" instead of "bytes"
omit 5994094 ARROW-2209: [Python] Partition columns are not correctly loaded in schema of ParquetDataset
omit f403804 ARROW-2205: [Python] Option for integer object nulls
omit 29495ce ARROW-2176: [C++] Extend DictionaryBuilder to support delta dictionaries
omit 99899d6 ARROW-2232: [Python] pyarrow.Tensor constructor segfaults
omit bfac60d ARROW-2145/ARROW-2153/ARROW-2157/ARROW-2160/ARROW-2177: [Python] Decimal conversion not working for NaN values
omit b2eb6ac ARROW-1632: [Python] Permit categorical conversions in Table.to_pandas on a per-column basis
omit 8b3bbae ARROW-2198: [Python] correct docstring for parquet.read_table
omit af2047e ARROW-2215: [Plasma] Hugetables munmap issue
omit 5321582 ARROW-2231: [CI] Use clcache on AppVeyor for faster builds
omit 3d5880a ARROW-2040: [Python] Deserialized Numpy array must keep ref to underlying tensor
omit 671b53c ARROW-2046: [Python] Support path-like objects
omit 1d9b834 ARROW-2225: [JS] support tables split across buffers
omit 0a672bc ARROW-2226, ARROW-2233: [JS] Dictionary bugfixes
omit 524b522 ARROW-2218: [Python] PythonFile should infer mode when not given
omit d3fabe0 ARROW-2230: [Python] Strip catch-all tag matching from git-describe
omit 1a92846 ARROW-2223: [JS] compile src/bin as es5-cjs to all output targets
omit 482fc58 ARROW-2210: [C++] Reset ptr on failed memory allocation
omit 887e893 ARROW-1937: [Python] Document nested array initialization
omit a5c5ad2 ARROW-2203: [C++] StderrStream class
omit c017a63 ARROW-1035: [Python] Add streaming dataframe reconstruction benchmark
omit e0328b0 ARROW-2023: [C++] Fix ASAN failure on malformed / empty stream input, enable ASAN builds, add more dev docs
omit e50a8ec ARROW-2206: [JS] Document Perspective project
omit 8c493cd ARROW-2219: [JS] rename indicies to indices
omit 564fefe ARROW-2213: [JS] fix npm release
omit 5521bcf ARROW-2094: [C++] Install libprotobuf and set PROTOBUF_HOME when using toolchain
omit 655eb74 ARROW-2212: [C++/Python] Build Protobuf in base manylinux 1 docker image
omit 27d8339 ARROW-2214: [JS] add nullBitmap getter to DictionaryData that proxies to its indices' nullBitmap
omit 2fd8f0a ARROW-2204: Fix TLS errors in manylinux1 build
omit c0b0e33 ARROW-2191: [C++] Only use specific version of jemalloc
omit e2dd864 ARROW-2184: [C++] Add static constructor for FileOutputStream returning shared_ptr to OutputStream
omit cca4a74 ARROW-2197: Document C++ ABI issue and workaround
omit 3e3f7c2 ARROW-2066: [Python] Document using pyarrow with Azure Blob Store
omit 2f01658 ARROW-2201: [Website] Publish JS API Docs
omit c2865d0 ARROW-2093: [Python] Do not install PyTorch in Travis CI
omit d52f2ff [Dev] Follow-up, use angle brackets for commit author instead of square brackets
omit 81bfb38 ARROW-2185: Strip CI directives from commit messages
omit 27f7eba ARROW-2069: [Python] Add note that Plasma is not supported on Windows
omit cdc347c ARROW-2132: Add link to Plasma in main README
omit 5f10067 ARROW-2180: [C++] Remove deprecated APIs from 0.8.0 cycle
omit bcbcf02 [JS] Fix typo in npm target for esNext/CommonJS. (#1645)
omit 3e87f77 ARROW-2131: [Python] Prepend module path to PYTHONPATH when spawning subprocess
omit 897cc4d ARROW-1345: [Python] Test conversion from nested NumPy arrays with smaller int, float types
omit 9fefc23 ARROW-2162: [Python/C++] Decimal Values with too-high precision are multiplied by 100
omit 9298c93 ARROW-2192: [CI] Always build on master branch and repository
omit 7d11d02 ARROW-2190: [GLib] Add add/remove field functions for RecordBatch
omit 94fd3ee ARROW-2172: [C++/Python] Fix converting from Numpy array with non-natural stride
omit f357906 ARROW-1942: [C++] Hash table specializations for small integers
omit e06cfdd ARROW-2179: [C++] Install omitted headers in arrow/util
omit ac2637a ARROW-2175: [Python] Install Arrow libraries in Travis CI builds when only Python directory is affected
omit 46aa99e ARROW-2121: [Python] Handle object arrays directly in pandas serializer.
omit 7d992de [Release] Apache Arrow JavaScript 0.3.0
omit 77f2841 ARROW-2159: [JS] Support custom predicates
omit 8e90836 ARROW-2168: [C++] Build toolchain on CI with jemalloc
omit 3da9fd3 ARROW-2178: [JS] Fix JS html FileReader example
omit d5c507a ARROW-2143: [Python] Provide a manylinux1 wheel for cp27m
omit f8445a3 ARROW-2171: [C++/Python] Make OwnedRef safer
omit 64d2af6 ARROW-2144: [JS] Don't repeat dictionary lookups in DataFrame ops
omit 080ce12 ARROW-2173: [C++/Python] Hold the GIL in NumPyBuffer destructor
omit d64e144 ARROW-2170: [Python] construct_metadata fails on reading files where no index was preserved
omit 2106152 ARROW-2163: [CI] Make apt installs explicit
omit 864c939 ARROW-2174: [JS] export arrow format and schema enums
omit a1a34b8 ARROW-2169: [C++] MSVC is complaining about uncaptured variables
omit 62b9eb2 ARROW-1579: [Java] Adding containerized Spark Integration tests
omit c71a565 ARROW-2117: [C++] Update codebase / CI toolchain for clang 5.0
omit 7c37b0d ARROW-2161: [Python] Skip test_cython_api if ARROW_HOME isn't defined
omit e8870d1 ARROW-2166: [GLib] Add Slice api to Column
omit 148ab9c ARROW-2156: [CI] Isolate Sphinx dependencies
omit c077986 ARROW-2068: [Python] Expose array's buffers
omit 0265fb4 ARROW-2151: [Python] Fix conversion from np.uint64 scalars
omit e15f545 ARROW-2039: [Python] Avoid crashing on uninitialized Buffer
omit 7c88443 [Website] Add SciDB to "Powered By" (#1604)
omit 78152f1 ARROW-1815: [Java] Rename MapVector to StructVector
omit 5dce01f ARROW-2155: [Python] frombuffer() should respect mutability of argument
omit c78c92a ARROW-2149: [Python] Reorganize test_convert_pandas.py
omit d28f055 ARROW-2146: [GLib] Add Slice api to ChunkedArray
omit 4a8a102 ARROW-969: [C++] Add add/remove field functions for RecordBatch
omit 0ffc882 ARROW-1998: [Python] fix crash on empty Numpy arrays
omit 30ab43f ARROW-2124: [Python] Add test for empty item in array
omit cf00b57 ARROW-2138: [C++] abort on failed debug check
omit e8a93ca ARROW-1021: [Python] Add documentation for C++ pyarrow API
omit 62c55ec ARROW-2133: [Python] Fix segfault on conversion of empty nested array to Pandas
omit 296e7b0 ARROW-1912: [Website] Add committer affiliations and roles to website
omit 31a1b9b [Website] Add FPGA acceleration framework Fletcher to "Powered By" (#1593)
omit 08d664a ARROW-2137: [Python] Don't print paths that are ignored when reading Parquet files
omit 90d9daf ARROW-2129: [Python] Handle conversion of empty tables to Pandas
omit f7d3c64 ARROW-2134: [CI] Make Travis-CI commit inspection more robust
omit a6bcaa7 ARROW-2106: [Python] Add conversion for a series of datetime objects
omit 41a42de ARROW-2128: [Python] Support arrays of empty lists
omit 9d9cc8f ARROW-2049: [Python] Use python -m cython to run Cython, instead of CYTHON_EXECUTABLE
omit b18e159 ARROW-1973: [Python] Memory leak when converting Arrow tables with array columns to Pandas dataframes.
omit ddae240 ARROW-2120: [C++] Add possibility to use empty _MSVC_STATIC_LIB_SUFFIX for Thirdparties
omit 0417b14 ARROW-2123: [JS] Upgrade to TS 2.7.1
omit 163be42 [Doc] Refine top of README, add GLib bindings to README, fix ASF link
omit 4fe3a0b ARROW-2114: [Python] Pull latest docker manylinux1 image [skip appveyor]
omit 88b72df ARROW-2073: [Python] Create struct array from sequence of tuples
omit 6e6f9b7 ARROW-2083: [CI] Detect changed components on Travis-CI
omit 7bf7b2e ARROW-1950: [Python] pandas_type in pandas metadata incorrect for List types
omit f69e9db ARROW-633/634: [Java] Add FixedSizeBinary support in Java and integration tests (Updated)
omit ea4c7b1 ARROW-2110: [Python] Only require pytest-runner on test commands
omit 45ad0b0 ARROW-2087: [Python] Binaries of 3rdparty are not stripped in manylinux1 base image
omit 90bb4bd ARROW-2111: [C++] Lint in parallel
omit bd1e6e5 ARROW-2095: [C++] Less verbose building 3rd party deps
omit 5dd9bff ARROW-2107: [GLib] Follow arrow::gpu::CudaIpcMemHandle API change
omit 57563cd ARROW-2109: [C++] Completely disable boost autolink on MSVC build
omit 3b6b93d ARROW-2108: [Python] Update instructions for ASV
omit 54859c5 ARROW-1394: [Plasma] Add optional extension for allocating memory on GPUs
omit 310e5b1 ARROW-1757: [C++] Add DictionaryArray::FromArrays alternate ctor that can check or sanitize "untrusted" indices
omit 2a881a0 ARROW-2044: [JS] Typings should be a regular dependency
omit 1a8c9a4 ARROW-1976: [Python] Handling unicode pandas columns on parquet.read_table
omit 0d02a7d ARROW-2080: [Python] Update documentation about pandas serialization context.
omit c49636d ARROW-2086: [Python] Shrink size of arrow_manylinux1_x86_64_base docker image
omit 11c9b42 ARROW-2090: [Python] Add context methods to ParquetWriter
omit 30ade84 ARROW-2071: [Python] Fix test slowness on Travis-CI
omit bdedf23 ARROW-2088: [GLib] Add GArrowNumericArray
omit de850b9 ARROW-2089: [GLib] Rename to GARROW_TYPE_BOOLEAN for consistency
omit 416d565 ARROW-2071: [Python] Lighten serialization tests
omit febc19d ARROW-1589: [C++] Fuzzing for certain input formats
omit d949ee6 ARROW-2084: [C++] Support newer Brotli static library names
omit e26f3da ARROW-2085: [Python] HadoopFileSystem.isdir/.isfile return False on missing paths
omit 2e9f7dd ARROW-1706: [Python] Coerce array inputs to StructArray.from_arrays. Flip order of arguments
omit 5042863 ARROW-1754: [Python] alternative fix for duplicate index/column name that preserves index name if available
omit a1fd796 ARROW-2050: [Python] Support `setup.py pytest`
omit 3098c14 ARROW-2052: [C++ / Python] Rework OwnedRef, remove ScopedRef
omit e327747 ARROW-1990: [JS] C++ Refactor, Add DataFrame
omit f84af8f ARROW-2065: [Python] Fix bug in SerializationContext.clone().
omit c1d77a1 ARROW-2076: [Python] Display slowest test durations
omit 0ada875 ARROW-1861: [Python] Rework benchmark suite [skip ci]
omit ff28c76 ARROW-2024: [Python] Remove torch serialization from default serialization context.
omit 2d649f9 ARROW-1623: [C++] Add convenience method to construct Buffer from a string that owns its memory
omit 1ed4019 ARROW-2072: [Python] Fix crash in decimal128.byte_width
omit 0e04f6d ARROW-2070: [Python] Fix chdir logic in setup.py
omit 0d6817a ARROW-2042: [Plasma] Revert API change of plasma::Create to output a MutableBuffer
omit e112995 ARROW-2062: [Python] Do not use memory maps in test_serialization.py to try to improve Travis CI flakiness
omit cd0676f ARROW-2064: [GLib] Add common build problems link to the install section
omit 3e63084 ARROW-2036: [Python] Support standard IOBase methods on NativeFile
omit 5c704bc ARROW-1705: [Python] allow building array from dicts
omit 8d78376 ARROW-2047: [Python] Use sys.executable instead of one in the search path.
omit 673125f ARROW-2054: [C++] Fix compilation warnings
omit 40dd9cc ARROW-2033: [Python] Fix pa.array() with iterator input
omit 0621765 ARROW-2048: [Python/C++] Update Thrift pin to 0.11
omit d322634 ARROW-1992: [C++/Python] Fix segfault when string to categorical empty string array
omit e50b1b3 ARROW-2028: [Python] extra_cmake_args needs to be passed through shlex.split
omit 0543953 ARROW-1646: [Python] Handle NumPy scalar types
omit 450bf47 ARROW-1835: [C++] Create Arrow schema from std::tuple types
omit edde5c1 ARROW-1999: [Python] Type checking in `from_numpy_dtype`
omit 6299a9c ARROW-2032: [C++] ORC ep installs on each call to ninja build
omit a71bc83 ARROW-2010: [C++] Do not suppress shorten-64-to-32 warnings from clang, fix warnings in ORC adapter
omit 074eafc ARROW-2043: [C++] change description from OS X to macOS
omit a95465b ARROW-2035: [C++] Update vendored cpplint.py to a Py3-compatible one
omit f680dac ARROW-2007: [Python] Implement float32 conversions, use NumPy dtype when possible for inner arrays
omit bfce44b ARROW-2017: [Python] Use unsigned PyLong API for uint64 values over int64 range
omit 51046a0 ARROW-1961: [Python] Preserve pre-existing schema metadata in Parquet files when passing flavor='spark'
omit 8edd62e ARROW-2031: [Python] HadoopFileSystem is pickleable
omit 1a9d024 ARROW-2019: [JAVA] Control the memory allocated for inner vector in LIST (#1497)
omit 68b119b ARROW-2029: [Python] NativeFile.tell errors after close
omit db83fb4 [C++] Update README for linting (#1515)
omit 6bb1d1b ARROW-2003: [Python] Remove use of fastpath parameter to pandas.core.internals.make_block
omit 2126ebf ARROW-2025: [C++] Creating multiple equivalent `HadoopFileSystem`s works fine
omit 0a49022 ARROW-1712: [C++] Add method to BinaryBuilder to reserve space for value data
omit 0930b1d ARROW-2018: [C++] fix Build instruction on macOS and Homebrew
omit 72dea17 ARROW-1997: [C++/Python] Ignore zero-copy-option in to_pandas when `strings_to_categorical` is True
omit 422efd9 ARROW-1580: [Python] Instructions for setting up nightly builds on Linux
omit ed27243 ARROW-2012: [GLib] Support "make distclean"
omit 1bbaf7e [Python] Fix small typos in bytes, String/UTF-8 and FixedSizeBinary type check exceptions. (#1495)
omit d135974 ARROW-2000: [Plasma] Deduplicate file descriptors when replying to GetRequest.
omit e446084 ARROW-2011: [Python] Allow setting the pickler in the serialization context.
omit 9e4a6e4 ARROW-1930: [C++] Adds Slice operation to ChunkedArray and Column
omit 305b54c ARROW-1872: [Website] Minor edits and addition of YAML for versions
omit a11da7f ARROW-2005: [Python] Fix incorrect flake8 config path to Cython lint config
omit bc9f9e5 ARROW-1966: [C++] Accommodate JAVA_HOME on Linux that includes the jre/ directory, or is the full path to directory with libjvm
omit 58a24c5 ARROW-2004: [C++] Add shrink_to_fit parameter to BufferBuilder::Resize, add Reserve method
omit 1ffce26 ARROW-1856: [Python] Auto-detect Parquet ABI version when using PARQUET_HOME
omit 9e2fc04 ARROW-2002: [Python] check write_queue is not full and writer_thread is alive before enqueue new record when download file.
omit 9be080f ARROW-1991: [Website] Fix Docker documentation build
omit 99e58da ARROW-1979: [JS] Fix JS builds hanging in es2015
omit b49e8f3 ARROW-1971: [Python] Add pandas serialization to the default
omit f82b7e4 ARROW-1927: [Plasma] Add delete function
omit 9eae508 ARROW-764: [C++] Improves performance of CopyBitmap and adds benchmarks
omit 289e205 ARROW-1977: [C++] Update windows dev docs
omit 3e14e12 ARROW-1978: [Website] Consolidate Powered By project list, add more visibly to front page
omit d0a93ba ARROW-1980: [Python] Fix race condition in write_to_dataset
omit 1b0732c ARROW-1965: [GLib] Add garrow_array_builder_get_value_data_type()
omit ee134f0 ARROW-1969: [C++] Don't build ORC extension by default
omit 95d894d ARROW-1972: [Python] Import pyarrow in DeserializeObject.
omit 234ff71 ARROW-1958: [Python] Error in pandas conversion for datetimetz row index
omit bda85bb ARROW-1970: [GLib] Add garrow_chunked_array_get_value_data_type() and garrow_chunked_array_get_value_type()
omit 4dbce60 ARROW-1962: [Java] Adding reset to ValueVector interface
omit 0115e93 ARROW-1919: [Plasma] Test that object ids are 20 bytes
omit cb9c52e ARROW-1909: [C++] Enables building with benchmarks on windows
omit 3a69efc ARROW-1920 [C++/Python] Add experimental reader for Apache ORC files
omit 4a3e6e3 ARROW-1941: [Python] Fix empty list roundtrip in to_pandas
omit 37c3265 ARROW-1946: [JAVA] Add APIs to decimal vector for writing big endian data
omit 0f38a95 ARROW-1947: [Plasma] Change Client Create and Get to use Buffers
omit 4daffad ARROW-1953: [JS] Fix JS build
omit d86fdc7 Fix a comment typo (#1448)
omit 0401e6d ARROW-1945: [C++] Fix doxygen documentation of array.h
omit 2ca69d1 ARROW-1948: [Java] Load ListVector validity buffer with BitVectorHelper to handle all non-null
omit 16c79cc ARROW-1951: [Python] Add memcopy threads argument to PlasmaClient put.
omit 8986521 ARROW-1943: [JAVA] handle setInitialCapacity for deeply nested lists
omit 65f5add ARROW-1944: [C++] Fix ARROW_STATIC_LIB in FindArrow
omit ce95db3 ARROW-1931: [C++] Suppress C4996 deprecation warning in MSVC builds for now
omit ba00956 ARROW-1939: Correct links in release blog post
omit 9895181 ARROW-1934: [Website] 0.8.0 release highlights blog post
omit ac789ba ARROW-232: [Python] Add unit test for writing Parquet file from chunked table
omit bcfd83d ARROW-1935: [Website] Remove link to nightly builds. Fix signature / checksum links, add verification instructions
omit d023b40 ARROW-1922: Blog post on JAVA vector changes
omit 9335e28 ARROW-1832: [JS] Implement JSON reader for integration tests
omit 44c5a7c ARROW-1926: [GLib] Add garrow_timestamp_data_type_get_unit()
omit db72bfe ARROW-1932: [Website] Update site for 0.8.0 release info
omit 72e660a ARROW-1933: [GLib] Fix build error with --with-arrow-cpp-build-dir
omit 9e262f4 ARROW-1924: [Python] Bring back pickle=True option for serialization
omit 5afae14 [maven-release-plugin] prepare for next development iteration
omit 1d689e5 [maven-release-plugin] prepare release apache-arrow-0.8.0
omit 3afb8f4 [Release] Update CHANGELOG.md for 0.8.0
omit e4770b2 ARROW-1917: Fixes to enable verify-release-candidate.sh to work for 0.8.0
omit 8d006dc ARROW-1915: [Python] Add missing parquet decorator to decimal tests
omit 4f1bc97 ARROW-1916: [Java] Include java/dev/checkstyle in git archive for source releases
omit 16ddb12 ARROW-1914: [C++] Fix build dependency for GPU support build
omit 0095c4e ARROW-1911: [JS] Add Graphistry to Arrow JS proof points
omit 6a7ce32 ARROW-1904: [C++] Deprecate PrimitiveArray::raw_values
omit abb9341 ARROW-1905: [Python] Add more comprehensive list of exact type checking functions to pyarrow.types
omit 20bbbcb ARROW-1906: [Python] Do not override user-supplied type in pyarrow.array when converting DatetimeTZ pandas data
omit 97678c1 ARROW-1883: [Python] Fix handling of metadata in to_pandas when not all columns are present
omit 84f18c5 ARROW-1910: [C++] Use c_glib Brewfile in README for installing dependencies on macOS (#1407)
omit 501d60e ARROW-1895/ARROW-1897: [Python] Add field_name to pandas index metadata
omit 74b2ebe ARROW-1908: [Python] Construction of arrow table from pandas DataFrame with duplicate column names crashes
omit fcf46d9 ARROW-1902: [Python] Remove mkdir race condition from write_to_dataset
omit fe33155 ARROW-1901: [Python] Support recursive mkdir for DaskFilesystem
omit 543808d ARROW-1864: [Java] Upgrade Netty to 4.1.17
omit 2994815 ARROW-1873: [Python] Catch more possible Python/OOM errors in to_pandas conversion path
omit 64af87b ARROW-1884: [C++] Exclude integration test JSON reader/writer classes from public API
omit aaa978b ARROW-1893: [Python] Convert memoryview to bytes when loading from pickle in Python 2.7
omit ad30138 ARROW-1891: [Python] Always use NumPy NaT sentinels to mark nulls when converting to array
omit 7ed4ca7 ARROW-1867: [Java] Add missing methods to BitVector from legacy vector class
omit ad454e8 ARROW-1877: [Java] Fix incorrect equals method in JsonStringArrayList
omit 1d519d8 ARROW-1487: [C++] Implement casts from List<A> to List<B>, where a cast function is defined from any A to B
omit fb80013 ARROW-1892: [Python] Support binaries in lists
omit aad0782 ARROW-1857: [Python] Add switch for boost linkage with static parquet in wheels
omit 712b9d2 ARROW-1784: [Python] Enable zero-copy serialization, deserialization of pandas.DataFrame via components
omit aee1a0b ARROW-1889: [Python] --exclude is not available in older git versions
omit 665da71 ARROW-1890: [Python] Fix mask handling for Date32 NumPy conversions
omit 33b628a ARROW-1882: [C++] Reintroduce DictionaryBuilder
omit d64947e ARROW-1881: Ignore JS tags for Python packages
omit b241eb6 ARROW-1839/ARROW-1871: [C++/Python] Add Decimal Parquet Read/Write Tests
omit 611a4b9 ARROW-1785: [Format/C++/Java] Remove VectorLayout from serialized schemas
omit fe6f60c ARROW-1885: [Java] Restore MapVector class names prior to ARROW-1710
omit 8f2dbee ARROW-1879: [Python] Dask integration tests are not skipped if dask is not installed
omit 5dbfe30 ARROW-1863: [Python] PyObjectStringify could render bytes-like output for more types of objects
omit 3b438bc ARROW-1755: [C++] CMake option to link msvc crt statically
omit 3ee75a0 ARROW-1719: [Java] Remove accessor and mutator interface
omit ff4e407 ARROW-1878: [GLib] Add garrow_array_dictionary_encode()
omit 3bed4eb ARROW-1865: [C++] Do not alter number of rows attribute when removing last column from Table
omit ad9105e ARROW-1817: [Java] Configure JsonReader to read floating point NaN values
omit 705d842 ARROW-1874: [GLib] Add garrow_array_unique()
omit 1fd3457 ARROW-1862: [GLib] Add GArrowDictionaryArray
omit ff8efbf ARROW-1869: [JAVA] Fix LowCostIdentityHashMap name
omit bbbbbfb ARROW-1844: [C++] Add initial Unique benchmarks for int64, variable-length strings
omit b92c435 ARROW-1684: [Python] Support selecting nested Parquet fields by any path prefix
omit 155bf07 ARROW-1854: [Python] Use pickle to serialize numpy arrays of objects.
omit ffb37db ARROW-1735: [C++] Test CastKernel writing into output array with non-zero offset
omit a75325a ARROW-1710: [Java] Remove Non-Nullable Vectors
omit b19e183 ARROW-1783: [Python] Provide a "component" dict representation of a serialized Python object with minimal allocation
omit 682e248 ARROW-1850: [C++] Use void* / const void* for buffers in file APIs
omit 6176350 [Release] Apache Arrow JavaScript 0.2.0
omit 42fc57b ARROW-1178: [C++/Python] Add option to set chunksize in TableBatchReader, Table.to_batches method
omit 85e2d89 ARROW-1758: [Python] Remove pickle=True option for object serialization
omit ebb6c76 ARROW-1859: [GLib] Add GArrowDictionaryDataType
omit bf1cf3b [Python] Add more detail to development docs (#1356)
omit ad82c9a ARROW-1853: [Plasma] Fix off-by-one error in retry processing
omit b20beff ARROW-1836: [C++] Remove deprecated static_visitor struct to avoid msvc C4996 warning
omit 82e42c5 ARROW-1777: [C++] Add ArrayData::Make static ctor for more convenient construction
omit aaa0443 ARROW-1855: [GLib] Add workaround for build failure on macOS
omit 05bfb26 ARROW-1849: [GLib] Add input checks to GArrowRecordBatch
omit ac4bb69 ARROW-1852: [C++] Make retrieval of Plasma manager fd a const operation
omit 6ec4f34 ARROW-1047: [Java] [FollowUp] Change ArrowMagic to be non-public class
omit ea0fb37 ARROW-1577: [JS] add ASF release scripts
omit 1524ed7 ARROW-1782: [Python] Add pyarrow.compress, decompress APIs
omit dda2d34 ARROW-1828: [C++] Hash kernel specialization for BooleanType
omit 9b2dc77 ARROW-1845: [Python] Expose Decimal128Type
omit 1516306 ARROW-1047: [Java] Add Generic Reader Interface for Stream Format
omit fc4e2c3 ARROW-1808: [C++] Make RecordBatch, Table virtual interfaces for column access
omit 3fb1491 ARROW-1268: [SITE][FOLLOWUP] Update Spark Post to Reflect Conf Change
omit 15ed080 ARROW-1703: [C++] Vendor exact version of jemalloc we depend on
omit cac0912 ARROW-1841: [JS] Update text-encoding-utf-8 and tslib for node ESModules support
omit c436376 ARROW-1838: [C++] Conform kernel API to use Datum for input and output
omit e98adc3 ARROW-1840: [Website] The installation command failed on Windows10 anaconda envir…
omit d887d91 ARROW-1830: [Python] Relax restriction that Parquet files in a dataset end in .parq or .parquet
omit 284e6c9 ARROW-1826: [JAVA] Avoid branching in copyFrom for fixed width scalars
omit cb5da9c ARROW-1778: [Python] Link parquet-cpp statically, privately in manylinux1 wheels
omit b3a3a74 ARROW-1693: [JS] Expand JavaScript implementation, build system, fix integration tests
omit d92735e ARROW-1834: [Doc] Build documentation in separate build folders
omit 9f9dc5b ARROW-1575: [Python] Add tests for pyarrow.column factory function
omit 37214ef ARROW-1827: [Java] Add checkstyle file and license template
omit 952ec05 ARROW-1773: [C++] Add casts from date/time types to compatible signed integers
omit 202e650 ARROW-1791: Limit generated data range to physical limits for temporal types
omit eb7be48 ARROW-1805: [Python] Ignore special private files when traversing ParquetDataset
omit f2806fa ARROW-1559: [C++] Add Unique kernel and refactor DictionaryBuilder to be a stateful kernel
omit cacbacd ARROW-1795: [Plasma] Create flag to make Plasma store use a single memory-mapped file.
omit ac26eb7 ARROW-1829: [Plasma] Fixes to eviction policy.
omit ca3acdc ARROW-1821: [INTEGRATION] Add integration test case for when Field has zero null count and optional validity buffer
omit 837150e ARROW-1476: [JAVA] Implement Final ValueVector Updates
omit 5bea983 ARROW-1717: [Java] Refactor JsonReader for new class hierarchy and fix integration tests
omit 9ee838a ARROW-1474:[JAVA] ValueVector hierarchy (Implementation Phase 2)
omit 42353ba ARROW-1473: ValueVector new hierarchy prototype (implementation phase 1)
omit 9812aea ARROW-1812: [C++] Plasma store modifies hash table while iterating during client disconnect
omit 1d951b5 ARROW-1809: [GLib] Use .xml instead of .sgml for GTK-Doc main file
omit 7255460 ARROW-1810: [Plasma] Remove unused Plasma test shell scripts
omit 9fb806c ARROW-1811: [C++/Python] Rename all Decimal based APIs to Decimal128
omit e3db5da ARROW-1806: [GLib] Add garrow_record_batch_writer_write_table()
omit b18bbeb ARROW-1371: [Website] Add "Powered By" page to the website
omit 8f2d152 ARROW-1802: [GLib] Support arrow-gpu
omit 6f8e287 ARROW-1743: [Python] Avoid non-array writeable-flag check
omit 4a33bad ARROW-1767: [C++] Support file reads and writes over 2GB on Windows
omit e8331f4 ARROW-1794: [C++/Python] Rename DecimalArray to Decimal128Array
omit 7adadd8 ARROW-1763: [Python] Implement __hash__ for DataType
omit 550a39f ARROW-1801: [Docs] Update install instructions to use red-data-tools repos
omit 357eedc ARROW-1781: Don't use brew when using the toolchain
omit 21112f8 ARROW-1800: [C++] Fix and simplify random_decimals
omit 7c205b0 ARROW-1787: [Python] Support reading parquet files into DataFrames in a backward compatible way
omit 2d34f34 ARROW-1788 Fix Plasma store abort bug on client disconnection
omit ed8aef2 ARROW-1793: fix a typo for README.md
omit 65a9055 ARROW-972: UnionArray in pyarrow
omit dffa486 ARROW-1709: [C++] Decimal.ToString is incorrect for negative scale
omit 78872a1 ARROW-1775: Ability to abort created but unsealed Plasma objects
omit 252a2a5 [GLib] Fix a typo in document
omit bfc0f24 ARROW-1776: [C++] Define arrow::gpu::CudaContext::bytes_allocated()
omit 3188d70 ARROW-1716: [Format/JSON] Use string integer value for Decimals in JSON
omit e631119 [Format] Fix link to Flatbuffers project in IPC.md
omit 3995eb3 ARROW-1768: [Python] Fix suppressed exception in ParquetWriter.__del__
omit 99ea353 ARROW-1771: [C++] ARROW-1749 Breaks Public API test in parquet-cpp
omit 0106f53 ARROW-1750: [C++] Remove the need for arrow/util/random.h
omit 9721930 ARROW-480: [Python] Implement RowGroupMetaData.ColumnChunk
omit b25b243 ARROW-1663: [Java] use consistent name for null and not-null in FixedSizeLis…
omit d7f1398 ARROW-1749: [C++] Handle range of Decimal128 values that require 39 digits to be displayed
omit 1ee73ef ARROW-1770: [GLib] Fix GLib compiler warning
omit ea4a8f5 ARROW-1714: [Python] Fix invalid serialization/deserialization None name Series
omit b513c8d ARROW-1762: [C++] Add note to readme about need to set LC_ALL on some Linux systems
omit 62190d7 ARROW-1756: [Python] Fix large file read/write error
omit fc7104f ARROW-1742: C++: clang-format is not detected correct on OSX anymore
omit b9a2ce9 ARROW-1765: [Doc] Use dependencies from conda in C++ docker build
omit 5d66576 ARROW-1727: [Format] Expand Arrow streaming format to permit deltas / additions to existing dictionaries
omit 82cd6e5 ARROW-1764: [Python] Add -c conda-forge for Windows dev installation instructions
omit 527af63 ARROW-1652: [JS] housekeeping, vector cleanup
omit 0373541 ARROW-1766: [GLib] Fix failing builds on OSX
omit 142e6ee ARROW-1455 [Python] Add Dockerfile for validating Dask integration
omit 9dc4c58 ARROW-1753: [Python] Provide for matching subclasses with register_type in serialization context
omit eca9924 ARROW-1658: [Python] Add boundschecking of dictionary indices when creating CategoricalBlock
omit 0880550 ARROW-1754: [Python] Fix buggy Parquet roundtrip when an index name is the same as a column name
omit 72b50bc [C++] Fix clang-format failure from ARROW-1409
omit 39243ff ARROW-1409: [Format] Remove page id from Buffer metadata, increment metadata version number
omit 30158ad ARROW-1718: [C++/Python] Implement casts from timestamp to date32/64, properly handle NumPy datetime64[D] -> date32
omit 1d36dd2 ARROW-1748: [GLib] Add GArrowRecordBatchBuilder
omit ec22228 ARROW-1747: [C++] Don't export symbols of statically linked libraries
omit f257b00 ARROW-1746: [Python] Add build dependencies for Arch Linux
omit b221a2c ARROW-1751: [Python] Pandas 0.21.0 introduces a breaking API change for MultiIndex construction
omit 74a934a ARROW-1689: [Python] Implement zero-copy conversions for DictionaryArray
omit cc03a45 ARROW-1745: [Plasma] Include gtest after plasma/compat.h in tests.
omit 2eb78b0 ARROW-1728: [C++] Run clang-format checks in Travis CI
omit 4db0046 ARROW-1555 [Python] Implement Dask exists function
omit 2ed886e ARROW-1723: [C++] add ARROW_STATIC to mark static libs on Windows
omit 59030fe ARROW-1730, ARROW-1738: [Python] Fix wrong datetime conversion
omit 2e04089 ARROW-1736: [GLib] Add GArrowCastOptions:allow-time-truncate
omit 3596a43 ARROW-1737: [GLib] Use G_DECLARE_DERIVABLE_TYPE
omit a385e2b ARROW-1739: [Python] Fix broken build due to using unittest.TestCase methods
omit 7abaa00 ARROW-587: Add fix version to PR merge tool
omit 6b16cca ARROW-1689: [Python] Allow user to request no data copies
omit c30a7e3 ARROW-1732: [Python] Permit creating record batches with no columns, test pandas roundtrips
omit 238881f ARROW-1675: [Python] Use RecordBatch.from_pandas in Feather write path
omit 48a6ff8 ARROW-1721: [Python] Implement null-mask check in places where it isn't supported in numpy_to_arrow.cc
omit 54d5c81 ARROW-1484: [C++/Python] Implement casts between date, time, timestamp units
omit 8148b6d ARROW-1726: [GLib] Add setup description to verify C GLib build
omit b2596f6 ARROW-1588: [C++/Format] Harden Decimal Format
omit ecb7605 ARROW-1134: [C++] Support for C++/CLI compilation, add NULLPTR define to avoid using nullptr in public headers
omit b08f7e3 ARROW-1711: [Python] Fix flake8 calls to lint the right directories
omit e876e17 ARROW-1720: [Python] Implement bounds check in chunk getter
omit 935a3cf ARROW-1654: [Python] Implement pickling for DataType, Field, Schema
omit 8e00ee9 ARROW-1114: [C++] Add simple RecordBatchBuilder class
omit 2b77b7c ARROW-507: [C++] Complete ListArray::FromArrays implementation, add unit tests
omit 4eb38a2 ARROW-571: [Python] Add unit test for incremental Parquet file building, improve docs
omit 8eb2a1b ARROW-1707: Update dev README after movement to GitBox
omit 6209489 ARROW-1708: [JS] Fix linter error
omit f40618d ARROW-1671: [C++] Deprecate arrow::MakeArray that returns Status, refactor existing code to new variant
omit 53dd0c8 ARROW-1087: [Python] Add pyarrow.get_include function. Bundle includes in all builds
omit 61d8a76 ARROW-641: [C++] Do not build io-hdfs-test if ARROW_HDFS is off
omit 9ee5508 ARROW-1522: [Python] Zero copy buffer deserialization
omit fbeaeea ARROW-1704: [GLib] Fix Go example failure
omit 05788d0 ARROW-1701: [Serialization] Support zero copy PyTorch Tensor serialization
omit 9d12c7c ARROW-1697: [GitHub] Add ISSUE_TEMPLATE.md
omit 3549fa8 ARROW-1683: [Python] Restore TimestampType to pyarrow namespace
omit 2ee900c ARROW-1702: Update jemalloc in manylinux1 build
omit 989aba6 ARROW-1698: [JS] File reader attempts to load the same dictionary batch more than once
omit deaa0cf ARROW-1686: [Docs] rsync contents of apidocs directory into site java directory
omit 971e99d ARROW-1695: [Serialization] Fix reference counting of numpy arrays created in custom serializer
omit a8f5185 ARROW-1666: [GLib] Enable gtk-doc on Travis CI Mac environment
omit d7bf5f2 ARROW-1690: [GLib] Add garrow_array_is_valid()
omit 298e343 ARROW-1673: [Python] Add support for numpy 'bool' type
omit a4813bd ARROW-1685: [GLib] Add GArrowTableBatchReader
omit a043018 ARROW-1678: [Python] Implement numpy.float16 SerDe
omit 8eb2b0e ARROW-1679: [GLib] Add garrow_record_batch_reader_read_next()
omit 1926bdc ARROW-1613: [Java] Alternative ArrowReader close to free resources but leave ReadChannel open
omit 2f2a0c1 ARROW-1676: [C++] Only pad null bitmap up to a factor of 8 bytes in Feather format
omit 1571fb4 ARROW-1677: [Blog] Post on ray and arrow serialization
omit e39b479 ARROW-1667: [GLib] Support Meson
omit a6a97a9 ARROW-1631 [C++] Add GRPC to ThirdpartyToolchain
omit 894f740 ARROW-1670: [Serialization] Speed up deserialization by getting rid of smart pointer overhead
omit dc53321 ARROW-1648: C++: Add cast from Dictionary[NullType] to NullType
omit 47e6ff6 ARROW-1665: [Serialization] Support more custom datatypes in the default serialization context
omit 434df8a ARROW-1488: [C++] Implement ArrayBuilder::Finish in terms of FinishInternal based on ArrayData
omit 0d1e69c ARROW-1630: [Serialization] Support Python datetime objects
omit 60cb1c3 ARROW-905 [Docs] Dockerize document generation
omit 4cb3e97 ARROW-1662: Move to using Homebrew/bundle and Brewfile
omit ee78cdc ARROW-1503: [Python] Add default serialization context, callbacks for pandas.Series/DataFrame
omit 166f0a8 ARROW-1635: Add release management guide
omit bf2e3ab ARROW-1593: [Python] Pass through preserve_index to RecordBatch.from_pandas in serialize_pandas
omit a0555c0 ARROW-1535: [Python] Enable sdist tarballs to be installed
omit 81a0e67 ARROW-1657: [C++] Multithreaded Read Test Failing on Arch Linux
omit 33d446d ARROW-1656: [C++] Endianness Macro is Incorrect on Windows And Mac
omit 208e798 ARROW-1594: [Python] Multithreaded conversions to Arrow in from_pandas
omit e31c2e3 ARROW-1585/ARROW-1586: [PYTHON] serialize_pandas roundtrip loses columns name
omit eaeb5d4 ARROW-1250: [Python] Add pyarrow.types module with useful type checking functions
omit b29b065 ARROW-1641: [C++] Hide std::mutex from public headers
omit 8309556 ARROW-1556: [C++] Move verbose AssertArraysEqual function used in PARQUET-1100 into arrow/test-util.h
omit 0a4c5b1 ARROW-1226: [C++] Docs cleaning in arrow/ipc. Doxyfile fixes, move ipc/metadata-internal.h symbols to internal NS
omit 898f5e2 ARROW-1602: [C++] Add IsValid method to pair with IsNull
omit ac1b66d ARROW-1540: Add NO_VALGRIND option to ADD_ARROW_TEST and disable valgrind in a few problematic tests
omit f8cdafa ARROW-1541: [C++] Fix race conditions in arrow_gpu with generated Flatbuffers files. Do not put generated files in source tree
omit 3ae4355 ARROW-1653: [Plasma] Use static cast to avoid compiler warning.
omit eaa9538 ARROW-1649: C++: Print number of nulls in PrettyPrint for NullArray
omit bea3495 ARROW-1539: [C++] Remove APIs deprecated as of 0.7.0 or prior releases
omit 51905e5 ARROW-1498: Add CONTRIBUTING.md to .github special directory
omit bd73166 ARROW-1526: [Python] Add unit test for fix in PARQUET-1100
omit 909a6f6 ARROW-1616: [Python] Add unit test for RecordBatchWriter.write dispatching to write_table or write_batch
omit ab6aa9a ARROW-1486: [C++] Make Column, RecordBatch, and Table non-copyable
omit 9805ada ARROW-1633: [Python] Support NumPy string and unicode types in pyarrow.array, Array.from_pandas
omit f0873a9 ARROW-942: Support running integration tests with both Python 2.7 and 3.6
omit 7511cfd ARROW-226: [C++] If opening an HDFS file fails and it does not exist, say so to help with debugging
omit 0f819fa ARROW-1603: [C++] Add BinaryArray::GetString helper method
omit 8b5b22b ARROW-1525: [C++] New compare functions that return boolean instead of Status
omit 81319d9 ARROW-1647: [Plasma] Make sure to read length header as int64_t instead of size_t.
omit dc129d6 ARROW-1627: New class to handle collection of BufferLedger(s) within …
omit 31d33e0 [Website] Update website with new committers
omit 87fc577 ARROW-1584: [C++/Python] Support Null type in IPC round trips, fix serialize_pandas on empty DataFrame
omit 592c4e8 [Website] jekyll must be run with JEKYLL_ENV=production
omit 67c6317 ARROW-950: [Website] Add Google Analytics tag to site
omit 8ceee56 ARROW-1543: [C++] Correct C++ tutorial to use std::unique_ptr instead of std::shared_ptr
omit ff39cb5 ARROW-1640: Fix HTTPS failures in cmake / libcurl caused by ca-certificates clash
omit 988338c ARROW-1634: [Website] Add release page for 0.7.1, update front page
omit 82eea49 [Java] Update pom versions to 0.8.0-SNAPSHOT
omit c905783 ARROW-1625: [Serialization] Support OrderedDict and defaultdict serialization
omit af167fd [Python] Update README.md to reflect that wheels are available on all platforms
omit 811e668 ARROW-1629: [C++] Add miscellaneous DCHECKs and minor changes based on infer tool output
omit 9aa6eb5 ARROW-1624: [C++] Fix build on LLVM 4.0, remove some clang warning suppressions
omit cc3b27c ARROW-1626 Add make targets to run the inter-procedural static analys…
omit ccbf644 ARROW-838: [Python] Expand pyarrow.array to handle NumPy arrays not originating in pandas
omit a03e093 ARROW-1600: [C++] Add Buffer constructor that wraps std::string
omit 7045b42 ARROW-1615 Added BUILD_WARNING_LEVEL and BUILD_WARNING_FLAGS to Setup…
omit 545496c ARROW-1619: [Java] Set lastSet in JsonFileReader
omit ac997fb ARROW-1618: [JAVA] Reduce Heap Usage (Phase 1)
omit bdfa65e ARROW-1620: Python: Download Boost in manylinux1 build from bintray
omit c358154 ARROW-1609: [Plasma] Xcode 9 compilation workaround
omit 686a8f7 ARROW-1607: [C++] Implement DictionaryBuilder for Decimals
omit 0e21f84 [maven-release-plugin] prepare release apache-arrow-0.7.1
omit fbabde5 [Release] Update CHANGELOG.md for 0.7.1
omit 3a53f93 [Release] Update version to 0.7.1-SNAPSHOT
omit 808a143 ARROW-1612:[GLib] Update readme for mac os
omit f9d1e1b ARROW-1611: [C++] Add BitmapWriter, do not perform out of bounds read in BitmapReader when length is 0
omit 5da6b87 ARROW-1606: [Python] Copy .lib files in addition to .dll when bundling libraries for Windows
omit b640cc0 ARROW-1610: C++/Python: Only call python-prefix if the default PYTHON_LIBRARY is not present
omit 39e487c ARROW-1608: Support Release verification script on macOS
omit 096b877 ARROW-1601: [C++] Do not read extra byte from validity bitmap, add internal::BitmapReader in lieu of macros
omit b41a4ee ARROW-1598: [C++] Fix diverged code comment in plasma tutorial
omit c0a5019 ARROW-1592: [GLib] Add GArrowUIntArrayBuilder
omit 8996a4f ARROW-1590: [JS] Flow TS Table method generics
omit 8fd73b4 ARROW-1595: [Python] Fix package dependency resolution issue causing broken builds
omit cfcee74 ARROW-1347: [JAVA] Return consistent child field name for List Vectors
omit c470c9c ARROW-1591: C++: Xcode 9 is not correctly detected
omit d154c10 ARROW-1578: [C++] Run lint checks in Travis CI much earlier at before_script stage to fail faster
omit 203fb63 ARROW-1500: [C++] Do not ignore return value from truncate in MemoryMa…
omit 975f32b ARROW-1497: [Java] Fix JsonReader to initialize count correctly
omit 9997a1a ARROW-1557 [Python] Validate names length in Table.from_arrays
omit 903d03b ARROW-1553: [JAVA] Implement setInitialCapacity for MapWriter
omit 2551050 ARROW-1554: [Python] Update Sphinx install page to note that VC14 runtime may need to be installed on Windows
omit c4f5a12 ARROW-1536:[C++] Do not transitively depend on libboost_system
omit d4685f4 ARROW-1547: [JAVA] Fix 8x memory over-allocation in BitVector
omit 2706b7f ARROW-1533: [JAVA] realloc should consider the existing buffer capacity for computing target memory requirement
omit aebc412 ARROW-1551: [Website] Add 0.7.0 changelog
omit b448f66 ARROW-1550: [Python] Followup: fix flake8 warning
omit 0d5e699 ARROW-1551: [Website] Website updates, blog post for 0.7.0
omit e1d9c7f ARROW-1550: [Python] Explicitly close owned file handles in ParquetWriter.close to avoid Windows flakiness
omit 4a65fea ARROW-1548: [GLib] Support bulk append in builder
omit 63e7966 ARROW-1464: [GLib] Add "Common build problems" section into the README.md of c_glib
omit b635d4c Remove garbage ")"
omit e093772 ARROW-1544: [JS] Export Vector types
omit bfe6579 ARROW-1546: [GLib] Support GLib 2.40 again
omit bf73d27 ARROW-1545: Remove deprecated args of builder
omit 59b24ba ARROW-559: Add release verification script for Linux
omit 72ad07e ARROW-1542: [C++] Install packages in temporary directory in MSVC build verification script
omit 96d451f ARROW-1537: [C++] Support building with full path install_name on macOS
omit d0b0b74 ARROW-1529: [GLib] Use Xcode 8.3 on Travis CI
omit 97f9029 [maven-release-plugin] prepare release apache-arrow-0.7.0
omit b671dcc [Release] Update CHANGELOG.md for 0.7.0
omit 576fb66 ARROW-1532: [Python] Referencing an Empty Schema causes a SegFault
omit cf1ac9c ARROW-1531: [C++] Return ToBytes by value from Decimal128
omit 3fbf760 ARROW-1530: [C++] Install arrow/util/parallel.h
omit b77af1a ARROW-1528: [GLib] Resolve recursive include dependency
omit 6a020a1 ARROW-1459: [Python] Use list values length to advance offset when reconstructing array of ndarrays
omit 4c008c2 ARROW-1511: [C++] Promote ArrayData, MakeArray to public API, deprecate MakePrimitiveArray
omit 18388d6 ARROW-1331: [JAVA] include package statement
omit b590c24 ARROW-1519: [C++] Move DecimalUtil functions to methods on the Int128 class
omit 9ede7fb ARROW-1527: Fix Travis CI JDK9 build
omit 7e95764 ARROW-1513: C++: Add cast from Dictionary to plain arrays
omit 94f6247 ARROW-1508: C++: Add support for FixedSizeBinaryType in DictionaryBuilder
omit a45b047 ARROW-1307: [Python] Expand IPC section to include object serialization, Feather format. Add Feather functions to API listing
omit 840b687 ARROW-1517: Remove unnecessary temporary in DecimalUtil::ToString function
omit a534e5d ARROW-1516: [GLib] Update document
omit 0ac81b5 ARROW-1515: [GLib] Detect version directly
omit c1492bf ARROW-1510: [GLib] Support cast
omit ce623a9 ARROW-1512: [C++] Fix API change in documentation
omit f211463 ARROW-1514: [C++] Fix a typo in document
omit 4a6a6cb ARROW-1359: [C++] Add flavor='spark' option to write_parquet that sanitizes schema field names
omit 947ca87 ARROW-594: [C++/Python] Write arrow::Table to stream and file writers
omit b5d510f ARROW-1358: Update sha{1, 256, 512} checksums per latest ASF release policy
omit 675e251 ARROW-1506: [C++] Add .pc for compute modules
omit 1706aab ARROW-1505: [GLib] Simplify arguments check
omit 875be96 ARROW-1504: [GLib] Add GArrowTimestampArray
omit 8b70ab0 ARROW-1507: [C++] Include arrow/array.h for arrow::internal::ArrayData
omit 0c8853f ARROW-1479: [JS] Expand JavaScript implementation
omit 8911a34 ARROW-1493: [C++] Flush stream in PrettyPrint functions
omit 5aca7b6 ARROW-1480: [Python] Improve performance of serializing sets
omit 11ebe93 ARROW-1494: [C++] Improve doxygen comments in arrow/table.h, note that RecordBatch::column returns new object
omit de2edc8 ARROW-1156: [C++/Python] Expand casting API, add UnaryKernel callable. Use Cast in appropriate places when converting from pandas
omit fe45c2b ARROW-1490: [Java] Allow failures for JDK9 for now
omit 6f27a64 ARROW-1467: [JAVA] Fix reset() and allocateNew() in Nullable Value Vectors t…
omit b698227 ARROW-622 [Python] deprecate timestamps_to_ms in .from_pandas()
omit 3f2fa03 ARROW-1430: [Python] Python CI build outside of a bash function scope, enable flake8 to fail build
omit b0b125f ARROW-229: [C++] Implement cast functions for numeric types, booleans
omit a9a80fe ARROW-941: Add "cold start" instructions for running integration tests
omit 6e5f7be ARROW-1435: [Python] Properly handle time zone metadata in Parquet round trips
omit 3033eac ARROW-1466: [C++] Implement PrettyPrint for DecimalArray
omit d9f895e ARROW-1446: [Python] Add (very slow) large memory unit test for int32 overflow in PARQUET-1090
omit 3d285c6 ARROW-1451: [C++] Add public API file for IO section in arrow/io/api.h
omit 54d624b ARROW-1405: [Python] Expose LoggingMemoryPool in Python API
omit 5abd123 ARROW-1468: [C++] Add primitive Append variants that accept std::vector<T>
omit a3514a3 ARROW-1396: [C++] Add PrettyPrint for schemas that outputs dictionaries
omit e9f3a12 ARROW-695: Add decimal integration test.
omit 9634f4b ARROW-1462: [GLib] Add GArrowTime32Array and GArrowTime64Array
omit f355354 ARROW-1317: [Python] Attempt to set Hadoop CLASSPATH when using JNI
omit 2660dda ARROW-1377: [Python] Add ParquetFile.scan_contents function to use for benchmarking
omit 2433289 ARROW-696: [C++] Support decimals in IPC and JSON reader/writer to enable integration tests
omit bea5ab0 ARROW-1442: [Website] Add note about nightly builds to /install
omit 1ba19c2 ARROW-1401: [C++] Add note to readme about ARROW_EXTRA_ERROR_CONTEXT
omit 3283d2a ARROW-1458: [Python] Document that create_parents=False is unsupported in HadoopFileSystem
omit df0ca4e ARROW-1461: [C++] Restore LLVM apt usage
omit ab328ec ARROW-1401: [C++] Add ARROW_EXTRA_ERROR_CONTEXT option
omit 338a187 ARROW-1461: [C++] Disable builds using LLVM apt repo until installation issues resolved
omit ec32013 ARROW-1417: [Python] Allow more generic filesystem objects to be passed to ParquetDataset
omit b1e56a2 ARROW-1453: [C++/Python] Support non-contiguous Tensors in WriteTensor
omit 0e0da74 ARROW-1460: [C++] Pin clang-format at LLVM 4.0
omit f391950 ARROW-1452: [C++] Restore DISALLOW_COPY_AND_ASSIGN usages removed in ARROW-1452 patch
omit cc30512 ARROW-1390: [Python] Add more serialization tests
omit e5aeb90 ARROW-1383: [C++] Add vector append variant to primitive array builders that accepts std::vector<bool>
omit 9968d95 ARROW-1400: [Python] Adding parquet.write_to_dataset() method for writing partitioned .parquet files
omit 6f2fd8d ARROW-1449: Implement Decimal using only Int128
omit 08b41f9 ARROW-1238: [Java] Adding Decimal type JSON read and write support
omit 016c45a ARROW-1450: [Python] Raise proper error if custom serialization handler fails
omit ebca1af ARROW-1452: [C++] Make macros in arrow/util/macros.h more unique
omit 1a8dafb ARROW-1447: [C++] Fix many include-what-you-use warnings
omit 848a0f7 ARROW-1444: [JAVA] fix last byte copy in BitVector splitAndTransfer
omit 4956e90 ARROW-1407: Fix bug where DictionaryEncoder can only encode vector le…
omit 75d1f61 ARROW-1413: [C++] Add include-what-you-use configuration
omit 28553b4 ARROW-1443: [Java] Fixed a small bug on ArrowBuf.setBytes with unsliced ByteBuffers
omit 8344f28 ARROW-1434: [Python] Support datetime64[D] numpy arrays
omit c6295f3 ARROW-1438: [Python] Pull serialization context through PlasmaClient put and get
omit 9ab0c95 ARROW-1441: [Site] Add Ruby to Flexible section
omit 78c952d ARROW-1351: Update CHANGELOG.md in 00-prepare.sh when creating release candidate
omit 6b391f0 ARROW-1432: [C++] Build bundled jemalloc functions with private prefix
omit f450025 ARROW-1381: [Python] Use FixedSizeBufferWriter in SerializedPyObject.to_buffer
omit d8c651c ARROW-1433: [C++] Simplify Array::Slice to be non-virtual
omit 7510ae6 ARROW-837: [Python] Add public pyarrow.allocate_buffer API. Rename FixedSizeBufferOutputStream
omit af78293 ARROW-1429: [Python] Open common Parquet metadata file using passed file system
omit 6af2931 ARROW-1302: C++: Set MAKE to make if not defined
omit 19bbf12 ARROW-1428: [C++] Append steps to clone source code to README.md
omit 59fb8d0 ARROW-1427: [GLib] Add arrow cpp link to readme
omit 441f965 ARROW-1418: [Python] Introduce SerializationContext to register custom serialization callbacks
omit 254078e ARROW-1426: [Site] Fix the title of the top page.
omit 5cda693 ARROW-1402: [C++] Deprecate APIs which return std::shared_ptr<MutableBuffer> in favor of std::shared_ptr<Buffer>
omit a009aab ARROW-1421: [Python] Extend Python serialization API to accept non-list types
omit e6456b6 ARROW-1344: [C++] Do not permit writing to closed BufferOutputStream
omit 0ced74e ARROW-1363: [C++] Use buffer layout from dictionary index type in IPC messages
omit c0beb87 ARROW-1415: [GLib] Support date32 and date64
omit 0728148 ARROW-1364: [C++] IPC support machinery for record batch roundtrips to GPU device memory
omit c027a03 ARROW-1412: [Plasma] Add higher level API for putting and getting Python objects
omit 32e2668 ARROW-1414: [GLib] Cast after status check
omit f250d46 ARROW-1416: Clarify memory layout documentation
omit 6cd2a17 ARROW-1419: [GLib] Suppress sign-conversion warnings
omit 26d4e3f ARROW-1399: [C++] Add CUDA build version defines in public headers
omit b36aab5 ARROW-1411: [Python] Booleans in Float Columns cause Segfault
omit ea503a5 ARROW-1379: [Java] adding maven-dependency-plugin and fixing all reported dependency errors
omit a3607d2 ARROW-1410: Remove MAP_POPULATE flag when mmapping files in Plasma store.
omit f50f2ea ARROW-1408: [C++] IPC public API cleanup, refactoring. Add SerializeSchema, ReadSchema public APIs
omit 750b77d ARROW-786: [Format] In-memory format for 128-bit Decimals, handling of sign bit
omit b312697 ARROW-1386: [C++] Unpin CMake version in MSVC toolchain builds
omit 2c3a5f4 ARROW-1392: [C++] Add GPU IO interfaces for CUDA
omit 3c70ff1 ARROW-1384: [C++] Add SerializeRecordBatch API for writing a record batch as an IPC message to a new buffer
omit 5303594 ARROW-1395: [C++/Python] Remove APIs deprecated from 0.5.0 onward
omit 4e0aa3c ARROW-1387: [C++] Set up GPU leaf library, add unit test module for CUDA tests
omit 6ad976e ARROW-1375: [C++] Remove dependency on msvc version for Snappy build
omit de7c671 ARROW-1357: [Python] Account for chunked arrays when converting lists back to pandas form
omit b50f235 ARROW-759: [Python] Serializing large class of Python objects in Apache Arrow
omit 10f7158 ARROW-1372: [Plasma] enable HUGETLB support on Linux to improve plasma put performance
omit 652fd36 ARROW-1366: [Plasma] Define entry point for the plasma store
omit e1bad9f [C++] Fix a typo in plasma.md
omit c9805d6 ARROW-1373: Implement getBuffer() methods for ValueVector
omit 4ef7c89 ARROW-1355: [Java] Make Arrow buildable with jdk9
omit 3c5290a ARROW-1365: [Python] Remove outdated pyarrow.jemalloc_memory_pool example. Update API doc site build instructions
omit c0fa8e0 [Python] DOC: Fix Parquet docs to use pyarrow.parquet namespace for write_table
omit 4471dc9 [C++] DOC: Fix a typo in plasma.md
omit b78e2ef ARROW-1353: [Website] Update website for 0.6.0 release and add short release blog post
omit c2fb9cb ARROW-1356: [Website] Add new committers
omit 31457ae ARROW-801: Provide direct access to underlying buffer memory addresses
omit 94b7cfa ARROW-1339: [C++] Use of boost::filesystem::path to handle file paths
omit a2f4323 ARROW-1352: [Integration] Added specific formatting for producer consumer output
omit 142f74e ARROW-1331: [JAVA] Refactor unit tests
omit 6135958 ARROW-1348: [C++/Python] Release verification script for Windows
omit 4db732c [maven-release-plugin] prepare for next development iteration
omit b173334 [maven-release-plugin] prepare release apache-arrow-0.6.0
omit 63954c0 ARROW-1350: [C++] Do not exclude Plasma source tree from source release
omit 2143349 ARROW-1242: [JAVA] - upgrade jackson to mitigate security vulnerabilities (take 2)
omit b795e5c ARROW-1240: [JAVA] security: upgrade logback to address CVE-2017-5929 (take 2)
omit 2972c9d ARROW-1342: [Python] Support strided ndarrays in pandas conversion from nested lists
omit e44ede8 ARROW-1343: [Java] Aligning serialized schema, end of buffers in RecordBatches
omit 86154f0 ARROW-1340: [Java] Fix NullableMapVector field metadata
omit 7fdbcc6 ARROW-1243: [JAVA] update all libs to latest versions
omit a9c2f19 ARROW-1242: [JAVA] - upgrade jackson to mitigate security vulnerabilities
omit 6e26701 ARROW-439: [Python] Add option in "to_pandas" conversions to yield Categorical from String/Binary arrays
omit 2615b47 ARROW-1306: [C++] Use UTF8 filenames in local file error messages
omit 20cee70 ARROW-1338: [Python] Do not close RecordBatchWriter on dealloc in case sink is no longer valid
omit 5281a82 ARROW-1334: [C++] Add alternate Table constructor that takes vector of Array
omit 939957f ARROW-1335: [C++] Add offset to PrimitiveArray::raw_values to make consistent with other raw_values
omit 03dcce4 ARROW-1173: [Plasma] Add blog post describing Plasma object store
omit 66ab6b2 ARROW-1309: [Python] Handle nested lists with all None values in Array.from_pandas
omit 02ab748 ARROW-1336: [C++] Add arrow::schema factory function, simplify some awkward constructors
omit 2015198 ARROW-1263: [C++] Get CPU info on Windows; Resolve patching whitespac…
omit 0b91cad ARROW-622: [Python] Add coerce_timestamps option to parquet.write_table, deprecate timestamps_to_ms argument
omit 7a4026a ARROW-1304: [Java] Fix Indentation, WhitespaceAround and EmptyLineSeparator checkstyle warnings in Java
omit f9d9833 ARROW-1283: [JAVA] Allow VectorSchemaRoot to close more than once
omit c0acb86 ARROW-1333: [Plasma] Example code for using Plasma to sort a DataFrame
omit 619472e ARROW-1225: [Python] Decode bytes to utf8 unicode if possible when passing explicit utf8 type to pyarrow.array
omit 3200e91 ARROW-1327: [Python] Always release GIL before calling check_status in Cython
omit 25439e7 ARROW-1300: [JAVA] Fix Tests for ListVector
omit 3bc7d46 ARROW-1296: [Java] Fix allocationSizeInBytes in FixedValueVectors.res…
omit 717bed0 ARROW-1328: [Python] Set correct Arrow type when coercing to milliseconds and passing explicit type
omit aa5d417 ARROW-1326: [Python] Fix Sphinx Build in Travis CI, treat Sphinx warnings as errors
omit a388ddf ARROW-1330: [Plasma] Turn on plasma tests on manylinux1
omit f775af7 ARROW-1312: [Python] Follow-up: do not use jemalloc in manylinux1 builds
omit 3732324 ARROW-1224: [Format] Clarify language around buffer padding and align…
omit 1874a8b ARROW-1310: [JAVA] revert changes made in ARROW-886
omit 84b7a0d ARROW-1312: [C++] Make ARROW_JEMALLOC OFF by default until ARROW-1282 is resolved
omit 21a0191 ARROW-1323: [GLib] Add garrow_boolean_array_get_values()
omit 93b51a0 ARROW-1315: [GLib] Add missing status check for arrow::ArrayBuilder::Finish()
omit ee928d2 ARROW-1211: [C++] Enable builder classes to automatically use the default memory pool
omit 5917e07 ARROW-1305: [GLib] Add GArrowIntArrayBuilder
omit b95bed0 ARROW-1303: [C++] Support downloading Boost
omit e50b6ae ARROW-1308: [C++] Link utility executables to Arrow shared library if ARROW_BUILD_STATIC=off
omit 7e7861c ARROW-1257: Plasma documentation
omit e5ed31f ARROW-1093: [Python] Run flake8 in Travis CI. Add note about development to README
omit aa1d753 ARROW-573: [C++/Python] Implement IPC metadata handling for ordered dictionaries, pandas conversions
omit b8754eb ARROW-884: [C++] Exclude internal namespaces from generated Doxygen docs
omit e1d574c ARROW-1301: [C++/Python] More complete filesystem API for HDFS
omit 3a84653 ARROW-1265: [Plasma] Clean up all resources on SIGTERM to keep valgrind output clean
omit b5ff2f6 ARROW-1251: [C++] Update C++ README to account for toolchain evolution
omit 900105a ARROW-187: [C++] Add development style notes to C++ README, note about esoteric exceptions in constructors
omit af2aeaf ARROW-1213: [Python] Support s3fs filesystem for Amazon S3 in ParquetDataset
omit b4eec62 ARROW-932: [Python] Fix MSVC compiler warnings, build Python with /WX and -Werror in CI
omit 2288bfc ARROW-1264: [Python] Raise exception in Python instead of aborting if cannot connect to Plasma store
omit 4108bda ARROW-1291: [Python] Cast non-string DataFrame columns to strings in RecordBatch/Table.from_pandas
omit ea1b67c ARROW-1294: [C++] Pin cmake=3.8.0 in MSVC toolchain build
omit b4e9ba1 ARROW-968: [Python] Support slices in RecordBatch.__getitem__
omit 5aea3a3 ARROW-1287: [Python] Implement whence argument for pyarrow.NativeFile.seek
omit ec32617 ARROW-1192: [JAVA] Use buffer slice for splitAndTransfer in List and Union Vectors.
omit 05af640 ARROW-276: [JAVA] Nullable Vectors should extend BaseValueVector and not Bas…
omit 1dd0f5f ARROW-1267: [Java] Handle zero length case in BitVector.splitAndTransfer
omit 3b14765 ARROW-1289: [Python] Add PYARROW_BUILD_PLASMA CMake option, follow semantics of --with-parquet
omit 44855bb ARROW-1273: [Python] Add Parquet read_metadata, read_schema convenience functions
omit 4df2a0b ARROW-1290: [C++] Double buffer size when exceeding capacity in arrow::BufferBuilder as in array builders
omit 33c85cd [Java] Fix letter case in rat plugin config
omit 8841bc0 ARROW-1281: [C++/Python] Add Docker setup for testing HDFS IO in C++ and Python
omit ff6c6e0 ARROW-1276: enable parquet serialization of empty DataFrames
omit b7639c1 ARROW-1285: [Python] Delete any incomplete file when attempt to write single Parquet file fails
omit f72279b ARROW-1288: Fix many license headers to use proper ASF one
omit 7b3378f ARROW-1204: [C++] Remove WholeProgramOptimization(/GL) compilation fl…
omit cae3510 ARROW-1274: [C++] Fix CMake >= 3.3 warning. Also add option to suppress ExternalProject output
omit d76e43e ARROW-1268: [WEBSITE] Added blog post for Spark integration toPandas()
omit dca5d96 ARROW-1275: [C++] Default Snappy static lib suffix updated to "_static"
omit 5708cd1 [Java] Fix some typos in code comments and exception messages
omit 676a4a9 ARROW-1255: [Plasma] Fix typo in plasma protocol; add DCHECK for ReadXXX in plasma protocol.
omit 2eeaa95 ARROW-1248: [Python] Suppress return-type-c-linkage warning in Cython clang builds
omit e9e17b5 ARROW-1258: [C++] Suppress Clang dlmalloc compiler warnings
omit f90fa49 [Website] Fix link to 0.5.0 post on install page
omit ed54dce ARROW-1253: [C++/Python] Speed up C++ / Python builds by using conda-forge toolchain for thirdparty libraries
omit 08cec90 ARROW-1252: [Website] Updates for 0.5.0 and short blog post summarizing the release
omit 07b89bf ARROW-1219: [C++] Use Google C++ code formatting
omit 204f148 ARROW-1260: [Plasma] Use factory method to create Python PlasmaClient
omit 11c92bf ARROW-1246: [Format] Draft Flatbuffer metadata description for Map
omit 9e692af ARROW-1245: [Integration] Enable JavaTester in Integration tests
omit 886e2af ARROW-1259: [Plasma] Speed up plasma tests
omit ecdc86b ARROW-1249: [JAVA] expose fillEmpties from Nullable variable length vectors
omit 6042c48 ARROW-1195: [C++] CpuInfo init with cores number, frequency and cache…
omit a94f471 ARROW-1149: [Plasma] Create Cython client library for Plasma
omit 05f7058 ARROW-1239: [JAVA] upgrading git-commit-id-plugin
omit 457bb07 ARROW-1237: [JAVA] expose the ability to set lastSet
omit e1b098e ARROW-1240: [JAVA] security: upgrade slf4j to 1.7.25 and logback to 1.2.3
omit fabf7fb ARROW-1241: [C++] Appveyor build matrix extended with Visual Studio 2…
omit 2c81015 [C++] Restore Plasma source tree after 0.5.0 release
omit 9b26ed8 [maven-release-plugin] prepare for next development iteration
omit e9f76e1 [maven-release-plugin] prepare release apache-arrow-0.5.0
omit 62ef2cd [C++] Remove Plasma source tree for 0.5.0 release pending IP Clearance
omit db181d1 ARROW-1244: Exclude C++ Plasma source tree when creating source release
omit 5aa0809 [GLib] Update rat_exclusion_files.txt
omit 2c5b412 ARROW-1167: [Python] Support chunking string columns in Table.from_pandas
omit 6999dbd ARROW-935: [Java] Build Javadoc and site with OpenJDK8 in Java CI build
omit fe9c7ef ARROW-1236: Fix lib path in pkg-config file
omit c5a89b7 ARROW-1120: Support for writing timestamp(ns) to Int96
omit 362e754 ARROW-1103: [Python] Support read_pandas (with index metadata) on directory of Parquet files
omit a73252d ARROW-1235: [C++] Make operator<< for Array/Status and std::ostream inline
omit 8152433 ARROW-1188: [Python] Handle Feather case where category values are null type
omit 6035d9b ARROW-1233: [C++] Validate libs availability in conda toolchain
omit a1c8b83 ARROW-1079: [Python] Filter out private directories when building Parquet dataset manifest
omit b4d34f8 ARROW-1191: [JAVA] Implement getField() method for complex readers
omit 1541a08 ARROW-1177: [C++] Check for int32 offset overflow in ListBuilder, BinaryBuilder
omit 0396240 ARROW-1190: [JAVA] Fixing VectorLoader for duplicate field names
omit ea9bc83 ARROW-1229: [GLib] Use "read" instead of "get" for reading record batch
omit b474cac ARROW-1221: [C++] Add run_clang_format.py script, exclusions file. Pin clang-format-3.9
omit 5fbfd8e ARROW-597: [Python] Add read_pandas convenience to stream and file reader classes. Add some data type docstrings
omit e370174 ARROW-1222: [Python] Raise exception when passing unsupported Python object type to pyarrow.array
omit 8644ee1 ARROW-1227: [GLib] Support GOutputStream
omit d538426 ARROW-1228: [GLib] Fix test file name
omit cdf7db9 ARROW-1223: [GLib] Fix function name that returns wrapped object
omit 50b518a ARROW-1183: [Python] Implement pandas conversions between Time32, Time64 types and datetime.time
omit bf01966 [Python] Correct function name in use with pandas documentation
omit f266f17 ARROW-1220: [C++] Cmake script errors out if lib is not found under *…
omit e438e15 ARROW-1217: [GLib] Add GInputStream based arrow::io::RandomAccessFile
omit dc4216f ARROW-575: Python: Auto-detect nested lists and nested numpy arrays in Pandas
omit bb0a758 ARROW-1214: [Python/C++] Add C++ functionality to more easily handle encapsulated IPC messages, Python bindings
omit 099f61c ARROW-1218: [C++] Fix arrow build if no compression library is used
omit 9ff39f3 ARROW-1216: [Python] Fix creating numpy array from arrow buffers on python 2
omit d46b7ea ARROW-992: [Python] Try to set a __version__ in in-place local builds
omit f62db83 ARROW-1100: [Python] Add mode property to NativeFile
omit bfe3959 ARROW-962: [Python] Add schema attribute to RecordBatchFileReader
omit cb31b8b ARROW-1215: [Python] Generate documentation for class members in API Reference
omit 8cad26e ARROW-1200: C++: Switch DictionaryBuilder to signed integers
omit c7e0995 ARROW-1208: [C++] Install zstd from conda for Toolchain Appveyor buil…
omit 248a9d8 ARROW-1212: [GLib] Add garrow_binary_array_get_offsets_buffer()
omit 85892a2 ARROW-1187: Python: Feather: Serialize a DataFrame with None column
omit 74bc873 ARROW-1150: Silence AdaptiveIntBuilder compiler warning on MSVC
omit 28e06d8 ARROW-1194: [Python] Expose MockOutputStream in pyarrow.
omit f0ecc06 ARROW-1208: [C++] Temporary remove conda's build of zstd from Toolcha…
omit afb1928 ARROW-1206: [C++] Add finer grained control of compression library support, do not expose symbols which may not be built in compression.h
omit e8c09c6 ARROW-1205: C++: Reference to type objects in ArrayLoader may cause segmentation faults
omit dbedc8d ARROW-1186: [C++] Add support to build only Parquet dependencies
omit 8452071 ARROW-1199: [C++] Implement mutable POD struct for Array data
omit ad57ea8 ARROW-1125: Python: Add public C++ API to unwrap PyArrow object
omit 471a85f ARROW-1168: [Python] pandas metadata may contain "mixed" data types
omit bc16e0e ARROW-1196: [C++] Release, Debug, Toolchain, NMake Generator Appveyor…
omit cab07c2 ARROW-1202: [C++] Remove semicolons from status macros
omit f73c1c3 ARROW-1201: [Python] Incomplete Python types cause a core dump when repr-ing
omit 7870804 ARROW-1074: Support lists and arrays in pandas DataFrames without explicit schema
omit e894532 ARROW-1197: [GLib] Fix a bug that record batch related functions for C++ aren't included
omit b6b876c ARROW-1193: [C++] Support pkg-config for arrow_python.so
omit 3309d12 ARROW-1174: [GLib] Fix ListArray test failure
omit c398fda ARROW-462: [C++] Implement in-memory conversions between non-nested primitive types and DictionaryArray equivalent
omit 83a4405 ARROW-599: [C++] Lz4 compression codec support
omit 00a7d55 ARROW-1185: [C++] Status class cleanup, warn_unused_result attribute and Clang warning fixes
omit 7d86c28 ARROW-693: [Java] Add dictionary support to JSON reader and writer
omit cbbd04b ARROW-1172: [C++] Refactor to use unique_ptr for builders
omit edcded3 ARROW-1148: [C++] Raise minimum CMake version to 3.2
omit 7c18ddd ARROW-966: [Python] Also accept Field instance in pyarrow.list_
omit e5a08dd ARROW-1098. [Format] modify document mistake
omit 681479d ARROW-1182: C++: Specify BUILD_BYPRODUCTS for zlib and zstd
omit cdee23c ARROW-600: ZSTD compression lib support
omit e18abac ARROW-1181: [Python] Parquet multiindex test should be optional
omit a6d0c26 ARROW-1180: [GLib] Fix a returning invalid address bug in garrow_tensor_get_dimension_name()
omit 2c3e8b0 ARROW-692: Integration test data generator for dictionary types
omit 2e5ddfe ARROW-1179: C++: Add missing virtual destructors
omit 9e4906f ARROW-1160: C++: Implement DictionaryBuilder
omit e268ce8 ARROW-915: [Python] Struct Array reads limited support
omit 96e7e99 ARROW-960: Add section on how to develop with pip
omit c294ec3 ARROW-1125: partial schemas for Table.from_pandas
omit 930db87 ARROW-1169: [C++] jemalloc externalproject doesn't build with CMake's ninja generator
omit 456330f ARROW-599: CMake support of LZ4 compression lib
omit 9f500af ARROW-1170: C++: Link to pthread on ARROW_JEMALLOC=OFF
omit af83c45 ARROW-1166: Fix errors in example and missing reference in Layout.md
omit 6958252 ARROW-1165: [C++] Refactor PythonDecimalToArrowDecimal to not use templates
omit 65558db ARROW-1162: Empty data vector transfer between list vectors should no…
omit bddb219 ARROW-834: Python Support creating from iterables
omit a588938 ARROW-1159: [C++] Use dllimport for visibility when not building Arrow library
omit b065228 ARROW-1154: [C++] Import miscellaneous computational utility code from parquet-cpp
omit cb5f2b9 ARROW-1157: C++/Python: Decimal templates are not correctly exported on OSX
omit 3e754a0 ARROW-1155: [Python] Add null check when user improperly instantiates ArrayValue instances
omit bfe15db ARROW-1152: [Cython] read_tensor should work with a readable file
omit ec6e183 ARROW-1151: [C++] Add branch prediction to RETURN_NOT_OK
omit 5de6eb5 ARROW-978: [Python] - Change python documentation sphinx theme to bootstrap
omit fc3f8c2 ARROW-1131: [Python] Enable the Parquet unit tests by default if the extension imports
omit bea30d6 ARROW-1113: [C++] Upgrade to gflags 2.2.0, use tarball instead of git tag
omit f3bcf76 ARROW-1145: [GLib] Add get_values()
omit 41524d6 ARROW-1135: [C++] Use clang 4.0 in one of the Linux builds
omit 73007de ARROW-1147: [C++] Allow optional vendoring of flatbuffers in plasma
omit 98f7cac ARROW-1142: [C++] Port over compression toolchain and interfaces from parquet-cpp, use Arrow-style error handling
omit 1514016 ARROW-1146: Add .gitignore for *_generated.h files in src/plasma/format
omit b7befeb ARROW-1132: [Python] Unable to write pandas DataFrame w/MultiIndex containing duplicate values to parquet
omit 8bf567e ARROW-1136: [C++] Add null checks for invalid streams
omit 6768f52 ARROW-1139: Silence dlmalloc warning on clang-4.0
omit e209e58 ARROW-1144: [C++] Remove unused variable
omit 074dde4 ARROW-1143: C++: Fix comparison of NullArray
omit c1ec0c7 ARROW-1039: Python: Remove duplicate column
omit a16c124 ARROW-1137: Python: Ensure Pandas roundtrip of all-None column
omit 608b89e ARROW-1073: C++: Adaptive integer builder
omit 222628c ARROW-1140: [C++] Allow optional build of plasma
omit 5e34309 ARROW-1104: Integrate in-memory object store into arrow
omit ef579ca ARROW-1123: Make jemalloc the default allocator
omit f0f1ca6 ARROW-1138: Travis: Use OpenJDK7 instead of OracleJDK7
omit 86c67d0 ARROW-1129: [C++] Fix gflags issue in Linux/macOS toolchain builds
omit b5e8a48 ARROW-1128: [Docs] command to build a wheel is not properly rendered
omit d874d4e ARROW-1081: Fill null_bitmap correctly in TestBase
omit 5be05ac ARROW-742: [C++] Use gflags from toolchain; Resolve cmake FindGFlags …
omit 1a23419 ARROW-1124: Increase numpy dependency to >=1.10.x
omit d54bf48 ARROW-1122: [Website] Change timestamp to yield correct Jekyll date
omit 3f26dfa ARROW-1096: [C++] CreateFileMapping maximum size calculation issue
omit 5b66c25 ARROW-1122: [Website] Add turbodbc + arrow blog post
omit d1de66b ARROW-1118: [Site] Website updates for 0.4.1
omit 697df1b ARROW-1117: [Docs] Minor issues in GLib README
omit d25ea63 ARROW-1115: [C++] use CCACHE_FOUND value for ccache path
omit 25ba44c ARROW-460: [C++] JSON read/write for dictionaries
omit 2a2b109 ARROW-742: [C++] std::wstring_convert exceptions handling
omit ac64853 ARROW-1112: [JAVA] Set lastSet for VarLength and List vectors when loading
omit 11deee6 ARROW-1111: [JAVA] Make aligning buffers optional, and allow -1 for unknown null count
omit c6cf124 ARROW-1110: [JAVA] make union vector naming consistent
omit 0e680f0 ARROW-1109: [JAVA] transferOwnership fails when readerIndex is not 0
omit 06c26a2 ARROW-1108: [JAVA] Check if ArrowBuf is empty buffer in getActualConsumedMemory() and getPossibleConsumedMemory()
omit ae6142d ARROW-1107: [JAVA] Fix getField() for NullableMapVector
omit a44d584 ARROW-1102: Make MessageSerializer.serializeMessage() public
omit a382034 ARROW-1101: Implement write(TypeHolder) methods in UnionListWriter
omit 7a7b0c2 ARROW-1048: Use existing LD_LIBRARY_PATH in source release script to accommodate non-system toolchain libs
omit e344066 ARROW-1095: Add Arrow logo PNG to website img folder
omit 41b58e4 [maven-release-plugin] prepare for next development iteration
omit 4631543 [maven-release-plugin] prepare release apache-arrow-0.4.1
omit 2a12482 ARROW-1094: [C++] Always truncate buffer read in ReadableFile::Read if actual number of bytes less than request
omit ac54075 ARROW-1088: [Python] Only test unicode filenames if system supports them
omit 402baa4 ARROW-1092: More Decimal and scale flipped follow-up
omit c3e865d ARROW-1090: Improve build_ext usability with --bundle-arrow-cpp
omit 5589dda ARROW-1080: C++: Add tutorial about converting to/from row-wise representation
omit 1a72acd [Doc] Fix a few links for files moved in ARROW-957
omit 44dba71 ARROW-1020: [Format] Revise language for Timestamp type in Schema.fbs to avoid possible confusion about tz-naive timestamps
omit a367fd4 ARROW-1086: include additional pxd files during package build
omit 4e134e5 ARROW-1091: Decimal scale and precision are flipped
omit 316930c ARROW-1056: [Python] Ignore pandas index in parquet+hdfs test
omit cfaddab ARROW-1050: [C++] Export arrow::ValidateArray
omit a44155d ARROW-986: [Format] Add brief explanation of dictionary batches in IPC.md
omit 8f2b44b ARROW-1051: [Python] Opt in to Parquet unit tests to avoid accidental suppression of dynamic linking errors
omit a81aefb ARROW-1082: [GLib] Add CI on macOS
omit 931a877 ARROW-1070: [C++] Use physical types for Feather date/time types
omit 0576ff5 ARROW-1085: [java] Follow up on template cleanup. Missing method for …
omit ba97f34 ARROW-1084: Implementations of BufferAllocator should handle Netty's OutOfDirectMemoryError
omit 092afb6 ARROW-990: [JS] Add tslint support for linting TypeScript
omit 5c155c3 ARROW-1075: [GLib] Fix build error on macOS
omit 8229688 ARROW-1078: [Python] Account for Apache Parquet shared library consolidation
omit 530f0da [Doc] Change cpp api doc, std:shared_pointer_cast to std::static_pointer_cast
omit 51b6bf2 ARROW-897: [GLib] Extract CI configuration for GLib
omit 03e8b54 ARROW-1069: Add instructions for publishing maven artifacts
omit 8a700cc ARROW-1063: [Website] Updates for 0.4.0 release, release posting
omit 4e4435e ARROW-424: [C++] Make ReadAt, Write HDFS functions threadsafe
omit 078357a ARROW-1066: [Python] pandas 0.20.1 deprecation of pd.lib causes a warning on import
omit 1cb18d5 ARROW-1061: [C++] Harden decimal parsing against invalid strings
omit 33117d9 ARROW-1034: [PYTHON] Resolve wheel build issues on Windows
omit aa652cb ARROW-1060: [Python] Add unit tests for reference counts in memoryview interface
omit 84b7ee1 ARROW-1057: Fix cmake warning and msvc debug asserts
omit d2cc199 ARROW-1062: [GLib] Follow API changes in examples
omit b06602d ARROW-1049: [java] vector template cleanup
omit a6e77f4 ARROW-1054: [Python] Fix test failure on pandas 0.19.2, some refactoring
omit cf4ef5e Increment version to 0.5.0-SNAPSHOT
omit a8f8ba0 [maven-release-plugin] prepare release apache-arrow-0.4.0
omit ff72951 ARROW-1053: [Python] Remove unnecessary Py_INCREF in PyBuffer causing memory leak
omit 37cdc6e ARROW-970: [Python] Nicer experience if user accidentally calls pyarrow.Table ctor directly
omit 0eec40a ARROW-1046: [Python] Reconcile pandas metadata spec
omit 62a17b7 ARROW-1044: [GLib] Support Feather
omit fee4475 ARROW-1029: [Python] Fixes for building pyarrow with Parquet support on MSVC. Add to appveyor build
omit a4f3259 ARROW-1030: Python: Account for library versioning in parquet-cpp
omit c4086fe ARROW-997: [Java] Implementing transferPair for FixedSizeListVector
omit bed0197 ARROW-881: [Python] Reconstruct Pandas DataFrame indexes using metadata
omit e7e8d61 ARROW-1040: [GLib] Support tensor IO
omit 49c5398 ARROW-1038: [GLib] Follow writer name change
omit 8a8e7bb ARROW-1037: [GLib] Follow reader name change
omit ce0bb53 ARROW-1002: [C++] Fix inconsistency with padding at start of IPC file format
omit 47e289a ARROW-961: [Python] Rename InMemoryOutputStream to BufferOutputStream
omit 86a9055 ARROW-182: [C++] Factor out Array::Validate into a separate function
omit 222cbfe ARROW-998: [Format] Clarify that the IPC file footer contains an additional copy of the schema
omit abbd815 ARROW-1025: [Website] Improved changelog for website, include git shortlog
omit b23b864 ARROW-1015 [Java] Schema-level metadata
omit 681afab ARROW-977: [java] Add Timezone aware timestamp vectors
omit 4381845 ARROW-1033: [Python] pytest discovers scripts/test_leak.py
omit ba9348f ARROW-1031: [GLib] Support pretty print
omit edfb2dc ARROW-1027: [Python] Allow negative indexing in fields/columns on pyarrow Table and Schema objects
omit 0543379 ARROW-1028: [Python] Fix IPC docs per API changes
omit 37dbddf ARROW-1004: [Python] Add conversions for numpy object arrays with integers and floats
omit 393f46a ARROW-1023: Python: Fix bundling of arrow-cpp for macOS
omit c7839e9 ARROW-1017: [Python] Fix memory leaks in conversion to pandas.DataFrame
omit 852ee4f ARROW-1024: Python: Update build time numpy version to 1.10.1
omit d8d3d84 ARROW-1022: [Python] Add multithreaded read option to read_feather
omit 5739e04 ARROW-1008: [C++] Add abstract stream writer and reader C++ APIs. Give clearer names to IPC reader/writer classes
omit 99ff240 ARROW-1011: [FORMAT] fix typo and mistakes in Layout.md
omit dbbbc66 ARROW-988 [JS] Add entry to Travis CI matrix
omit 9e875a6 ARROW-819: Public Cython and C++ API in the style of lxml, arrow::py::import_pyarrow method
omit 95ee96b ARROW-1016: Python: Include C++ headers (optionally) in wheels
omit 05e8f68 ARROW-1010: [Website] Provide for translations without repeating blog post in blogroll
omit a4f29f3 ARROW-29: [C++] FindRe2 cmake module
omit b066660 ARROW-996: [Website] Add 0.3.0 release announce in Japanese
omit 010bd22 ARROW-482 [Java] Exposing custom field metadata
omit a8338f1 ARROW-995: [Website] Fix a typo
omit a7722dc ARROW-993: [GLib] Add missing error checks in Go examples
omit 1c6f3ef ARROW-813: [Python] setup.py sdist must also bundle dependent cmake m…
omit 84413b0 ARROW-901: [Python] Add Parquet unit test for fixed size binary
omit c10b7d7 ARROW-1003: [C++] Check flag _WIN32 instead of __WIN32
omit 3f22b5f ARROW-1000: [GLib] Move install document to Website
omit 8856541 ARROW-1001: [GLib] Unify writer files
omit 0216145 ARROW-991: [Python] Create new dtype when deserializing from Arrow to NumPy datetime64
omit 2d6453b ARROW-940: [JS] Generate multiple artifacts
omit 22c738c ARROW-874: [JS] Read dictionary-encoded vectors
omit 670612e ARROW-954: Flag for compiling Arrow with header-only boost
omit ccf83f4 ARROW-985: [GLib] Update package information
omit 74ad4a8 ARROW-984: [GLib] Add Go examples
omit af0c21e ARROW-957: [Doc] Add HDFS and Windows documents to doxygen output
omit fe945a2 ARROW-965: Website updates for 0.3.0
omit 3d19831 ARROW-967: [GLib] Support initializing array with buffer
omit cb5e7b6 ARROW-446: [Python] Expand Sphinx documentation for 0.3
omit d7a2a1e ARROW-958: [Python] Fix conda source build instructions
omit c48f649 ARROW-963: [GLib] Add equal
omit 20228a2 ARROW-909: Link jemalloc statically if build as external project
omit 03c242c ARROW-947: [Python] Improve execution time of manylinux1 build
omit bd36f6f ARROW-899: [Doc] Add 0.3.0 changelog
omit 959ec47 ARROW-856: Also read compiler info from stdout
omit 75ebf5c ARROW-956: [Python] compat with pandas >= 0.20.0
omit c3a122e ARROW-939: fix division by zero if one of the tensor dimensions is zero
omit 8febd03 ARROW-953: Use conda-forge cmake, curl in CI toolchain
omit 995317a ARROW-929: Remove KEYS file from git
omit 5af8069 ARROW-866: [Python] Normalize PyErr exc_value to be more predictable
omit 316c63d ARROW-824: Date and Time Vectors should reflect timezone-less semantics
omit 1a6d135 ARROW-952: fix regex include from C++ standard library
omit f63ff08 ARROW-52: Set up project blog, draft 0.3 release posting
omit cc06197 ARROW-948: [GLib] Update C++ header file list
omit ba2880c ARROW-946: [GLib] Use "new" instead of "open" for constructor name
omit 9a48773 ARROW-943: [GLib] Support running unit tests with source archive
omit bcf073c ARROW-945: [GLib] Add a Lua example to show Torch integration
omit 80b72d4 [maven-release-plugin] prepare for next development iteration
omit 2c3e111 ARROW-923: Changelog generation Python script, add 0.1.0 and 0.2.0 changelog
omit 928b63f ARROW-938: Fix Rat license warnings
omit 32a4d70 ARROW-936: add missing file; revert tag change
omit e794a59 ARROW-936: fix release README
omit 0eff217 ARROW-933: [Python] Remove debug print statement
omit f1bd49d ARROW-931: [GLib] Reconstruct input stream
omit 02a121f ARROW-927: C++/Python: Add manylinux1 builds to Travis matrix
omit 569426b ARROW-930: javadoc generation fails with java 8
omit da523ce ARROW-928: [C++] Detect supported MSVC versions
omit c9e61cd ARROW-926: Add wesm to KEYS
omit 8013cf3 ARROW-925: [GLib] Fix GArrowBufferReader test
omit 6950e45 ARROW-922: Allow Flatbuffers and RapidJSON to be used locally on Windows
omit d4a2a75 ARROW-910: [C++] Write 0 length at EOS in StreamWriter
omit 00994b8 ARROW-920: [GLib] Add Lua examples
omit b4886da ARROW-919: [GLib] Use "id" to get type enum value from GArrowDataType
omit 2d5142c ARROW-918: [GLib] Use GArrowBuffer for read buffer
omit ce0c962 ARROW-917: [GLib] Add GArrowBufferReader
omit ed5a1d4 ARROW-916: [GLib] Add GArrowBufferOutputStream
omit 53c093b ARROW-914 [C++/Python] Fix Decimal ToBytes
omit f7ab727 ARROW-896: Support Jupyter Notebook in Web site
omit f13a928 ARROW-907: C++: Construct Table from schema and arrays
omit 14bec24 ARROW-908: [GLib] Unify OutputStream files
omit 03dce9d ARROW-900: [Python] Fix UnboundLocalError in ParquetDatasetPiece.read
omit 81be9c6 ARROW-866: [Python] Be robust to PyErr_Fetch returning a null exc value
omit 909f826 ARROW-867: [Python] pyarrow MSVC fixes
omit e876abb ARROW-898: [C++/Python] Use shared_ptr to avoid copying KeyValueMetadata, add to Field type also
omit 3fdeac7 ARROW-886 [Java] Fixing reallocation of VariableLengthVector offsets
omit 8bf61d1 ARROW-697: JAVA Throw exception for record batches > 2GB
omit 02c32ff ARROW-903: [GLib] Remove a needless "."
omit 3ad9d09 ARROW-904: [GLib] Simplify error check codes
omit 7d433dc ARROW-483: [C++/Python] Provide access to "custom_metadata" Field attribute in IPC setting
omit 949249d ARROW-893: Add GLib document to Web site
omit 015b284 ARROW-894: [GLib] Add GArrowResizableBuffer and GArrowPoolBuffer
omit 6ae49a1 ARROW-892: [GLib] Fix GArrowTensor document
omit 68decb6 ARROW-865: [Python] Add unit tests validating Parquet date/time type roundtrips
omit 0bee804 ARROW-888: Transfer ownership of buffer in BitVector transferTo()
omit 1a73c35 ARROW-895: Fix lastSet in fillEmpties() and copyFrom()
omit f00e2ab ARROW-890: [GLib] Add GArrowMutableBuffer
omit eaf2118 ARROW-887: add default value to units for backward compatibility
omit 6239abd ARROW-862: [Python] Simplify README landing documentation to direct users and developers toward the documentation
omit 76d56d3 ARROW-95: Add Jekyll-based website publishing toolchain, migrate existing arrow-site
omit de54eff ARROW-659: [C++] Add multithreaded memcpy implementation
omit 95f489c ARROW-880: [GLib] Support getting raw data of primitive arrays
omit 33ac8a2 ARROW-882: [C++] Rename statically build library on Windows to avoid …
omit 26e5bb1 ARROW-879: compat with pandas v0.20.0
omit a0a925b ARROW-875: Avoid setting an extra empty in fillEmpties()
omit 39a37f7 ARROW-878: [GLib] Add garrow_binary_array_get_buffer()
omit 07c6ade ARROW-849: [C++] Support setting production build dependencies with ARROW_BUILD_TOOLCHAIN
omit 578b0ff ARROW-877: [GLib] Add garrow_array_get_null_bitmap()
omit 76dfd98 ARROW-876: [GLib] Unify ArrayBuilder files
omit 423235c ARROW-868: [GLib] Use GBytes to reduce copy
omit b4a75b1 ARROW-871: [GLib] Unify DataType files
omit 16ea370 ARROW-616: [C++] Do not include debug symbols in release builds by default
omit 6867e93 ARROW-869 [JS] Rename directory to js/
omit 6c352e2 ARROW-822: [Python] StreamWriter Wrapper for Socket and File-like Objects without tell()
omit 7c1fef5 ARROW-864: [GLib] Unify Array files
omit 3f9b26c ARROW-863: [GLib] Use GBytes to implement zero-copy
omit a68f31b ARROW-860: [C++] Remove typed Tensor containers
omit 0dc6fe8 ARROW-846: [GLib] Add GArrowTensor, GArrowInt8Tensor and GArrowUInt8Tensor
omit 74f89cf ARROW-858: Remove boost_regex from arrow dependencies
omit 391242a ARROW-848: [Python] Another pass on conda dev guide
omit 41a8ff9 ARROW-853: [Python] Only set RPATH when bundling the shared libraries
omit 4555ab9 ARROW-841: [Python] Add pyarrow build to Appveyor
omit 59cd801 ARROW-852: Also search for ARROW libs when pkg-config provided the path
omit a94c03a ARROW-809: [C++] Do not write excess bytes in IPC writer after slicing arrays
omit 4baaa88 ARROW-847: Specify BUILD_BYPRODUCTS for gtest
omit 38efabe ARROW-844: [Format] Update README documents in format/
omit 7f20f6e ARROW-818: [Python] Expand Sphinx API docs, pyarrow.* namespace. Add factory functions for time32, time64
omit bb287e2 ARROW-845: [Python] Sync changes from PARQUET-955; explicit ARROW_HOME will override pkgconfig
omit 0bcb785 ARROW-839: [Python] Use mktime variant that is reliable on MSVC
omit bb8514c ARROW-833: [Python] Add Developer quickstart for conda users
omit 84d725b ARROW-825: [Python] Rename pyarrow.from_pylist to pyarrow.array, test on tuples
omit 7238d54 ARROW-734: [C++/Python] Support building PyArrow on MSVC
omit 312a665 ARROW-707: [Python] Return NullArray for array of all None in Array.from_pandas. Revert from_numpy -> from_pandas
omit f512590 ARROW-827: [Python] Miscellaneous improvements to help with Dask support
omit 09e6ead ARROW-836: add test for pandas conversion of timedelta, currently unimplemented
omit dad1a8e ARROW-832: [C++] Update to gtest 1.8.0, remove now unneeded test_main.cc
omit ee5cb2a ARROW-830: [Python] Expose jemalloc memory pool and other memory pool functions in public pyarrow API
omit 30e03a9 ARROW-703: Fix issue where setValueCount(0) doesn’t work in the case that we’ve shipped vectors across the wire
omit 0f9c88f ARROW-725: [Formats/Java] FixedSizeList message and java implementation
omit edb8252 ARROW-829: Don't deactivate Parquet dictionary encoding on column-wis…
omit 4d2ac87 ARROW-826: [C++/Python] Fix compilation error on Mac with -DARROW_PYTHON=on
omit ce5b98e ARROW-820: [C++] Build dependencies for Parquet library without arrow…
omit 4b030dd ARROW-828: [C++] Add new dependency to README
omit 88c351a ARROW-720: arrow should not have a dependency on slf4j bridges in com…
omit 794d020 ARROW-777: restore getObject behavior on Date and Time
omit b603337 ARROW-815 [Java] Exposing reAlloc for ValueVector
omit 01114d8 ARROW-783: [Java/C++] Fixes for 0-length record batches
omit b4892fd ARROW-528: [Python] Utilize improved Parquet writer C++ API, add write_metadata function, test _metadata files
omit 874666a ARROW-816: [C++] Travis CI script cleanup, add C++ toolchain env with Flatbuffers, RapidJSON
omit 19da86a ARROW-817: [Python] Fix comment in date32 conversion
omit 8b64a4f ARROW-751: [Python] Make all Cython modules private. Some code tidying
omit e934365 ARROW-797: [Python] Make more explicitly curated public API page, sphinx cleanup
omit 3d9bfc2 ARROW-646: [Python] Conda s3 robustness, set CONDA_PKGS_DIR env variable and add Travis CI caching
omit 9d532c4 ARROW-539: [Python] Add support for reading partitioned Parquet files with Hive-like directory schemes
omit 9db96fe ARROW-811: [GLib] Add GArrowBuffer
omit 6443b82 ARROW-810: [GLib] Remove io/ipc prefix
omit 5e5a587 ARROW-805: [C++] Don't throw IOError when listing empty HDFS dir
omit ab520cb ARROW-808: [GLib] Remove needless ignore entries
omit 7b4723b ARROW-807: [GLib] Update "Since" tag
omit f5245cc ARROW-806: [GLib] Support add/remove a column from table
omit b3cec80 ARROW-804: [GLib] Update build document
omit b7423a6 ARROW-803: [GLib] Update package repository URL
omit 85b870e ARROW-802: [GLib] Add read examples
omit 06d92bb ARROW-779: [C++] Check for old metadata and raise exception if found
omit c2f28cd ARROW-741: [Python] Switch Travis CI to use Python 3.6 instead of 3.5
omit e327c2e ARROW-761: [C++/Python] Add GetTensorSize method, Python bindings
omit 793f4e0 ARROW-782: [C++] API cleanup, change public member access in DataType classes to functions, use class instead of struct
omit d1a9aff ARROW-795: [C++] Consolidate arrow/arrow_io/arrow_ipc into a single shared and static library
omit ddda303 ARROW-526: [Format] Revise Format documents for evolution in IPC stream / file / tensor formats
omit acbda18 ARROW-794: [C++/Python] Disallow strided tensors in ipc::WriteTensor
omit 72e1e08 ARROW-800: [C++] Boost headers being transitively included in pyarrow
omit 137aade ARROW-722: [Python] Support additional date/time types and metadata, conversion to/from NumPy and pandas.DataFrame
omit 754bcce ARROW-655: [C++/Python] Implement DecimalArray
omit 449f991 ARROW-773: [CPP] Add Table::AddColumn API
omit b0863cb ARROW-788: [C++] Align WriteTensor message
omit 739ed82 ARROW-762: [Python] Start docs page about files and filesystems, adapt C++ docs about HDFS
omit b0e3122 ARROW-724: Add How to Contribute section to README
omit 3591103 ARROW-793: [GLib] Fix indent
omit 8ae3283 ARROW-787: [GLib] Fix compilation error caused by introducing BooleanBuilder::Append overload
omit 027c6b8 ARROW-781 [C++/Python] Increase reference count of the numpy base array?
omit 1c66097 ARROW-758: [C++] Build with /WX in Appveyor, fix MSVC compiler warnings
omit e53357c ARROW-778: Port merge tool to work on Windows
omit e371ebd ARROW-756: [C++] MSVC build fixes and cleanup, remove -fPIC flag from EP builds on Windows, Dev docs
omit 58fa4c2 ARROW-776: [GLib] Fix wrong type name
omit 56f1e91 ARROW-771: [Python] Add read_row_group / num_row_groups to ParquetFile
omit ff744ef ARROW-775: add simple constructors to value vectors
omit 49b3e0e ARROW-774: [GLib] Remove needless LICENSE.txt copy
omit 621d527 ARROW-582: [Java] Added JSON reader/writer unit test for date, time, and timestamp
omit ddf880b ARROW-752: [Python] Support boxed Arrow arrays as input to DictionaryArray.from_arrays
omit f4fcb42 ARROW-510 ARROW-582 ARROW-663 ARROW-729: [Java] Added units for Time and Date types, and integration tests
omit e29a7d4 ARROW-668: [Python] Box timestamp values as pandas.Timestamp if available, attach tzinfo
omit 360942e ARROW-672: [Format] Add MetadataVersion::V3 for Arrow 0.3
omit 5d6c6ad ARROW-770: [C++] Move .clang* files back into cpp source tree
omit 2aed784 ARROW-765: [Python] Add more natural Exception type hierarchy for thirdparty users
omit ec6188e ARROW-769: [GLib] Support building without installed Arrow C++
omit d560e30 ARROW-656: [C++] Add random access writer for a mutable buffer. Rename WriteableFileInterface to WriteableFile for better consistency
omit d0cd03d ARROW-763: C++: Use to find libpythonX.X.dylib
omit f05b7c6 ARROW-443: [Python] Support ingest of strided NumPy arrays from pandas
omit 7d1d4e7 ARROW-657: [C++/Python] Expose Tensor IPC in Python. Add equals method. Add pyarrow.create_memory_map/memory_map functions
omit 7232e5b ARROW-676: move from MinorType to FieldType in ValueVectors to carry all the relevant type bits
omit 96f3d61 ARROW-749: [Python] Delete partially-written Feather file when column write fails
omit 8f113b4 ARROW-755: [GLib] Add garrow_array_get_value_type()
omit 9f720b1 ARROW-738: Fix manylinux1 build
omit c4d535c ARROW-753: [Python] Fix linker error for python-test on OS X
omit d54ab9a ARROW-737: [C++] Enable mutable buffer slices, SliceMutableBuffer function
omit e333576 ARROW-718: [Python] Implement pyarrow.Tensor container, zero-copy NumPy roundtrips
omit 7fec7d3 ARROW-754: [GLib] Add garrow_array_is_null()
omit baf38e4 ARROW-747: [C++] Calling add_dependencies with dl causes spurious CMake warning
omit 651ea92 ARROW-745: [C++] Allow use of system cpplint
omit 31a1f53 ARROW-710: [Python] Read/write with file-like Python objects from read_feather/write_feather
omit fd00096 ARROW-723: [Python] Ensure that passing chunk_size=0 when writing Parquet file does not enter infinite loop
omit 9f5e174 ARROW-733: [C++/Python] Rename FixedWidthBinary to FixedSizeBinary for consistency with FixedSizeList
omit d75d7a9 ARROW-736: [Python] Mixed-type object DataFrame columns should not silently co…
omit 067cd4e ARROW-630: [C++] Create boolean batches for IPC testing, properly account for nonzero offset
omit 4e77d33 ARROW-746: [GLib] Add garrow_array_get_data_type()
omit e5b6827 ARROW-744: [GLib] Re-add an assertion for garrow_table_new() test
omit ad8a0cf ARROW-739: Don't install jemalloc in parallel
omit 005826f ARROW-719: [GLib] Release source archive
omit f5967ed ARROW-603: [C++] Add RecordBatch::Validate method, call in RecordBatch ctor in debug builds
omit 4915ecf ARROW-632: [Python] Add support for FixedWidthBinary type
omit edd6cfc ARROW-727: [Python] Ensure that NativeFile.write accepts any bytes, unicode, or object providing buffer protocol. Rename build_arrow_buffer to pyarrow.frombuffer
omit ba4f478 ARROW-715: [Python] Make pandas not a hard requirement, flake8 fixes
omit ae2da98 ARROW-743: [C++] Consolidate all but decimal array tests into array-test, collect some tests in type-test.cc
omit 4938d8d ARROW-726: [C++] Fix segfault caused when passing non-buffer object to arrow::py::PyBuffer
omit 957a0e6 ARROW-717: [C++] Implement IPC zero-copy round trip for tensors
omit 15b874e ARROW-699: [C++] Resolve Arrow and Arrow IPC build issues on Windows;
omit 47fad3f ARROW-728: [C++/Python] Add Table::RemoveColumn method, remove name member, some other code cleaning
omit 642b753 ARROW-698: Add flag to FileWriter::WriteRecordBatch for writing record batches with lengths over INT32_MAX
omit f7b287a ARROW-627: [C++] Add compatibility macros for exported extern templates
omit 8f38637 ARROW-731: [C++] Add shared library related versions to .pc
omit b032363 ARROW-732: [C++] Schema comparison bugs in struct and union types
omit dac648d ARROW-701: [Java] Support Additional Date Type Metadata
omit 3b71d87 ARROW-620: [C++] Implement JSON integration test support for date, time, timestamp, fixed width binary
omit e717d47 ARROW-716: [Python] Update README build instructions after moving libpyarrow to C++ tree
omit d2d2755 ARROW-658: [C++] Implement a prototype in-memory arrow::Tensor type
omit 3aac4ad ARROW-341: [Python] Move pyarrow's C++ code to the main C++ source tree, install libarrow_python and headers
omit 6d4e862 ARROW-712: [C++] Reimplement Array::Accept as inline visitor
omit fd87669 ARROW-684: [Python] More helpful error message if libparquet_arrow not built
omit ab848f0 ARROW-713: [C++] Fix cmake linking issue in new IPC benchmark
omit 685ebf4 ARROW-626: [Python] Replace PyBytesBuffer with zero-copy, memoryview-based PyBuffer
omit c7947dc ARROW-709: [C++] Restore type comparator for DecimalType
omit 60b5832 ARROW-686: [C++] Account for time metadata changes, add Time32 and Time64 types
omit 5ad4988 ARROW-708: [C++] Simplify metadata APIs to all use the Message class, perf analysis
omit dc3cb30 ARROW-550: [Format] Draft experimental Tensor flatbuffer message type
omit 016a209 ARROW-706: [GLib] Add package install document
omit bc185a4 ARROW-595: [Python] Set schema attribute on StreamReader
omit 13c12c6 ARROW-682: [Integration] Check implementations against themselves
omit dcaa8e5 ARROW-702: fix BitVector.copyFromSafe to reAllocate instead of returning false
omit e968ca6 ARROW-621: [C++] Start IPC benchmark suite for record batches, implement "inline" visitor. Code reorg
omit 2a568f0 ARROW-662: [Format] Move Schema flatbuffers into their own file that can be included
omit 7594492 ARROW-704: Fix bad import caused by conflicting changes
omit e8f6a49 ARROW-674: [Java] Support additional Timestamp timezone metadata
omit f67974b ARROW-700: Add headroom interface for allocator
omit 2926183 ARROW-347: Add method to pass CallBack when creating a transfer pair
omit 990e2bd ARROW-691: [Java] Encode dictionary type in message format
omit bf2acf6 ARROW-454: pojo.Field doesn't implement hashCode()
omit 2406d4e ARROW-552: [Python] Implement getitem for DictionaryArray by returning a value from the dictionary
omit ced9d76 ARROW-679: [Format] Change FieldNode, RecordBatch lengths to long, remove LargeRecordBatch. Refactoring
omit 71424c2 ARROW-683: [C++/Python] Refactor to make Date32 and Date64 types for new metadata. Test IPC roundtrip
omit 3610314 ARROW-689: [GLib] Fix install directories
omit 1b957dc ARROW-688: [C++] Use CMAKE_INSTALL_INCLUDEDIR for consistency
omit 5fda247 ARROW-680: [C++] Support CMake 2 or older again
omit b179ad2 ARROW-681: [C++] Disable boost's autolinking if shared boost is used …
omit 96734ef ARROW-654: [C++] Serialize timezone in IPC metadata
omit d252867 ARROW-675: [GLib] Update package metadata
omit 82b15a4 ARROW-678: [GLib] Fix dependencies
omit 55d8f99 ARROW-677: [java] Fix checkstyle jcl-over-slf4j conflict issue
omit a9a5701 ARROW-208: Add checkstyle policy to java project
omit a8bf0fb ARROW-673: [Java] Support additional Time metadata
omit 98a52b4 ARROW-316: [Format] Changes to Date metadata format per discussion in ARROW-316
omit 6cd82c2 ARROW-671: [GLib] Install missing license file
omit 02bdbf4 ARROW-502 [C++/Python]: Logging memory pool
omit cd4544d ARROW-664: [C++] Make C++ Arrow serialization deterministic
omit df2220f ARROW-661: [C++] Add LargeRecordBatch metadata type, IPC support, associated refactoring
omit 4c5f79c ARROW-617: [Format] Add additional Time metadata and comments based on discussion in ARROW-617
omit a9f0c63 ARROW-651: [C++] Set version to shared library
omit 98c9490 ARROW-639: [C++] Invalid offset in slices
omit 019f90d ARROW-647: [C++] Use Boost shared libraries for tests and utilities
omit 5ef6840 ARROW-652: Remove trailing f in merge script output
omit f5157a0 ARROW-648: [C++] Support multiarch on Debian
omit 16dd871 ARROW-650: [GLib] Follow ReadableFileInterface -> RnadomAccessFile change
omit 57b537a ARROW-637: [Format] Add timezone to Timestamp metadata, comments describing the semantics
omit 39c7274 ARROW-631: [GLib] Import
omit c13d671 ARROW-644: Python: Cython should be a setup-only requirement
omit 3ee3822 ARROW-593 [C++]: Rename ReadableFileInterface to RandomAccessFile
omit 867f924 ARROW-231 [C++]: Add typed Resize to PoolBuffer
omit 0cf2bbb ARROW-642: [Java] Remove temporary file in java/tools
omit 1c101ff ARROW-636: [C++] Update README about Boost system requirement
omit 49f666e ARROW-542: Adding dictionary encoding to FileWriter
omit 3b65001 ARROW-520: [C++] STL-compliant allocator
omit c8d15d4 ARROW-491: [Format / C++] Add FixedWidthBinary type to format, C++ implementation
omit dd8204c ARROW-628: [Python] Install nomkl metapackage when building parquet-cpp in Travis CI
omit a32ae59 ARROW-625: [C++] Add TimeUnit to TimeType::ToString. Add timezone to TimestampType::ToString if present
omit cef4615 ARROW-598: [Python] Add support for converting pyarrow.Buffer to a memoryview with zero copy
omit f442879 ARROW-624: [C++] Restore MakePrimitiveArray function, use in feather.cc
omit 6aed18f ARROW-619: [Python] Fixed remaining typo for LD_LIBRARY_PATH
omit 00df40c ARROW-618: [Python/C++] Support timestamp+timezone conversion to pandas
omit 331be49 ARROW-623: Fix segfault in __repr__ of empty field
omit 2cf36ef ARROW-574: Python: Add support for nested Python lists in Pandas conversion
omit 492b3d4 ARROW-613: WIP TypeScript Implementation
omit d4ecb5e ARROW-612: [Java] Added not null to Field.toString output
omit 344ad1f ARROW-619: Fix typos in setup.py args and LD_LIBRARY_PATH
omit e5a11da ARROW-534: [C++] Add IPC tests for date/time after ARROW-452, fix bugs
omit fdc25b4 ARROW-606: [C++] upgrade flatbuffers version to 1.6.0
omit d99958d ARROW-452: [C++/Python] Incorporate C++ and Python codebases for Feather file format
omit f7f915d ARROW-615: [Java] Moved ByteArrayReadableSeekableByteChannel to src main o.a.a.vector.util
omit 6b3ae2a ARROW-605: [C++] Refactor IPC adapter code into generic ArrayLoader class. Add Date32Type
omit b109a24 ARROW-566: Bundle Arrow libraries in Python package
omit fb9fbe4 ARROW-604: Python: boxed Field instances are missing the reference to their DataType
omit 9deb325 ARROW-109: [C++] Add nesting stress tests up to 500 recursion depth
omit 8378c48 ARROW-589: C++: Use system provided shared jemalloc if static is unavailable
omit 0637e05 ARROW-576: [C++] Complete file/stream implementation for union types
omit 2c3bd93 ARROW-588: [C++] Fix some 32 bit compiler warnings
omit 01a67f3 ARROW-493: [C++] Permit large (length > INT32_MAX) arrays in memory
omit dc103fe ARROW-557: [Python] Add option to explicitly opt in to HDFS tests, do not implicitly skip
omit 16c9759 ARROW-577: [C++] Use private implementation pattern in ipc::StreamWriter and ipc::FileWriter
omit ef3b6b3 ARROW-451: [C++] Implement DataType::Equals as TypeVisitor. Add default implementations for TypeVisitor, ArrayVisitor methods
omit 8afe92c ARROW-578: [C++] Add -DARROW_CXXFLAGS=... option to make CMake more consistent
omit 89dc557 ARROW-580: C++: Also provide jemalloc_X targets if only a static or shared version is found
omit d28f1c1 ARROW-459: [C++] Dictionary IPC support in file and stream formats
omit 5e279f0 ARROW-569: [C++] Set version for *.pc
omit 4598c1a ARROW-570: Determine Java tools JAR location from project metadata
omit ef6b465 ARROW-563: Support non-standard gcc version strings
omit ab15e01 [maven-release-plugin] prepare for next development iteration
omit f6924ad [maven-release-plugin] prepare release apache-arrow-0.2.0
omit fa8d27f ARROW-561:[JAVA][PYTHON] Update java & python dependencies to improve downstream packaging experience
omit d50f152 ARROW-558: Add KEYS files
omit 69cf692 ARROW-556: [Integration] Configure C++ integration test executable with a single environment variable. Update README
omit 66f650c ARROW-547: [Python] Add zero-copy slice methods to Array, RecordBatch
omit ad01575 ARROW-553: C++: Faster valid bitmap building
omit 1f26040 ARROW-548: [Python] Add nthreads to Filesystem.read_parquet and pass through
omit e4845c4 ARROW-551: C++: Construction of Column with nullptr Array segfaults
omit 42b55d9 ARROW-544: [C++] Test writing zero-length record batches, zero-length BinaryArray fixes
omit 0ab4252 ARROW-546: Python: Account for changes in PARQUET-867
omit 3add918 ARROW-476: Add binary integration test fixture, add Java support
omit dc6cefd ARROW-521: [C++] Track peak allocations in default memory pool
omit 31f145d ARROW-545: [Python] Ignore non .parq/.parquet files when reading directories as Parquet datasets
omit 0bdfd5e ARROW-538: [C++] Set up AddressSanitizer (ASAN) builds
omit 4440e40 ARROW-543: C++: Lazily computed null_counts counts number of non-null entries
omit b99d049 ARROW-351: Time type has no unit
omit 1407abf ARROW-537: [C++] Do not compare String/Binary data in null slots when comparing arrays
omit c322cbf ARROW-366 Java Dictionary Vector
omit e97fbe6 ARROW-531: Python: Document jemalloc, extend Pandas section, add Getting Involved
omit 4c3481e ARROW-535: [Python] Add type mapping for NPY_LONGLONG
omit f268e92 ARROW-540: [C++] Build fixes after ARROW-33, PARQUET-866
omit 5439b71 ARROW-33: [C++] Implement zero-copy array slicing, integrate with IPC code paths
omit 74bc4dd ARROW-511: Python: Implement List conversions for single arrays
omit 5bee596 ARROW-529: Python: Add jemalloc and Python 3.6 to manylinux1 build
omit 70c05be ARROW-524: provide apis to access nested vectors and buffers
omit c45c3b3 ARROW-527: Remove drill-module.conf file
omit 84f1662 ARROW-381: [C++] Simplify primitive array type builders to use a default type singleton
omit 5b35d6b ARROW-457: Python: Better control over memory pool
omit e881f11 ARROW-525: Python: Add more documentation to the package
omit 08f38d9 ARROW-477: [Java] Add support for second/microsecond/nanosecond timestamps in-memory and in IPC/JSON layer
omit 720d422 ARROW-467: [Python] Run Python parquet-cpp unit tests in Travis CI
omit c05292f ARROW-523: Python: Account for changes in PARQUET-834
omit 0ae4d86 ARROW-497: Integration harness for streaming file format
omit be5d73f ARROW-410: [C++] Add virtual Writeable::Flush
omit 7ac320b ARROW-519: [C++] Refactor array comparison code into a compare.h / compare.cc in part to resolve Xcode 6.1 linker issue
omit 4226adf ARROW-515: [Python] Add read_all methods to FileReader, StreamReader
omit 30bb0d9 ARROW-514: [Python] Automatically wrap pyarrow.io.Buffer in BufferReader
omit aac2e70 ARROW-513: [C++] Fixing Appveyor / MSVC build
omit a90b5f3 ARROW-512: C++: Add method to check for primitive types
omit a68af9d ARROW-498 [C++] Add command line utilities that convert between stream and file.
omit 61a54f8 ARROW-509: [Python] Add support for multithreaded Parquet reads
omit c90ca60 ARROW-378: Python: Respect timezone on conversion of Pandas datetime columns
omit 085c875 ARROW-81: [Format] Augment dictionary encoding metadata to accommodate additional use cases
omit 2821030 ARROW-508: [C++] Add basic threadsafety to normal files and memory maps
omit 1f81adc ARROW-503: [Python] Implement Python interface to streaming file format
omit c327b5f ARROW-506: Java: Implement echo server for integration testing.
omit 69cdbd8 ARROW-494: [C++] Extend lifetime of memory mapped data if any buffers reference it
omit 53a478d ARROW-475: [Python] Add support for reading multiple Parquet files as a single pyarrow.Table
omit 5a161eb ARROW-505: [C++] Fix compiler warning in gcc in release mode
omit 5888e10 ARROW-495: [C++] Implement streaming binary format, refactoring
omit 8ca7033 ARROW-499: Update file serialization to use the streaming serialization format.
omit 512bc16 ARROW-386: [Java] Respect case of struct / map field names
omit 6811d3f ARROW-474: [Java] Add initial version of streaming serialized format.
omit 9b1b397 ARROW-461: [Python] Add Python interfaces to DictionaryArray data, pandas interop
omit 353772f ARROW-468: Python: Conversion of nested data in pd.DataFrames
omit b147230 ARROW-490: Python: Update manylinux1 build scripts
omit 850774e ARROW-484: Revise README to include more detail about software components
omit a098fd0 ARROW-486: [C++] Use virtual inheritance for diamond inheritance
omit 47115aa ARROW-478: Consolidate BytesReader and BufferReader to accept PyBytes or Buffer
omit 876ae85 ARROW-239: Test reading remainder of file in HDFS with read() with no args
omit 281cb96 ARROW-481: [Python] Fix 2.7 regression in Parquet path to open file code path
omit cb83b8d ARROW-96: Add C++ API documentation
omit ad0e57d ARROW-472: [Python] Expose more C++ IO interfaces. Add equals methods to Parquet schemas. Pass Parquet metadata separately in reader
omit 5ffbda1 ARROW-479: Python: Test for expected schema in Pandas conversion
omit c5663c6 ARROW-385: Refactors metric system
omit 7d3e2a3 ARROW-421: [Python] Retain parent reference in PyBytesReader
omit 543e508 ARROW-469: C++: Add option so that resize doesn't decrease the capacity
omit 8d917c1 ARROW-466: Add ExternalProject for jemalloc
omit f44b6a3 ARROW-442: [Python] Inspect Parquet file metadata from Python
omit 3195948 ARROW-438: [C++/Python] Implement zero-data-copy record batch and table concatenation.
omit 1094d89 ARROW-463: C++: Support jemalloc 4.x
omit 7d1f1cf ARROW-360: C++: Add method to shrink PoolBuffer using realloc
omit 74685f3 ARROW-427: [C++] Implement dictionary array type
omit 5bf6ae4 ARROW-456: Add jemalloc based MemoryPool
omit 320f587 ARROW-455: [C++] Add dtor to BufferOutputStream that calls Close()
omit 9513ca7 ARROW-411: [Java] Move compactor functions in Integration to a separate Validator module
omit fdbc579 ARROW-417: Add Equals implementation to compare ChunkedArrays
omit 26140dc ARROW-387: [C++] Verify zero-copy Buffer slices from BufferReader retain reference to parent Buffer
omit d9df556 ARROW-294: [C++] Do not use platform-dependent fopen/fclose functions for MemoryMappedFile
omit 9f7d4ae ARROW-108: [C++] Add Union implementation and IPC/JSON serialization tests
omit 806239f ARROW-449: Python: Conversion from pyarrow.{Table,RecordBatch} to a Python dict
omit e8b6231 ARROW-450: Fixes for PARQUET-818
omit e15c6a0 ARROW-447: Always return unicode objects for UTF-8 strings
omit 23fe6ae ARROW-338: Implement visitor pattern for IPC loading/unloading
omit 4733ee8 ARROW-445: arrow_ipc_objlib depends on Flatbuffer generated files
omit 3095f2c ARROW-444: [Python] Native file reads into pre-allocated memory. Some IO API cleanup / niceness
omit 8aab00e ARROW-330: CMake functions to simplify shared / static library configuration
omit cfbdb68 ARROW-322: [C++] Remove ARROW_HDFS option, always build the module
omit ab5f66a ARROW-428: [Python] Multithreaded conversion from Arrow table to pandas.DataFrame
omit 1079a32 ARROW-437: [C++} Fix clang compiler warning
omit 65af9ea ARROW-432: [Python] Construct precise pandas BlockManager structure for zero-copy DataFrame initialization
omit fd4eb98 ARROW-440: [C++] Support pkg-config
omit 268ffbe ARROW-374: More precise handling of bytes vs unicode in Python API
omit 73455b5 ARROW-430: Improved version handling
omit f6bf112 ARROW-434: [Python] Correctly handle Python file objects in Parquet read/write paths
omit 6ff5fcf ARROW-433: Correctly handle Arrow to Python date conversion for timezones west of London
omit fe53fa4 ARROW-435: Fix spelling of RAPIDJSON_VENDORED
omit d7845fc ARROW-420: Align DATE type with Java implementation
omit cfde460 ARROW-243: [C++] Add option to switch between libhdfs and libhdfs3 when creating HdfsClient
omit 68e39c6 ARROW-429: Revert ARROW-379 until git-archive issues are resolved
omit c369709 ARROW-426: Python: Conversion from pyarrow.Array to a Python list
omit a2ead2f ARROW-380: [Java] optimize null count when serializing vectors
omit cfb544d ARROW-425: Add private API to get python Table from a C++ object
omit 063c190 ARROW-423: Define BUILD_BYPRODUCTS for CMake 3.2+
omit 9352790 ARROW-422: IPC should depend on rapidjson_ep if RapidJSON is vendored
omit 7e93075 ARROW-405: Use vendored hdfs.h if not found in include/ in $HADOOP_HOME
omit 2c10d7c ARROW-418: [C++] Array / Builder class code reorganization, flattening
omit 73fe556 ARROW-328: Return shared_ptr<T> by value instead of const-ref
omit 45ed7e7 ARROW-394: [Integration] Generate tests cases for numeric types, strings, lists, structs
omit 8995c92 ARROW-402: Fix reference counting issue with empty buffers. Close #232
omit 14ed1be ARROW-400: set struct length on load
omit d06c491 ARROW-399: ListVector.loadFieldBuffers ignores the ArrowFieldNode len…
omit a5362c2 ARROW-346: Use conda environment to build API docs
omit e139b8b ARROW-404: [Python] Fix segfault caused by HdfsClient getting closed before an HdfsFile
omit c8eb49e ARROW-408: Remove defunct conda recipes
omit 72f80d4 ARROW-409: [Python] Change record batches conversion to Table
omit 4b72329 ARROW-406: [C++] Set explicit 64K HDFS buffer size, test large reads
omit 82575ca ARROW-403: [Java] Create transfer pairs for internal vectors in UnionVector transfer impl
omit 599d516 ARROW-401: Floating point vectors should do an approximate comparison…
omit 0ac01a5 ARROW-379: Use setuptools_scm for Python versioning
omit b5de9e5 ARROW-369: [Python] Convert multiple record batches at once to Pandas
omit ebe7dc8 ARROW-335: Improve Type apis and toString() by encapsulating flatbuffers better
omit 06be7ae ARROW-389: Python: Write Parquet files to pyarrow.io.NativeFile objects
omit 33c731d ARROW-398: Java file format requires bitmaps of all 1's to be written…
omit 3b946b8 ARROW-396: [Python] Add pyarrow.schema.Schema.equals
omit 072b7d6 ARROW-395: Arrow file format writes record batches in reverse order.
omit 859018b ARROW-392: [C++/Java] String IPC integration testing / fixes. Add array / record batch pretty-printing
omit 65b74b3 ARROW-393: [JAVA] JSON file reader fails to set the buffer size on String data vector
omit e3c167b ARROW-363: [Java/C++] integration testing harness, initial integration tests
omit 86f56a6 ARROW-202: Integrate with appveyor ci for windows
omit 197120c ARROW-390: Only specify dependencies for json-integration-test on ARROW_BUILD_TESTS=ON
omit f082b17 ARROW-383: [C++] Integration testing CLI tool
omit 997f502 ARROW-382: Extend Python API documentation
omit ed6ec3b ARROW-373: [C++] JSON serialization format for testing
omit 8417096 ARROW-367: converter json <=> Arrow file format for Integration tests
omit 78288b5 ARROW-371: Handle pandas-nullable types correctly
omit 48f9780 ARROW-375: Fix unicode Python 3 issue in columns argument of parquet.read_table
omit 7f048a4 ARROW-356: Add documentation about reading Parquet
omit 4fa7ac4 ARROW-372: json vector serialization format
omit 6996c17 ARROW-312: [Java] IPC file round trip tool for integration testing
omit 79344b3 ARROW-362: Fix memory leak in zero-copy arrow to NumPy/pandas conversion
omit 121e826 ARROW-361: Python: Support reading a column-selection from Parquet files
omit e8bc1fe ARROW-368: Added note for LD_LIBRARY_PATH in Python README
omit 25e0106 ARROW-323: [Python] Opt-in to pyarrow.parquet extension rather than attempting and failing silently
omit 17c9ae7 ARROW-357: Use a single RowGroup for Parquet files as default.
omit 2a059bd ARROW-359: Document ARROW_LIBHDFS_DIR
omit e70d97d ARROW-358: Add explicit environment variable to locate libhdfs in one's environment
omit c7db80e ARROW-355: Add tests for serialising arrays of empty strings to Parquet
omit d414875 ARROW-348: [Python] Add build-type command line option to setup.py, build CMake extensions in a build type subdirectory
omit ca088dd ARROW-339: [Dev] Lingering Python 3 fixes
omit 772bc6e ARROW-349: Add six as a requirement
omit d946e79 ARROW-354: Fix comparison of arrays of empty strings
omit da24c1a ARROW-339: Python 3 compatibility in merge_arrow_pr.py
omit 6178bf7 ARROW-350: Added Kerberos to HDFS client
omit 3d2e4df ARROW-337: UnionListWriter.list() is doing more than it should, this …
omit 2f84493 ARROW-342: Set Python version on release
omit 446ec9b ARROW-334: [Python] Remove INSTALL_RPATH_USE_LINK_PATH
omit e2c0a18 ARROW-327: [Python] Remove conda builds from Travis CI setup
omit 676c32c ARROW-317: Add Slice, Copy methods to Buffer
omit 732a205 ARROW-261: Refactor String/Binary code paths to reflect unnested (non-list-based) structure
omit 8e8b17f ARROW-97: API documentation via sphinx-apidoc
omit 8520061 ARROW-336: Run Apache Rat in Travis builds
omit 4ecf327 ARROW-191: Python: Provide infrastructure for manylinux1 wheels
omit bf749f5 ARROW-275: Add tests for UnionVector in Arrow File
omit 3919a27 ARROW-332: Add RecordBatch.to_pandas method
omit caa843b ARROW-333: Make writers update their internal schema even when no data is written
omit 994aa5a ARROW-189: Build 3rd party with ExternalProject.
omit 8c8d341 ARROW-326: Include scale and precision when materializing decimal writer
omit fb799bc ARROW-112: Changed constexprs to kValue naming.
omit a9747ce ARROW-312: Read and write Arrow IPC file format from Python
omit 17cd7a6 [maven-release-plugin] prepare for next development iteration
omit e7080ef [maven-release-plugin] prepare release apache-arrow-0.1.0
omit eb1491a ARROW-325: make TestArrowFile not dependent on timezone
omit 1196691 ARROW-326: Initialize nested writers in MapWriter based on the underlying MapVector's field
omit 2d8e820 ARROW-319: Add canonical Arrow Schema json representation
omit 3f85cee ARROW-324: Update arrow metadata diagram
omit f1a4bd1 ARROW-320: ComplexCopier.copy(FieldReader, FieldWriter) should not st…
omit 04cf874 ARROW-321: fix arrow licenses
omit dd1b95b ARROW-318: Revise python/README.md given recent changes in codebase
omit 7fb4d24 ARROW-315: finalize timestamp
omit c3cfa3d ARROW-313: Build on any version of XCode
omit c7e6a07 ARROW-302: [C++/Python] Implement C++ IO interfaces for interacting with Python file and bytes objects
omit c3930a0 ARROW-301: Add user field metadata to IPC schemas
omit c7b0480 ARROW-314: JSONScalar is unnecessary and unused
omit 391ab64 ARROW-309: Types.getMinorTypeForArrowType() does not work for Union type
omit 30f6083 ARROW-305: Add compression and use_dictionary options to Parquet
omit bf30235 ARROW-306: Add option to pass cmake arguments via environment variable
omit bd195e3 ARROW-308: UnionListWriter.setPosition() should not call startList()
omit 768c7d0 ARROW-257: Add a typeids Vector to Union type
omit bae33d6 ARROW-304: NullableMapReaderImpl.isSet() always returns true
omit 03134b1 ARROW-270: Define more generic Interval logical type
omit 45d8832 ARROW-293: [C++] Implement Arrow IO interfaces for operating system files
omit 32fd692 ARROW-296: [Python / C++] Remove arrow::parquet, make pyarrow link against parquet_arrow
omit 7e39747 ARROW-267: [C++] Implement file format layout for IPC/RPC
omit 430bd95 ARROW-299: Use absolute namespace in macros
omit 5358328 ARROW-298: create release scripts
omit 5f1556c ARROW-297: Fix Arrow pom for release
omit 559b865 ARROW-280: [C++] Refactor IPC / memory map IO to use common arrow_io interfaces. Create arrow_ipc leaf library
omit 17e90e1 ARROW-290: Specialize alloc() in ArrowBuf
omit 3487c2f ARROW-292: [Java] Upgrade Netty to 4.0.41
omit 6f99156 ARROW-287: Make nullable vectors use a BitVector instead of UInt1Vector for bits
omit 6b8abb4 ARROW-289: Install test-util.h
omit 077c72b ARROW-256: [Format] Add a version number to the IPC/RPC metadata
omit a5f2861 ARROW-286: Build thirdparty dependencies in parallel
omit 52089d6 ARROW-285: Optional flatc download
omit 270ab4e ARROW-278: [Format] Rename Tuple to Struct_ in flatbuffers IDL
omit 214b861 ARROW-283: [C++] Account for upstream changes in parquet-cpp
omit 637584b ARROW-284: Disable arrow_parquet module in Travis CI to triage builds
omit 2d8ec78 ARROW-274: Add NullableMapVector to support nullable maps
omit e197b2d ARROW-279: rename vector module to arrow-vector
omit 0a411fd ARROW-242: Support Timestamp Data Type
omit e081a4c ARROW-271: Update Field structure to be more explicit
omit 907cc5a ARROW-262: Start metadata specification document
omit 803afeb ARROW-264: File format
omit ec51d56 ARROW-269: Include typeVector buffers UnionVector.getBuffers()
omit 8960a2e ARROW-255: Finalize Dictionary representation
omit 7861968 ARROW-252: Add implementation guidelines to the documentation
omit 812201a ARROW-266: [C++] Fix broken build due to Flatbuffers namespace change
omit c2eb161 ARROW-265: Fix few decimal bugs
omit 282fcac ARROW-265: Pad negative decimal values with 1
omit fd2e524 Revert version to 0.1-SNAPSHOT
omit e7e399d ARROW-259: Use Flatbuffer Field type instead of MaterializedField
omit 246a126 ARROW-107: [C++] Implement IPC for structs
omit 268e108 ARROW-251: Expose APIs for getting code and message of the status
omit 689cd27 ARROW-245: add endianness to RecordBatch
omit e8724f8 ARROW-260: Fix flaky oversized tests
omit dc01f09 ARROW-253: restrict ints to 8, 16, 32, or 64 bits in V1
omit 2742d37 ARROW-254: remove Bit type as it is redundant with Boolean
omit 34e7f48 ARROW-250: Fix for ARROW-246 may cause memory leaks
omit 5df7d4d ARROW-247: Missing explicit destructor in RowBatchReader causes an incomplete type error
omit 56835c3 ARROW-246: [Java] UnionVector doesn't call allocateNew() when creating its vectorType
omit 3a2dfba ARROW-101: Fix java compiler warnings
omit 356d015 ARROW-240: Provide more detailed installation instructions for pyarrow. Closes
omit dc79ceb ARROW-244: Some global APIs of IPC module should be visible to the outside
omit a2fb756 ARROW-241: Add missing implementation for splitAndTransfer in UnionVector
omit 59e5f98 ARROW-236: Bridging IO interfaces under the hood in pyarrow
omit 55bfa83 ARROW-238: Change InternalMemoryPool::Free() to return Status::Invalid when ther…
omit 62390d8 ARROW-106: [C++] Add IPC to binary/string types
omit ff6132f ARROW-237: Implement parquet-cpp's abstract IO interfaces for memory allocation and file reading
omit 77598fa ARROW-233: Add visibility macros, add static build option
omit fab4c82 ARROW-234: Build libhdfs IO extension in conda artifacts
omit 2f52cf4 ARROW-215: Support other integer types and strings in Parquet I/O
omit ef90830 ARROW-222: Prototyping an IO interface for Arrow, with initial HDFS target
omit f7ade7b ARROW-223: Do not link against libpython
omit a3e3849 ARROW-219: Preserve CMAKE_CXX_FLAGS, fix compiler warnings
omit 27edd25 ARROW-210: Cleanup of the string related types in C++ code base
omit 790d541 ARROW-218: Add optional API token authentication option to PR merge tool
omit b4e0e93 ARROW-217: Fix Travis w.r.t conda 4.1.0 changes
omit ec66ddd ARROW-203: Python: Basic filename based Parquet read/write
omit 8197f24 ARROW-212: Change contract of PrimitiveArray to reflect its abstractness
omit bc6c4c8 ARROW-200: [C++/Python] Return error status on string initialization failure
omit 9ce13a0 ARROW-60: [C++] Struct type builder API
omit ce2fe7a ARROW-211: [Format] Fixed typos in layout examples
omit 6574095 ARROW-209: [C++] Triage builds due to unavailable LLVM apt repo
omit c8b8078 [Doc] Update Layout.md
omit cd1d770 ARROW-206: Expose a C++ api to compare ranges of slots between two arrays
omit 7035467 Add java support to Travis CI
omit e316b3f Fix BaseAllocator.java NPE when assertions are disabled
omit c0985a4 Make BaseValueVector#MAX_ALLOCATION_SIZE configurable
omit e0fb369 ARROW-201: [C++] Initial ParquetWriter implementation
omit 978de1a ARROW-204: Add Travis CI builds that post conda artifacts for Linux and OS X
omit 9c59158 ARROW-185: Make padding and alignment for all buffers be 64 bytes
omit 6968ec0 ARROW-199: [C++] Refine third party dependency
omit 68b80a8 ARROW-197: Working first draft of a conda recipe for pyarrow
omit 4bd13b8 ARROW-91: Basic Parquet read support
omit 1f04f7f ARROW-193: typos "int his" fix to "in this"
omit c9ffe54 ARROW-194: C++: Allow read-only memory mapped source
omit 3302257 ARROW-190: Python: Provide installable sdist builds
omit ad3d01d ARROW-188: Add numpy as install requirement
omit 355f7c9 ARROW-92: Arrow to Parquet Schema conversion
omit 56514d9 ARROW-104: [FORMAT] Add alignment and padding requirements + union clarification
omit a541644 ARROW-100: [C++] Computing RowBatch size
omit 0b472d8 ARROW-82: Initial IPC support for ListArray
omit 5843e68 ARROW-103: Add files to gitignore
omit 37f7271 ARROW-94: [Format] Expand list example to clarify null vs empty list
omit 7b2153b ARROW-85: memcmp can be avoided in Equal when comparing with the same …
omit 9d88a50 ARROW-86: [Python] Implement zero-copy Arrow-to-Pandas conversion
omit 5d12999 ARROW-71: [C++] Add clang-tidy and clang-format to the tool chain.
omit 79fddd1 ARROW-90: [C++] Check for SIMD instruction set support
omit 6d31d59 ARROW-49: [Python] Add Column and Table wrapper interface
omit b3ebce1 ARROW-89: [Python] Add benchmarks for Arrow<->Pandas conversion
omit 5a68f8d ARROW-93: Fix builds when using XCode 7.3
omit 2d8627c ARROW-87: [C++] Add all four possible ways to encode Decimals in Parquet to schema conversion
omit 38897ee ARROW-83: [C++] Add basic test infrastructure for DecimalType
omit df7726d ARROW-88: [C++] Refactor usages of parquet_cpp namespace
omit 80ec2c1 ARROW-79: [Python] Add benchmarks
omit ecadd0b ARROW-80: Handle len call for pre-init arrays
omit 1fd0668 ARROW-30: [Python] Routines for converting between arrow::Array/Table and pandas.DataFrame
omit 0171877 ARROW-65: Be less restrictive on PYTHON_LIBRARY search paths
omit d6d53b2 ARROW-63: [C++] Enable ctest to work on systems with Python 3 as the default Python
omit d3cb6b4 ARROW-22: [C++] Convert flat Parquet schemas to Arrow schemas
omit 0a8979d ARROW-37: [C++ / Python] Implement BooleanArray and BooleanBuilder. Handle Python built-in bool
omit c06b765 ARROW-62: Clarify null bitmap interpretation, indicate bit-endianness, add null count, remove non-nullable physical distinction
omit fbbee3d ARROW-77: [C++] Conform bitmap interpretation to ARROW-62; 1 for nulls, 0 for non-nulls
omit a4002c6 ARROW-70: Add adapt 'lite' DCHECK macros from Kudu as also used in Parquet
omit 65db0da ARROW-67: C++ metadata flatbuffer serialization and data movement to memory maps
omit 093f9bd ARROW-75: Fix handling of empty strings
omit 4ec034b ARROW-28: Adding google's benchmark library to the toolchain
omit 016b92b ARROW-72: Search for alternative parquet-cpp header
omit 3a99f39 ARROW-73: Support older CMake versions
omit c996610 ARROW-68: Better error handling for not fully setup systems
omit 5881aac ARROW-64: Add zsh support to C++ build scripts
omit 883c62b ARROW-55: [Python] Fix unit tests in 2.7
omit 6fdcd49 ARROW-54: [Python] Rename package to "pyarrow"
omit 8367527 ARROW-42: Add Python tests to Travis CI build
omit e822ea7 ARROW-46: ListVector should initialize bits in allocateNew
omit 31def7d ARROW-51: Add simple ValueVector tests
omit 243ed4e ARROW-18: Fix decimal precision and scale in MapWriters
omit 1650026 ARROW-17: set some vector fields to package level access for Drill compatibility
omit 45cd9fd ARROW-43: Python: format array values in __repr__ for interactive computing
omit ae95dbd ARROW-44: Python: prototype object model for array slot values ("scalars")
omit 9afb667 ARROW-31: Python: prototype user object model, add PyList conversion path with type inference
omit 571343b ARROW-9: Rename some unchanged "Drill" to "Arrow" (follow-up)
omit 8caa287 ARROW-35: Add a short call-to-action in the top level README.md
omit 572cdf2 ARROW-7: Add barebones Python library build toolchain
omit 612fbc7 ARROW-24: C++: Implement a logical Table container type
omit 9c2b954 ARROW-23: Add a logical Column data structure
omit 3b777c7 ARROW-26: Add instructions for enabling Arrow C++ Parquet adapter build
omit 0c95d3c ARROW-10: Fix mismatch of javadoc names and method parameters
omit 307977e ARROW-15: Fix a naming typo for memory.AllocationManager.AllocationOutcome
omit 89c6afd ARROW-21: Implement a simple in-memory Schema data structure
omit b88b69e ARROW-20: Add null_count_ member to array containers, remove nullable_ member
omit e418020 ARROW-19: Add an externalized MemoryPool interface for use in builder classes
omit 1000d11 ARROW-36: Remove fixVersions from JIRA resolve code path
omit 8f2ca24 ARROW-13: Add PR merge tool from parquet-mr, suitably modified
omit a385622 ARROW-8: Add .travis.yml and test script for Arrow C++. OS X build fixes
omit e6905ef ARROW-9: Replace straggler references to Drill
omit e9cc8ce ARROW-5: Correct Apache Maven repo for maven plugin use
omit 7e76e3a ARROW-5: Update drill-fmpp-maven-plugin to 1.5.0
omit 23c4b08 ARROW-4: This provides a partial C++11 implementation of the Apache Arrow data structures along with a cmake-based build system. The codebase generally follows Google C++ style guide, but more cleaning to be more conforming is needed. It uses googletest for unit testing.
omit 16e44e3 ARROW-3: This patch includes a WIP draft specification document for the physical Arrow memory layout produced over a series of discussions amongst the to-be Arrow committers during late 2015. There are also a few small PNG diagrams that illustrate some of the Arrow layout concepts.
omit fa5f029 ARROW-1: Initial Arrow Code Commit
omit cbc56bf Update readme and add license in root.
omit d5aa7c4 Initial Commit
add 0427442 Initial pre-ASF parquet-cpp development by Nong Li
add b30c09c PARQUET-232: minor compilation issue
add 4f47d10 PARQUET-416: C++11 compilation, code reorg, libparquet and installation targets
add 09cec85 PARQUET-267: Detach thirdparty code from build configuration.
add aecf146 PARQUET-449: updated to latest parquet.thrift
add aac1934 PARQUET-437: Add googletest setup and ADD_PARQUET_TEST helper
add cea2092 PARQUET-469: Roll back Thrift thirdparty and compiled sources to 0.9.0
add fbda61f PARQUET-434: Add a ParquetFileReader class
add fb06287 PARQUET-418: Refactored parquet_reader utility for printing file contents.
add 7c33cc9 PARQUET-451: Add RowGroupReader helper class and refactor parquet_reader.cc into DebugPrint
add b1d44f1 PARQUET-439: Conform copyright headers to ASF requirements
add 2152bfc PARQUET-428: Support INT96 and FIXED_LEN_BYTE_ARRAY types
add ecf5e7d PARQUET-472: Changed the ownership of InputStream in ColumnReader.
add 6cefaba PARQUET-435: Change column reader methods to be array-oriented rather than scalar
add e837ee9 PARQUET-496: Fix cpplint configuration to catch more style errors
add 3bac789 PARQUET-438: Update RLE encoding tools and add unit tests from Impala
add 41eed7e PARQUET-485: Decouple page deserialization from column reader to facilitate unit testing
add 88e5e0e PARQUET-503: Reenable parquet 2.0 encoding implementations.
add fda229a PARQUET-454: Fix inconsistencies with boolean PLAIN encoding
add 143485d PARQUET-442: Nested schema conversion, Thrift struct decoupling, dump-schema utility
add 783b76c PARQUET-507: Reduce the runtime of rle-test
add 5e91cff PARQUET-455: Fix OS X / Clang compiler warnings
add 569ffb2 PARQUET-448: Add cmake options to not build tests and/or executables
add b47f67e PARQUET-513: Fail build if valgrind finds error during ctest, fix a core dump
add b268bb8 PARQUET-169: Implement support for bulk reading and writing rep/def levels
add bc47477 PARQUET-501: Add OutputStream abstract interface, refactor encoding code paths
add d35efe2 PARQUET-497: Decouple serialized file internals from the ParquetFileReader public API
add 4e18915 PARQUET-505: Column reader should automatically handle large data pages
add c857ddd PARQUET-456: Finish gzip implementation and unit test all compressors
add bf3bf75 PARQUET-446: Hide Thrift compiled headers and Boost from public API, #include scrubbing
add af04814 PARQUET-515: Add "SetData" to LevelDecoder
add a13b20f PARQUET-499: Complete PlainEncoder implementation for all primitive types and test end to end
add 218fe8e PARQUET-468: Use thirdparty Thrift compiler to compile parquet.thrift at make time
add 5d05c2e PARQUET-457: Verify page deserialization for GZIP and SNAPPY codecs, related refactoring
add 70665ce PARQUET-533: Add a Buffer abstraction, refactor input/output classes to be simpler using Buffers
add 3eb2233 PARQUET-525: Add test coverage for failure modes in ParseMetaData
add f0f40f6 PARQUET-538: Improve ColumnReader Tests
add ae1bb51 PARQUET-494: Implement DictionaryEncoder and test dictionary decoding
add cee3691 PARQUET-545: Improve API to support decimal type
add e5f04e6 PARQUET-518: Remove -Wno-sign-compare and scrub integer signedness
add 22f352c PARQUET-520: Add MemoryMapSource and add unit tests for both it and LocalFileSource
add 4923018 PARQUET-463: Add local DCHECK macros, fix some dcheck bugs exposed
add 853b128 PARQUET-537: Ensure that LocalFileSource is properly closed.
add 4bcfb0e PARQUET-519: Remove last of suppressed compiler warnings
add 8d43015 PARQUET-482: Organize public API headers
add 4b0a2d9 PARQUET-549: Add column reader tests for dictionary pages
add 0c764ea PARQUET-555: Dictionary page metadata handling inconsistencies
add 3db3240 PARQUET-561: Add destructor to PIMPL
add cd531f1 PARQUET-556: Extend RowGroupStatistics to include "min" "max" statistics
add 41920f5 PARQUET-488: Add SSE cmake toggle, fix build on systems without SSE
add b2c072e PARQUET-564: Add cmake option to run valgrind on each unit test executable
add c6e269d PARQUET-542: Support custom memory allocators
add 43b895f PARQUET-568: Enable top-level column selection.
add 1ce2869 PARQUET-559: Enable external RandomAccessSource as input to the ParquetFileReader
add 0a0ab70 PARQUET-566: Add method to retrieve the full column path
add bba4d52 PARQUET-572: Rename public namespace to parquet from parquet_cpp
add 8af2caf PARQUET-582: Conversions functions for Parquet enums to Thrift enums
add 2284964 PARQUET-583: Parquet to Thrift schema conversion
add f044f2a PARQUET-587: Implement BufferReader::Read(int64_t,uint8_t*)
add b3cdb9e PARQUET-436: Implement basic Write Support
add 7dc51f8 PARQUET-547: Refactor templates to all be based on DataType structs
add fe1f3b7 PARQUET-477: Add clang-format / clang-tidy checks to toolchain
add bb67f88 PARQUET-512: Add Google benchmark for performance testing
add d050bf4 PARQUET-597: Add data rates to benchmark output
add 862a975 PARQUET-589: Implement BufferedInputStream for better memory usage
add 37e621e PARQUET-599: Better size estimation for levels
add 968e2bd PARQUET-604: Add writer headers to installation
add c41cff6 PARQUET-605: Expose schema node in ColumnDescriptor
add 43bd263 PARQUET-603: Implement missing information in schema descriptor
add dd58e39 PARQUET-607: Public writer header
add 227f66f PARQUET-610: Print additional ColumnMetaData for each RowGroup
add af71bad PARQUET-614: Remove unneeded LZ4-related code
add e1cba98 PARQUET-616: WriteBatch should accept const arrays
add 3ff3b58 PARQUET-600: Add benchmarks for RLE-Level encoding
add e1e0d28 PARQUET-620: Ensure metadata is written only once
add cd8906c PARQUET-619: Add OutputStream for local files
add 634132e PARQUET-621: Add flag to indicate if decimalmetadata is set
add 01d31db PARQUET-598: Test writing all primitive data types
add 466aa3d PARQUET-625: Improve RLE read performance
add 2e42359 PARQUET-629: RowGroupSerializer should only close itself once
add b1a816d PARQUET-633: Add version to WriterProperties
add ba3012e PARQUET-634: Consistent private linking of dependencies
add ce0cdeb PARQUET-592: Support compressed writes
add c21b041 PARQUET-636: Expose selection for different encodings
add 427d0a2 PARQUET-641: Instantiate stringstream only if needed in SerializedPageReader::NextPage
add a8ad3a4 PARQUET-639: Do not export DCHECK in public headers
add 8e98b5c PARQUET-643: Add const modifier to schema pointer reference
add 05c4c9d PARQUET-646: Add options to make developing with clang and 3rd-party gcc easier
add b3d9a14 PARQUET-489: Shared library symbol visibility
add b6abc6d PARQUET-551: Handle compiler warnings due to disabled DCHECKs in relea…
add 1e73c0a PARQUET-657: Do not define DISALLOW_COPY_AND_ASSIGN if already defined
add 3b88b05 PARQUET-658: Add virtual destructor to ColumnReader
add e21857a PARQUET-659: Export extern templates for typed column reader/writer classes
add b283264 PARQUET-662: Compile ParquetException implementation and explicitly export
add a0bfd9d PARQUET-671: performance improvements for rle/bit-packed decoding
add 602b9be PARQUET-666: Add support for writing dictionaries
add 4078b87 PARQUET-694: Revert default data page size back to 1M
add 18aa1ac PARQUET-573: Create a public API for reading and writing file metadata
add f128d51 PARQUET-699: Update parquet.thrift from https://github.com/apache/parquet-format
add 3976997 PARQUET-701: Ensure that Close can be called multiple times
add 08ce126 PARQUET-700: Disable dictionary encoding for boolean columns
add ddf0297 PARQUET-676: Fix incorrect MaxBufferSize for small bit widths
add 78b1de3 PARQUET-681: Add tool to scan a parquet file
add cc1fdec PARQUET-704: Install scan-all.h
add 66e7299 PARQUET-703: Validate that ColumnChunk metadata counts nulls in num_values
add 8268107 PARQUET-708: account for "worst case scenario" in MaxBufferSize for bit_width > 1
add ce843c8 PARQUET-710: Remove unneeded private member variables from RowGroupReader ABI
add 10ebdbd PARQUET-711: Use metadata builders in parquet writer
add adcabc4 PARQUET-687: C++: Switch to PLAIN encoding if dictionary grows too large
add 20c2cb2 PARQUET-718: Fix I/O of non-dictionary encoded pages
add 87ff504 PARQUET-719: Fix WriterBatch API to handle NULL values
add 9e46b37 PARQUET-689: C++: Compress DataPages eagerly
add b8de4d0 PARQUET-720: Mark ScanAllValues as inline to prevent link error
add 13980f9 PARQUET-712: Add library to read into Arrow memory
add 9dfa948 PARQUET-724: Test more advanced properties setting
add 287cf01 PARQUET-728: Incorporate upstream Arrow API changes
add c9c7f4a PARQUET-721: benchmarks for reading into Arrow
add 9aae125 PARQUET-731: API to return metadata size and Skip reading values
add 43c7154 PARQUET-593: Add API for writing Page statistics
add 53958b1 PARQUET-737: Use absolute namespace in macros
add 20d4a17 PARQUET-741: Always allocate fresh buffers while compressing
add 408d788 PARQUET-739: Don't use a static buffer for data accessed by multiple threads
add c81a26e PARQUET-739: Don't use a static buffer for data accessed by multiple threads
add 350e520 PARQUET-747: Better hide TypedRowGroupStatistics in public API
add 73eb456 PARQUET-742: Add missing license headers
add 67ae6e5 PARQUET-752: Account for upstream Arrow API changes
add 05a168c PARQUET-759: Fix handling of columns of empty strings
add 9c527b7 PARQUET-760: Store correct encoding in fallback data pages
add 96a6dd4 PARQUET-745: TypedRowGroupStatistics fails to PlainDecode min and max in ByteArrayType
add 4409707 PARQUET-763: C++: Expose ParquetFileReader through Arrow reader
add 676d61c PARQUET-766: Expose ParquetFileReader through Arrow reader as const
add 6da9e8a PARQUET-764: Support batches for PLAIN boolean writes that aren't a multiple of 8
add 163b2ac PARQUET-762: C++: Use optimistic allocation instead of Arrow Builders
add 5abf985 PARQUET-775: Make TrackingAllocator thread-safe
add 246ec91 PARQUET-702: Add a writer + reader example with detailed comments
add a414be7 PARQUET-778: Standardize the schema output to match the parquet-mr format
add e0f9806 PARQUET-769: Add support for Brotli compression
add fbdba4f PARQUET-779: Export TypedRowGroupStatistics in libparquet
add 7a5f274 PARQUET-780: WriterBatch API does not properly handle NULL values for byte array types
add 38416c4 PARQUET-782: Support writing to Arrow sinks
add 8bbb5d7 PARQUET-789: Catch/translate ParquetExceptions in parquet::arrow::FileReader
add b801505 PARQUET-785: LIST schema conversion for Arrow lists
add 912d7af PARQUET-797: Updates for ARROW-418 header API changes
add 7752273 PARQUET-799: Fix bug in MemoryMapSource::CloseFile
add b50e626 PARQUET-805: Read Int96 into Arrow Timestamp(ns)
add 7790183 PARQUET-812: Read BYTE_ARRAY with no logical type as arrow::BinaryArray
add ffb7f06 PARQUET-816: Workaround for incorrect column chunk metadata in parquet-mr <= 1.2.8
add e348a6d PARQUET-813: Build thirdparty dependencies using ExternalProject
add deb5680 PARQUET-818: Refactoring to utilize common IO, buffer, memory management abstractions and implementations
add bfb24f6 PARQUET-819: Don't try to install no longer existing arrow/utils.h
add d36dc11 PARQUET-807: Allow user to retain ownership of parquet::FileMetaData.
add 1867981 PARQUET-809: Add SchemaDescriptor::Equals method
add 6d354a1 PARQUET-827: Account for arrow::MemoryPool API change and fix bug in reading Int96 timestamps
add ea9c4d3 PARQUET-828: Do not implicitly cast ParquetVersion enum to int
add 2cbd797 PARQUET-829: Make use of ARROW-469
add 6312724 PARQUET-830: Add parquet::arrow::OpenFile with additional properties and metadata args
add 97e69b4 PARQUET-820: Decoders should directly emit arrays with spacing for null entries
add f3a3c69 PARQUET-833: C++: Provide API to write spaced arrays
add 4e52f61 PARQUET-837: Remove RandomAccessSource::Seek method which can be a source of thread safety problems
add 18caeab PARQUET-835: Read Arrow columns in parallel with thread pool
add c195976 PARQUET-836: Bugfix + testcase for column subsetting in arrow::FileReader::ReadFlatTable
add d0446e1 PARQUET-691: Write ColumnChunk metadata after chunk is complete
add 38a6a98 PARQUET-841: Version number being incorrectly written for v1 files
add 493603d PARQUET-842: Do not set unnecessary fields in the parquet::SchemaElement
add 5a21610 PARQUET-843: Impala is thrown off by a REPEATED root schema node
add c016b72 PARQUET-844: Schema, compression consolidation / flattening
add 61b7b12 PARQUET-846: CpuInfo::Init() is not thread safe
add 270bda0 PARQUET-848: Build Thrift bits as part of main parquet_objlib component
add 8fda954 PARQUET-834: Support I/O of arrow::ListArray
add 7f305a6 PARQUET-857: Flatten parquet/encodings directory, consolidate code
add 7a65d43 PARQUET-862: Provide default cache size values
add d53bb1a PARQUET-866: API fixes for ARROW-33 patch
add 3eda0d2 PARQUET-867: Support writing sliced Arrow arrays
add ee62a34 PARQUET-874: Use default memory allocator from Arrow
add 6a9631a PARQUET-793: Do not return incorrect statistics
add 72cb04b PARQUET-877: Update Arrow Hash, update Version in metadata.
add cff54fa PARQUET-880: Prevent destructors from throwing
add 74db8d1 PARQUET-882: Improve Application Version parsing
add cb8eab9 PARQUET-888: Add missing virtual dtor.
add 0d2b951 PARQUET-889: Fix compilation when SSE is enabled
add 220aa56 PARQUET-894: Fix compilation warning
add 5ab15c6 PARQUET-895: Fix broken reading of nested repeated columns
add 48b70d0 PARQUET-894: Fix compilation warnings
add 9ca26c7 PARQUET-903: Add option to set RPATH to origin
add fb325c3 PARQUET-890: Support I/O of DATE columns in parquet_arrow
add 6060d83 PARQUET-908: Fix shared library visibility of some symbols in types.h
add b6b5aac PARQUET-909: Reduce buffer allocations (mallocs) on critical path
add aaf4ffd PARQUET-897: Only use designated public headers from libarrow
add 9d27375 PARQUET-919: Account for ARROW-683 changes, but make no functional changes. Set PARQUET_ARROW=on by default
add f0d1456 PARQUET-923: Account for Time type changes in Arrow
add 22d95d2 PARQUET-928: Support pkg-config
add 0f93007 PARQUET-933: Account for API changes in ARROW-728
add 22279eb PARQUET-934: Support multiarch on Debian
add 7bf8f04 PARQUET-935: Set version to shared library
add 81c2696 PARQUET-943: Fix build error on x86
add 4b53921 PARQUET-946: Add ReadRowGroup and num_row_group methods to arrow::FileReader
add d2c347d PARQUET-947: Account for Arrow library consolidation in ARROW-795, API changes in ARROW-782
add 2ea0d60 PARQUET-918: FromParquetSchema API crashes on nested schemas
add b3dedf4 PARQUET-953: Add static constructors to arrow::FileWriter for initializing from schema, add WriteTable method
add ada05fa PARQUET-918: Keep ordering in column indices when converting Parquet Schema
add c3dc8a1 PARQUET-898: Upgrade to googletest 1.8.0, move back to Xcode 6.4 in Travis CI
add 4ea7124 PARQUET-508: Add ParquetFilePrinter
add dac6505 PARQUET-958: [C++] Print Parquet metadata in JSON format
add 61f3b1d PARQUET-915: Support additional Arrow date/time types and metadata
add 6a27975 PARQUET-963: Return NotImplemented when attempting to read a struct field
add 35d09d4 PARQUET-595: API for KeyValue metadata
add 5e60bfc PARQUET-965: Add FIXED_LEN_BYTE_ARRAY read and write support in parquet-arrow
add 4e96056 PARQUET-679: Local Windows build and Appveyor support
add f444dfe PARQUET-936: Return Invalid Status if chunk_size <= 0 when WriteTable in parquet-arrow
add 7242b1c PARQUET-914: Rewording exception message in column writer.
add 8255ccc PARQUET-679: [C++] Resolve unit tests issues on Windows; Run unit tes…
add bd02cca PARQUET-930: Add timestamp[us] to schema test
add 8bc6ec5 PARQUET-679: Fix debug asserts in tests (msvc/debug build)
add 2fab6a2 PARQUET-984: Add abi and so version to pkg-config
add 0e4c4a1 PARQUET-992: Do not transitively include zlib.h in public API
add 7638af1 PARQUET-995: Use sizeof(Int96) instead of Int96Type
add a821f09 PARQUET-997: Fix override compiler warnings
add 0e1f467 PARQUET-978: [C++] Minimizing footer reads for small(ish) metadata
add 7d476b2 PARQUET-991: Resolve msvc warnings; Appveyor treats msvc warnings as …
add a8d8d22 PARQUET-967: Combine libparquet, libparquet_arrow libraries
add 5aa2339 PARQUET-999: Improve MSVC build - Enable PARQUET_BUILD_BENCHMARKS
add 5f42afa PARQUET-1008: [C++] TypedColumnReader::ReadBatch method updated to ac…
add 9dcb12d PARQUET-1003: Modify DEFAULT_CREATED_BY value for every new release v…
add 94e351c PARQUET-1029: [C++] Some extern template symbols not being exported in gcc
add 8f7282b PARQUET-1007: Update parquet.thrift
add 13f3fde PARQUET-991: Fix msvc warning C4100: '<id>': unreferenced formal parameter
add 514b74c PARQUET-1033: Improve documentation about WriteBatchSpaced
add 2d98407 PARQUET-911: [C++] Support nested structs in parquet_arrow
add cc46aff PARQUET-1038: Key value metadata should be nullptr if not set
add 1fdd816 PARQUET-1042: Fix Compilation breaks on GCC 4.8
add 61da26c PARQUET-1041: Support Arrow's NullArray
add 0a32c6b PARQUET-1043: Raise minimum CMake version to 3.2, delete cruft.
add b0414cc PARQUET-1044: Use compression libraries from Apache Arrow
add 81db371 PARQUET-858: Flatten column directory, minor code consolidation
add 40527c3 PARQUET-1045: Remove code that's being moved to Apache Arrow in ARROW-1154
add 5374737 PARQUET-1040: Add missing writer methods
add 3e34c37 PARQUET-1048: Apache Arrow static transitive dependencies
add 658c7fb PARQUET-1053: Fix unused result warnings due to unchecked Statuses
add 68315b8 PARQUET-1054: Fixes for Arrow API changes in ARROW-1199
add 2395770 PARQUET-1035: Write Int96 from Arrow timestamp(ns)
add 6c97fe6 PARQUET-1068: Modify .clang-format to use straight Google format with 90-character line width
add facce86 PARQUET-1072: Build with ARROW_NO_DEPRECATED_API in Travis CI
add 82d516e PARQUET-1078: Add option to coerce Arrow timestamps to a particular unit
add 7fd1519 PARQUET-1079: Remove Arrow offset shift unneeded after ARROW-1335
add 38a4e9f PARQUET-1083: Factor logic in parquet-scan.cc into a library function to help with perf testing
add eadc62e PARQUET-1085: [C++] Use namespaced macros from arrow/util/macros.h, work around UNUSED rename
add 5f54be7 PARQUET-1087: Add ScanContents function to arrow::FileReader that catches Parquet exceptions
add 4845e76 PARQUET-1088: Remove parquet_version.h from version control since it gets auto generated
add 751eb00 PARQUET-1090: Add max row group length option, fix int32 overflow
add 200774e PARQUET-1093: Improve Arrow level generation error message
add dcf96ed PARQUET-1002: Compute statistics based on Sort Order
add 92e7dae PARQUET-1098: Install util/comparison.h
add d29d4a9 PARQUET-1104: Upgrade to Apache Arrow 0.7.0 RC0
add 75cf66a PARQUET-929: Handle arrow::DictionaryArray when writing Arrow data
add cd1c622 PARQUET-1094: Add benchmark for boolean Arrow column I/O
add d7003c0 PARQUET-1100: Introduce RecordReader interface to better support nested data, refactor parquet/arrow/reader
add 468e737 PARQUET-1037: allow arbitrary size row-groups
add 9809754 PARQUET-1108: Fix Int96 comparators
add ac1a5d3 PARQUET-1114 Apply changes for ARROW-1601 ARROW-1611, change shared l…
add f5c7aee PARQUET-1123: [C++] Update parquet-cpp to use Arrow's AssertArraysEqual
add f36231d PARQUET-1121: Handle Dictionary[Null] arrays on writing Arrow tables
add f1dabe9 PARQUET-1138: Fix Arrow 0.7.1 build
add dcea0ab PARQUET-1150: Hide statically linked boost symbols
add da29595 PARQUET-1095: [C++] Read and write Arrow decimal values
add d619050 PARQUET-1164: [C++] Account for API changes in ARROW-1808
add 1124a79 PARQUET-970: Add Lz4 and Zstd compression codecs
add adc569a PARQUET-1167: [C++] FieldToNode function should return a status when throwing an exception
add 4acd139 PARQUET-1175: Fix arrow::ArrayData method rename from ShallowCopy to Copy
add 2b37b1f PARQUET-1165: Pin clang-format version to 4.0
add 5324ee9 PARQUET-859: Flatten parquet/file directory, consolidate file reader, file writer code
add bcc1f88 PARQUET-1177: Add PARQUET_BUILD_WARNING_LEVEL option and more rigorous Clang warnings
add 46e1d4e PARQUET-1092: Support writing chunked arrow::Table columns
add 7dbe374 PARQUET-1180: Fix behaviour of num_children element of primitive nodes
add 4538a2e PARQUET-1086: [C++] Remove usage of arrow/util/compiler-util.h
add d257a88 PARQUET-1193: [CPP] Implement ColumnOrder to support min_value and max_value
add 39c0b7b PARQUET-1179: Upgrade to Thrift 0.11, use std::shared_ptr instead of boost::shared_ptr
add 5ebb78c PARQUET-1200: Support reading a single Arrow column from a Parquet file
add 7f1b0c0 PARQUET-1226: Fixes for CHECKIN compiler warning level with clang 5.0
add cae28c0 PARQUET-1218: More informative error message on too short pages
add 96a0265 PARQUET-1233: Enable option to switch between stl classes and boost c…
add 15e8661 PARQUET-1225: NaN values may lead to incorrect filtering under certai…
add b3f3c09 PARQUET-1245: Fix creating Arrow table with duplicate column names
add 102d951 PARQUET-1166: Add GetRecordBatchReader in parquet/arrow/reader
add f28563d PARQUET-1071: Check that arrow::FileWriter::Close() is idempotent
add de865da PARQUET-1255: Fix error message when PARQUET_TEST_DATA isn't defined
add b73771b PARQUET-1265: Segfault on static ApplicationVersion initialization
add 828783d PARQUET-1267: [C++] replace "unsafe" std::equal by std::memcmp
add a251714 PARQUET-1268: Fix conversion of null list Arrow arrays
add 9d99820 PARQUET-1273: Properly write dictionary values when writing in chunks
add 42f287c PARQUET-1274: Prevent segfault that was occurring when writing a nanosecond timestamp with arrow writer properties set to coerce timestamps and support deprecated int96 timestamps.
add 2d0a904 PARQUET-1272: Return correct row count for nested columns in ScanFileContents
add fa53ea7 PARQUET-1279: [C++] Adding use of ASSERT_NO_FATAL_FAILURE in unit tests when calling helper functions that call ASSERT_ macros
add b9e80c8 PARQUET-1283: [C++] Remove trailing space for string and int96 statis…
add 076fbc6 PARQUET-979: Limit size of min, max or disable stats for long binary types
add f20fe7e PARQUET-1307: Fix memory-test for newer Arrow
add 129d845 PARQUET-1315: ColumnChunkMetaData.has_dictionary_page() should return…
add f38245b PARQUET-1340: Fix Travis Ci valgrind errors related to std::random_de…
add ea8798d PARQUET-1334: [C++] memory_map parameter seems missleading in parquet file opener
add 08ca177 PARQUET-1333: [C++] Reading of files with dictionary size 0 fails on Windows with bad_alloc
add 079ae70 PARQUET-1346: [C++] Protect against empty Arrow arrays with null values
add 630cf0a PARQUET-1350: [C++] Use abstract ResizableBuffer instead of concrete PoolBuffer
add fee8d70 PARQUET-1323: Fix compiler warnings on clang-6
add bd5243e PARQUET-1358: index_page_offset should be unset as it is not supported
add 0ccf832 PARQUET-1348: Add ability to write FileMetaData in arrow FileWriter
add 673ccfa PARQUET-1360: Use conforming API style, variable names in WriteFileMetaData functions
add 0e0f838 PARQUET-1227: Thrift crypto metadata structures
add 40b21b3 PARQUET-1357: FormatStatValue truncates binary statistics on zero character
add b6ad261 PARQUET-1366: [C++] Streamline use of Arrow's bit-util.h APIs
add ed7242e PARQUET-1301: [C++] Crypto package in parquet-cpp
add bdeed71 PARQUET-1332: Add bloom filter for parquet
add e26afc2 PARQUET-1378: Allow RowGroups with zero rows to be written
add 72795ef PARQUET-1308: [C++] Use Arrow thread pool, not Arrow ParallelFor, fix deprecated APIs, upgrade clang-format version. Fix record delimiting bug
add d146452 PARQUET-1382: [C++] Prepare for arrow::test namespace removal
add aa166ed PARQUET-1384: fix clang build error for bloom_filter-test.cc
add 41ae86d PARQUET-1256: Add --print-key-value-metadata option to parquet_reader tool
add cdf2e3f PARQUET-1276: [C++] Reduce the amount of memory used for writing null decimal values
add 1dffe22 PARQUET-1392: Read multiple RowGroups at once into an Arrow table
add 1463276 PARQUET-1372: Add an API to allow writing RowGroups based on size
add 9b4cd9c ARROW-3075: [C++] Incorporate parquet-cpp codebase into Arrow C++ build system. Add unit test label granularity options, ability to add component group targets like 'make parquet' that build libraries and tests
This update added new revisions after undoing existing revisions.
That is to say, some revisions that were in the old version of the
branch are not in the new version. This situation occurs
when a user --force pushes a change and generates a repository
containing something like this:
* -- * -- B -- O -- O -- O (17999a8)
           \
            N -- N -- N refs/heads/master (9b4cd9c)
You should already have received notification emails for all of the O
revisions, and so the following emails describe only the N revisions
from the common base, B.
Any revisions marked "omit" are not gone; other references still
refer to them. Any revisions marked "discard" are gone forever.
No revisions that are new to the repository were added by this update.
Summary of changes:
.gitmodules | 3 +
.travis.yml | 6 +-
appveyor.yml | 5 +-
ci/cpp-python-msvc-build.bat | 37 +-
ci/travis_before_script_cpp.sh | 4 +
ci/travis_env_common.sh | 4 +-
ci/travis_install_toolchain.sh | 4 -
ci/travis_script_python.sh | 4 +-
cpp/CMakeLists.txt | 25 +-
cpp/build-support/lint_cpp_cli.py | 44 +-
cpp/cmake_modules/BuildUtils.cmake | 58 +-
cpp/cmake_modules/SetupCxxFlags.cmake | 6 +-
cpp/cmake_modules/ThirdpartyToolchain.cmake | 60 +-
cpp/src/arrow/CMakeLists.txt | 10 +
cpp/src/arrow/dbi/hiveserver2/CMakeLists.txt | 10 +-
cpp/src/arrow/dbi/hiveserver2/sample-usage.cc | 2 +-
cpp/src/arrow/gpu/CMakeLists.txt | 6 +
cpp/src/arrow/io/file.cc | 2 +-
cpp/src/arrow/io/hdfs-internal.h | 2 +-
cpp/src/arrow/python/CMakeLists.txt | 14 +-
cpp/src/arrow/type.h | 3 -
cpp/src/arrow/util/io-util.cc | 2 +-
cpp/src/arrow/util/visibility.h | 2 +
cpp/src/arrow/{io => util}/windows_compatibility.h | 5 +-
cpp/src/parquet/.gitignore | 2 +
cpp/src/parquet/.parquetcppversion | 1 +
cpp/src/parquet/CMakeLists.txt | 291 +++
cpp/src/parquet/README | 10 +
.../src/parquet/api/CMakeLists.txt | 19 +-
.../windows_compatibility.h => parquet/api/io.h} | 22 +-
.../api/reader.h} | 29 +-
.../api/schema.h} | 22 +-
.../api/writer.h} | 25 +-
.../src/parquet/arrow/CMakeLists.txt | 23 +-
.../parquet/arrow/arrow-reader-writer-benchmark.cc | 263 +++
cpp/src/parquet/arrow/arrow-reader-writer-test.cc | 2376 ++++++++++++++++++++
cpp/src/parquet/arrow/arrow-schema-test.cc | 852 +++++++
cpp/src/parquet/arrow/reader.cc | 1559 +++++++++++++
cpp/src/parquet/arrow/reader.h | 307 +++
cpp/src/parquet/arrow/record_reader.cc | 818 +++++++
cpp/src/parquet/arrow/record_reader.h | 113 +
cpp/src/parquet/arrow/schema.cc | 704 ++++++
cpp/src/parquet/arrow/schema.h | 94 +
cpp/src/parquet/arrow/test-util.h | 527 +++++
cpp/src/parquet/arrow/writer.cc | 1152 ++++++++++
cpp/src/parquet/arrow/writer.h | 210 ++
cpp/src/parquet/bloom_filter-test.cc | 244 ++
cpp/src/parquet/bloom_filter.cc | 166 ++
cpp/src/parquet/bloom_filter.h | 245 ++
cpp/src/parquet/column-io-benchmark.cc | 237 ++
cpp/src/parquet/column_page.h | 173 ++
cpp/src/parquet/column_reader-test.cc | 390 ++++
cpp/src/parquet/column_reader.cc | 475 ++++
cpp/src/parquet/column_reader.h | 537 +++++
cpp/src/parquet/column_scanner-test.cc | 238 ++
cpp/src/parquet/column_scanner.cc | 91 +
cpp/src/parquet/column_scanner.h | 258 +++
cpp/src/parquet/column_writer-test.cc | 807 +++++++
cpp/src/parquet/column_writer.cc | 868 +++++++
cpp/src/parquet/column_writer.h | 330 +++
cpp/src/parquet/encoding-benchmark.cc | 166 ++
cpp/src/parquet/encoding-internal.h | 979 ++++++++
cpp/src/parquet/encoding-test.cc | 313 +++
cpp/src/parquet/encoding.h | 152 ++
cpp/src/parquet/exception.h | 92 +
cpp/src/parquet/file-deserialize-test.cc | 300 +++
cpp/src/parquet/file-serialize-test.cc | 310 +++
cpp/src/parquet/file_reader.cc | 376 ++++
cpp/src/parquet/file_reader.h | 143 ++
cpp/src/parquet/file_writer.cc | 420 ++++
cpp/src/parquet/file_writer.h | 220 ++
cpp/src/parquet/hasher.h | 75 +
cpp/src/parquet/metadata-test.cc | 231 ++
cpp/src/parquet/metadata.cc | 911 ++++++++
cpp/src/parquet/metadata.h | 279 +++
cpp/src/parquet/murmur3.cc | 222 ++
cpp/src/parquet/murmur3.h | 56 +
.../src/parquet/parquet.pc.in | 21 +-
cpp/src/parquet/parquet.thrift | 923 ++++++++
.../parquet_version.h.in} | 22 +-
cpp/src/parquet/printer.cc | 254 +++
cpp/src/parquet/printer.h | 50 +
cpp/src/parquet/properties-test.cc | 66 +
cpp/src/parquet/properties.h | 439 ++++
.../public-api-test.cc} | 37 +-
cpp/src/parquet/reader-test.cc | 325 +++
cpp/src/parquet/schema-internal.h | 82 +
cpp/src/parquet/schema-test.cc | 761 +++++++
cpp/src/parquet/schema.cc | 756 +++++++
cpp/src/parquet/schema.h | 452 ++++
cpp/src/parquet/statistics-test.cc | 782 +++++++
cpp/src/parquet/statistics.cc | 334 +++
cpp/src/parquet/statistics.h | 241 ++
.../src/parquet/symbols.map | 54 +-
cpp/src/parquet/test-specialization.h | 183 ++
cpp/src/parquet/test-util.h | 447 ++++
cpp/src/parquet/thrift.h | 162 ++
cpp/src/parquet/types-test.cc | 149 ++
cpp/src/parquet/types.cc | 295 +++
cpp/src/parquet/types.h | 316 +++
.../src/parquet/util/CMakeLists.txt | 21 +-
cpp/src/parquet/util/comparison-test.cc | 247 ++
cpp/src/parquet/util/comparison.cc | 112 +
cpp/src/parquet/util/comparison.h | 135 ++
cpp/src/parquet/util/crypto.cc | 369 +++
cpp/src/parquet/util/crypto.h | 46 +
.../util/macros.h} | 26 +-
cpp/src/parquet/util/memory-test.cc | 362 +++
cpp/src/parquet/util/memory.cc | 532 +++++
cpp/src/parquet/util/memory.h | 434 ++++
cpp/src/parquet/util/schema-util.h | 87 +
.../util/stopwatch.h} | 42 +-
cpp/src/parquet/util/test-common.h | 208 ++
cpp/src/{arrow => parquet}/util/visibility.h | 51 +-
.../io => parquet/util}/windows_compatibility.h | 22 +-
cpp/src/plasma/CMakeLists.txt | 8 +-
cpp/submodules/parquet-testing | 1 +
dev/release/rat_exclude_files.txt | 2 +
python/README.md | 1 -
python/doc/source/development.rst | 128 +-
python/manylinux1/Dockerfile-x86_64 | 19 +-
python/manylinux1/build_arrow.sh | 22 +-
.../manylinux1/scripts/check_arrow_visibility.sh | 2 +-
python/pyarrow/_parquet.pxd | 2 +-
python/pyarrow/_parquet.pyx | 17 +-
python/pyarrow/filesystem.py | 12 +-
python/pyarrow/parquet.py | 62 +-
python/pyarrow/tests/test_parquet.py | 10 +-
python/pyarrow/util.py | 10 +
python/testing/functions.sh | 27 +-
130 files changed, 29647 insertions(+), 562 deletions(-)
create mode 100644 .gitmodules
copy cpp/src/arrow/{io => util}/windows_compatibility.h (89%)
create mode 100644 cpp/src/parquet/.gitignore
create mode 100644 cpp/src/parquet/.parquetcppversion
create mode 100644 cpp/src/parquet/CMakeLists.txt
create mode 100644 cpp/src/parquet/README
copy python/manylinux1/scripts/check_arrow_visibility.sh => cpp/src/parquet/api/CMakeLists.txt (77%)
mode change 100755 => 100644
copy cpp/src/{arrow/io/windows_compatibility.h => parquet/api/io.h} (66%)
copy cpp/src/{arrow/io/windows_compatibility.h => parquet/api/reader.h} (67%)
copy cpp/src/{arrow/io/windows_compatibility.h => parquet/api/schema.h} (66%)
copy cpp/src/{arrow/io/windows_compatibility.h => parquet/api/writer.h} (66%)
copy python/manylinux1/scripts/check_arrow_visibility.sh => cpp/src/parquet/arrow/CMakeLists.txt (66%)
mode change 100755 => 100644
create mode 100644 cpp/src/parquet/arrow/arrow-reader-writer-benchmark.cc
create mode 100644 cpp/src/parquet/arrow/arrow-reader-writer-test.cc
create mode 100644 cpp/src/parquet/arrow/arrow-schema-test.cc
create mode 100644 cpp/src/parquet/arrow/reader.cc
create mode 100644 cpp/src/parquet/arrow/reader.h
create mode 100644 cpp/src/parquet/arrow/record_reader.cc
create mode 100644 cpp/src/parquet/arrow/record_reader.h
create mode 100644 cpp/src/parquet/arrow/schema.cc
create mode 100644 cpp/src/parquet/arrow/schema.h
create mode 100644 cpp/src/parquet/arrow/test-util.h
create mode 100644 cpp/src/parquet/arrow/writer.cc
create mode 100644 cpp/src/parquet/arrow/writer.h
create mode 100644 cpp/src/parquet/bloom_filter-test.cc
create mode 100644 cpp/src/parquet/bloom_filter.cc
create mode 100644 cpp/src/parquet/bloom_filter.h
create mode 100644 cpp/src/parquet/column-io-benchmark.cc
create mode 100644 cpp/src/parquet/column_page.h
create mode 100644 cpp/src/parquet/column_reader-test.cc
create mode 100644 cpp/src/parquet/column_reader.cc
create mode 100644 cpp/src/parquet/column_reader.h
create mode 100644 cpp/src/parquet/column_scanner-test.cc
create mode 100644 cpp/src/parquet/column_scanner.cc
create mode 100644 cpp/src/parquet/column_scanner.h
create mode 100644 cpp/src/parquet/column_writer-test.cc
create mode 100644 cpp/src/parquet/column_writer.cc
create mode 100644 cpp/src/parquet/column_writer.h
create mode 100644 cpp/src/parquet/encoding-benchmark.cc
create mode 100644 cpp/src/parquet/encoding-internal.h
create mode 100644 cpp/src/parquet/encoding-test.cc
create mode 100644 cpp/src/parquet/encoding.h
create mode 100644 cpp/src/parquet/exception.h
create mode 100644 cpp/src/parquet/file-deserialize-test.cc
create mode 100644 cpp/src/parquet/file-serialize-test.cc
create mode 100644 cpp/src/parquet/file_reader.cc
create mode 100644 cpp/src/parquet/file_reader.h
create mode 100644 cpp/src/parquet/file_writer.cc
create mode 100644 cpp/src/parquet/file_writer.h
create mode 100644 cpp/src/parquet/hasher.h
create mode 100644 cpp/src/parquet/metadata-test.cc
create mode 100644 cpp/src/parquet/metadata.cc
create mode 100644 cpp/src/parquet/metadata.h
create mode 100644 cpp/src/parquet/murmur3.cc
create mode 100644 cpp/src/parquet/murmur3.h
copy python/manylinux1/scripts/check_arrow_visibility.sh => cpp/src/parquet/parquet.pc.in (67%)
mode change 100755 => 100644
create mode 100644 cpp/src/parquet/parquet.thrift
copy cpp/src/{arrow/io/windows_compatibility.h => parquet/parquet_version.h.in} (66%)
create mode 100644 cpp/src/parquet/printer.cc
create mode 100644 cpp/src/parquet/printer.h
create mode 100644 cpp/src/parquet/properties-test.cc
create mode 100644 cpp/src/parquet/properties.h
copy cpp/src/{arrow/io/windows_compatibility.h => parquet/public-api-test.cc} (51%)
create mode 100644 cpp/src/parquet/reader-test.cc
create mode 100644 cpp/src/parquet/schema-internal.h
create mode 100644 cpp/src/parquet/schema-test.cc
create mode 100644 cpp/src/parquet/schema.cc
create mode 100644 cpp/src/parquet/schema.h
create mode 100644 cpp/src/parquet/statistics-test.cc
create mode 100644 cpp/src/parquet/statistics.cc
create mode 100644 cpp/src/parquet/statistics.h
rename ci/travis_build_parquet_cpp.sh => cpp/src/parquet/symbols.map (53%)
mode change 100755 => 100644
create mode 100644 cpp/src/parquet/test-specialization.h
create mode 100644 cpp/src/parquet/test-util.h
create mode 100644 cpp/src/parquet/thrift.h
create mode 100644 cpp/src/parquet/types-test.cc
create mode 100644 cpp/src/parquet/types.cc
create mode 100644 cpp/src/parquet/types.h
copy python/manylinux1/scripts/check_arrow_visibility.sh => cpp/src/parquet/util/CMakeLists.txt (77%)
mode change 100755 => 100644
create mode 100644 cpp/src/parquet/util/comparison-test.cc
create mode 100644 cpp/src/parquet/util/comparison.cc
create mode 100644 cpp/src/parquet/util/comparison.h
create mode 100644 cpp/src/parquet/util/crypto.cc
create mode 100644 cpp/src/parquet/util/crypto.h
copy cpp/src/{arrow/io/windows_compatibility.h => parquet/util/macros.h} (66%)
create mode 100644 cpp/src/parquet/util/memory-test.cc
create mode 100644 cpp/src/parquet/util/memory.cc
create mode 100644 cpp/src/parquet/util/memory.h
create mode 100644 cpp/src/parquet/util/schema-util.h
copy cpp/src/{arrow/io/windows_compatibility.h => parquet/util/stopwatch.h} (57%)
create mode 100644 cpp/src/parquet/util/test-common.h
copy cpp/src/{arrow => parquet}/util/visibility.h (52%)
rename cpp/src/{arrow/io => parquet/util}/windows_compatibility.h (68%)
create mode 160000 cpp/submodules/parquet-testing