You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@impala.apache.org by st...@apache.org on 2019/08/19 16:08:41 UTC

[impala] 03/03: IMPALA-8683: Document parquet/lz4 compression codec

This is an automated email from the ASF dual-hosted git repository.

stigahuang pushed a commit to branch branch-3.3.0
in repository https://gitbox.apache.org/repos/asf/impala.git

commit 0f840c5a0f5e673c67cbd482e62065fd47b98e1a
Author: Abhishek Rawat <ar...@cloudera.com>
AuthorDate: Sun Aug 18 22:07:45 2019 -0700

    IMPALA-8683: Document parquet/lz4 compression codec
    
    Document lz4 compression codec for parquet.
    
    Change-Id: I304274842c8494a021816d68bc5d81810c353146
    Reviewed-on: http://gerrit.cloudera.org:8080/14093
    Tested-by: Impala Public Jenkins <im...@cloudera.com>
    Reviewed-by: Quanlong Huang <hu...@gmail.com>
---
 docs/topics/impala_compression_codec.xml | 6 +++++-
 docs/topics/impala_file_formats.xml      | 7 ++++++-
 docs/topics/impala_parquet.xml           | 8 ++++----
 3 files changed, 15 insertions(+), 6 deletions(-)

diff --git a/docs/topics/impala_compression_codec.xml b/docs/topics/impala_compression_codec.xml
index 8808bb7..1863aff 100644
--- a/docs/topics/impala_compression_codec.xml
+++ b/docs/topics/impala_compression_codec.xml
@@ -32,6 +32,7 @@ under the License.
       <data name="Category" value="Snappy"/>
       <data name="Category" value="Gzip"/>
       <data name="Category" value="Zstd"/>
+      <data name="Category" value="Lz4"/>
       <data name="Category" value="Developers"/>
       <data name="Category" value="Data Analysts"/>
     </metadata>
@@ -63,7 +64,7 @@ SET COMPRESSION_CODEC=<varname>codec_name</varname>:<varname>compression_level</
 
     <p>
       The allowed values for this query option are <codeph>SNAPPY</codeph> (the default), <codeph>GZIP</codeph>,
-      <codeph>ZSTD</codeph>, and <codeph>NONE</codeph>.
+      <codeph>ZSTD</codeph>, <codeph>LZ4</codeph>, and <codeph>NONE</codeph>.
     </p>
 
     <p>
@@ -103,6 +104,9 @@ SET COMPRESSION_CODEC=<varname>codec_name</varname>:<varname>compression_level</
     <p conref="../shared/impala_common.xml#common/example_blurb"/>
 
 <codeblock>
+set compression_codec=lz4;
+insert into parquet_table_lz4_compressed select * from t1;
+
 set compression_codec=zstd; // Default compression level 3.
 insert into parquet_table_zstd_default_compressed select * from t1;
 
diff --git a/docs/topics/impala_file_formats.xml b/docs/topics/impala_file_formats.xml
index a8e961a..338f45b 100644
--- a/docs/topics/impala_file_formats.xml
+++ b/docs/topics/impala_file_formats.xml
@@ -106,7 +106,7 @@ under the License.
             <entry>
               Structured
             </entry>
-            <entry> Snappy, gzip, zstd; currently Snappy by default </entry>
+            <entry> Snappy, gzip, zstd, lz4; currently Snappy by default </entry>
             <entry>
               Yes.
             </entry>
@@ -317,6 +317,11 @@ under the License.
         <dt>Zstd</dt>
         <dd>For Parquet files only.</dd>
       </dlentry>
+
+      <dlentry>
+        <dt>Lz4</dt>
+        <dd>For Parquet files only.</dd>
+      </dlentry>
     </dl>
 
   </conbody>
diff --git a/docs/topics/impala_parquet.xml b/docs/topics/impala_parquet.xml
index d4cdba7..8148973 100644
--- a/docs/topics/impala_parquet.xml
+++ b/docs/topics/impala_parquet.xml
@@ -452,10 +452,10 @@ under the License.
         underlying compression is controlled by the <codeph>COMPRESSION_CODEC</codeph> query
         option. (Prior to Impala 2.0, the query option name was
         <codeph>PARQUET_COMPRESSION_CODEC</codeph>.) The allowed values for this query option
-        are <codeph>snappy</codeph> (the default), <codeph>gzip</codeph>, <codeph>zstd</codeph>
-        and <codeph>none</codeph>. The option value is not case-sensitive. If the option is set
-        to an unrecognized value, all kinds of queries will fail due to the invalid option
-        setting, not just queries involving Parquet tables.
+        are <codeph>snappy</codeph> (the default), <codeph>gzip</codeph>, <codeph>zstd</codeph>,
+        <codeph>lz4</codeph>, and <codeph>none</codeph>. The option value is not case-sensitive.
+        If the option is set to an unrecognized value, all kinds of queries will fail due to
+        the invalid option setting, not just queries involving Parquet tables.
       </p>
 
     </conbody>