You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@ambari.apache.org by ab...@apache.org on 2017/07/05 11:05:56 UTC

[02/15] ambari git commit: AMBARI-21377: Add HiveVectorizedORC and JDBC profiles to pxf-profiles.xml

AMBARI-21377: Add HiveVectorizedORC and JDBC profiles to pxf-profiles.xml


Project: http://git-wip-us.apache.org/repos/asf/ambari/repo
Commit: http://git-wip-us.apache.org/repos/asf/ambari/commit/9a17ca78
Tree: http://git-wip-us.apache.org/repos/asf/ambari/tree/9a17ca78
Diff: http://git-wip-us.apache.org/repos/asf/ambari/diff/9a17ca78

Branch: refs/heads/branch-feature-logsearch-ui
Commit: 9a17ca78d9c4e4e09123f1640b8f521f246a8b5f
Parents: d0f12bf
Author: lavjain <lj...@pivotal.io>
Authored: Fri Jun 30 12:34:45 2017 -0700
Committer: lavjain <lj...@pivotal.io>
Committed: Fri Jun 30 12:34:45 2017 -0700

----------------------------------------------------------------------
 .../PXF/3.0.0/configuration/pxf-profiles.xml    | 25 ++++++++++++++++++++
 1 file changed, 25 insertions(+)
----------------------------------------------------------------------


http://git-wip-us.apache.org/repos/asf/ambari/blob/9a17ca78/ambari-server/src/main/resources/common-services/PXF/3.0.0/configuration/pxf-profiles.xml
----------------------------------------------------------------------
diff --git a/ambari-server/src/main/resources/common-services/PXF/3.0.0/configuration/pxf-profiles.xml b/ambari-server/src/main/resources/common-services/PXF/3.0.0/configuration/pxf-profiles.xml
index e0a9029..27473a1 100644
--- a/ambari-server/src/main/resources/common-services/PXF/3.0.0/configuration/pxf-profiles.xml
+++ b/ambari-server/src/main/resources/common-services/PXF/3.0.0/configuration/pxf-profiles.xml
@@ -88,6 +88,7 @@ under the License.
         <name>HiveRC</name>
         <description>This profile is suitable only for Hive tables stored in RC files
             and serialized with either the ColumnarSerDe or the LazyBinaryColumnarSerDe.
+            It is much faster than the general purpose Hive profile.
             DELIMITER parameter is mandatory.
             Supports both GPDBWritable and TEXT output formats, as specified in FORMAT header parameter.
             Primary optimized for TEXT output format.
@@ -103,6 +104,7 @@ under the License.
     <profile>
         <name>HiveText</name>
         <description>This profile is suitable only for Hive tables stored as Text files.
+            It is much faster than the general purpose Hive profile.
             DELIMITER parameter is mandatory.
             Supports both GPDBWritable and TEXT output formats, as specified in FORMAT header parameter.
             Primary optimized for TEXT output format.
@@ -119,6 +121,7 @@ under the License.
         <name>HiveORC</name>
         <description>This profile is suitable only for Hive tables stored in ORC files
             and serialized with either the ColumnarSerDe or the LazyBinaryColumnarSerDe.
+            It is much faster than the general purpose Hive profile.
             Supports GPDBWritable output format, as specified in FORMAT header parameter.
         </description>
         <plugins>
@@ -130,6 +133,19 @@ under the License.
         </plugins>
     </profile>
     <profile>
+        <name>HiveVectorizedORC</name>
+        <description>This profile is the same as the HiveORC profile, but operates on batches of rows
+            instead of one row at a time, leading to faster reading and resolution phases.
+        </description>
+        <plugins>
+            <fragmenter>org.apache.hawq.pxf.plugins.hive.HiveInputFormatFragmenter</fragmenter>
+            <accessor>org.apache.hawq.pxf.plugins.hive.HiveORCVectorizedAccessor</accessor>
+            <resolver>org.apache.hawq.pxf.plugins.hive.HiveORCVectorizedResolver</resolver>
+            <metadata>org.apache.hawq.pxf.plugins.hive.HiveMetadataFetcher</metadata>
+            <outputFormat>org.apache.hawq.pxf.service.io.GPDBWritable</outputFormat>
+        </plugins>
+    </profile>
+    <profile>
         <name>HdfsTextSimple</name>
         <description>This profile is suitable for using when reading delimited single line records from plain text files
             on HDFS
@@ -194,6 +210,15 @@ under the License.
             <resolver>org.apache.hawq.pxf.plugins.json.JsonResolver</resolver>
         </plugins>
     </profile>
+    <profile>
+        <name>Jdbc</name>
+        <description>A profile for reading data into HAWQ via JDBC</description>
+        <plugins>
+            <fragmenter>org.apache.hawq.pxf.plugins.jdbc.JdbcPartitionFragmenter</fragmenter>
+            <accessor>org.apache.hawq.pxf.plugins.jdbc.JdbcReadAccessor</accessor>
+            <resolver>org.apache.hawq.pxf.plugins.jdbc.JdbcReadResolver</resolver>
+        </plugins>
+    </profile>
 </profiles>
     ]]></value>
     <value-attributes>