You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@bigtop.apache.org by el...@apache.org on 2022/03/08 06:44:23 UTC

[bigtop] branch master updated: BIGTOP-3650: Improve Hive's Debian packaging (#871)

This is an automated email from the ASF dual-hosted git repository.

elukey pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/bigtop.git


The following commit(s) were added to refs/heads/master by this push:
     new d7546d9  BIGTOP-3650: Improve Hive's Debian packaging (#871)
d7546d9 is described below

commit d7546d9bf4f52fea8db6251f31391d7397fbd471
Author: Luca Toscano <el...@users.noreply.github.com>
AuthorDate: Tue Mar 8 07:44:13 2022 +0100

    BIGTOP-3650: Improve Hive's Debian packaging (#871)
    
    Raised compat to '12' and followed some suggestions from Lintian.
---
 bigtop-packages/src/deb/hive/compat  |  2 +-
 bigtop-packages/src/deb/hive/control | 47 +++++++++++++++++++++---------------
 bigtop-packages/src/deb/hive/rules   |  7 ++++++
 bigtop.bom                           |  4 +--
 4 files changed, 37 insertions(+), 23 deletions(-)

diff --git a/bigtop-packages/src/deb/hive/compat b/bigtop-packages/src/deb/hive/compat
index ec63514..48082f7 100644
--- a/bigtop-packages/src/deb/hive/compat
+++ b/bigtop-packages/src/deb/hive/compat
@@ -1 +1 @@
-9
+12
diff --git a/bigtop-packages/src/deb/hive/control b/bigtop-packages/src/deb/hive/control
index 8a93542..9a83ae5 100644
--- a/bigtop-packages/src/deb/hive/control
+++ b/bigtop-packages/src/deb/hive/control
@@ -15,7 +15,7 @@
 
 Source: hive
 Section: misc
-Priority: extra
+Priority: optional
 Maintainer: Bigtop <de...@bigtop.apache.org>
 Build-Depends: debhelper (>= 7.0.50~)
 Standards-Version: 3.9.4
@@ -24,34 +24,39 @@ Homepage: http://hive.apache.org/
 
 Package: hive
 Architecture: all
-Depends: adduser, hadoop-client, bigtop-utils (>= 0.7), zookeeper, hive-jdbc (= ${source:Version}), python
-Description: Hive is a data warehouse infrastructure built on top of Hadoop
+Depends: adduser, hadoop-client, bigtop-utils (>= 0.7), zookeeper,
+         hive-jdbc (= ${source:Version}), python
+Description: Data warehouse infrastructure built on top of Hadoop
  Hive is a data warehouse infrastructure built on top of Hadoop that provides
  tools to enable easy data summarization, adhoc querying and analysis of large
  datasets data stored in Hadoop files. It provides a mechanism to put structure
  on this data and it also provides a simple query language called Hive QL which
  is based on SQL and which enables users familiar with SQL to query this data.
  At the same time, this language also allows traditional map/reduce programmers
- to be able to plug in their custom mappers and reducers to do more sophisticated 
- analysis which may not be supported by the built-in capabilities of the language.
+ to be able to plug in their custom mappers and reducers to do more
+ sophisticated analysis which may not be supported by the built-in
+ capabilities of the language.
 
 Package: hive-server2
 Architecture: all
-Depends: hive (= ${source:Version})
+Depends: hive (= ${source:Version}), lsb-base
 Description: Provides a Hive Thrift service with improved concurrency support.
- This optional package hosts a Thrift server for Hive clients across a network to use, with improved concurrency support.
+ This optional package hosts a Thrift server for Hive clients across a network
+ to use, with improved concurrency support.
 
 Package: hive-metastore
 Architecture: all
-Depends: hive (= ${source:Version})
+Depends: hive (= ${source:Version}), lsb-base
 Description: Shared metadata repository for Hive.
- This optional package hosts a metadata server for Hive clients across a network to use.
+ This optional package hosts a metadata server for Hive clients across
+ a network to use.
 
 Package: hive-hbase
 Architecture: all
 Depends: hive (= ${source:Version}), hbase
 Description: Provides integration between Apache HBase and Apache Hive
- This optional package provides integration between Apache HBase and Apache Hive
+ This optional package provides integration between Apache HBase and
+ Apache Hive
 
 Package: hive-jdbc
 Architecture: all
@@ -62,27 +67,29 @@ Description: Provides libraries necessary to connect to Apache Hive via JDBC
 Package: hive-hcatalog
 Architecture: all
 Depends: hadoop, hive, bigtop-utils (>= 0.6), python
-Description: Apache Hcatalog is a data warehouse infrastructure built on top of Hadoop
- Apache HCatalog is a table and storage management service for data created using Apache Hadoop.
+Description: Table and storage management service for Apache Hadoop.
  This includes:
    * Providing a shared schema and data type mechanism.
-   * Providing a table abstraction so that users need not be concerned with where or how their data is stored.
-   * Providing interoperability across data processing tools such as Pig, Map Reduce, Streaming, and Hive.
+   * Providing a table abstraction so that users need not be concerned
+     with where or how their data is stored.
+   * Providing interoperability across data processing tools such
+     as Pig, Map Reduce, Streaming, and Hive.
 
 Package: hive-hcatalog-server
 Architecture: all
-Depends: hive-hcatalog (= ${source:Version})
+Depends: hive-hcatalog (= ${source:Version}), lsb-base
 Description: Init scripts for HCatalog server
- Init scripts for HCatalog server
+ This package includes init scripts to support the HCatalog server.
 
 Package: hive-webhcat
 Architecture: all
 Depends: hive-hcatalog (= ${source:Version})
-Description: WebHcat provides a REST-like web API for HCatalog and related Hadoop components.
- WebHcat provides a REST-like web API for HCatalog and related Hadoop components.
+Description: A REST-like web API for HCatalog and related Hadoop components.
+ WebHcat provides a REST-like web API for HCatalog
+ and related Hadoop components.
 
 Package: hive-webhcat-server
 Architecture: all
-Depends: hive-webhcat (= ${source:Version})
+Depends: hive-webhcat (= ${source:Version}), lsb-base
 Description: Init scripts for WebHcat server
- Init scripts for WebHcat server.
+ This package includes init scripts to support the WebHcat server.
diff --git a/bigtop-packages/src/deb/hive/rules b/bigtop-packages/src/deb/hive/rules
index 3a89344..72a020d 100755
--- a/bigtop-packages/src/deb/hive/rules
+++ b/bigtop-packages/src/deb/hive/rules
@@ -40,6 +40,13 @@ override_dh_auto_build:
 server2 metastore hcatalog-server webhcat-server:
 	bash debian/init.d.tmpl debian/hive-$@.svc deb debian/${hive_pkg_name}-$@.init
 
+override_dh_strip_nondeterminism:
+	# dh_strip_nondeterminism is part of https://wiki.debian.org/ReproducibleBuilds
+	# It is disabled here (empty override) because, due to some big jars,
+	# it makes the build 4-5x slower than a normal build. The aim of the
+	# project is really valuable, so we should re-enable this step in the
+	# future, but for now it is better to focus on the rest of the packaging.
+
 override_dh_auto_install: server2 metastore hcatalog-server webhcat-server
 	cp debian/hive-site.xml .
 	cp debian/hive.1 .
diff --git a/bigtop.bom b/bigtop.bom
index 3eda953..5fd845e 100644
--- a/bigtop.bom
+++ b/bigtop.bom
@@ -44,7 +44,7 @@
      APACHE_MIRROR = "https://apache.osuosl.org"
      APACHE_ARCHIVE = "https://archive.apache.org/dist"
    }
-   git { // *optional* This is a global setting to access protected git repositories, 
+   git { // *optional* This is a global setting to access protected git repositories,
          //            can be specified per component as well
      user = "john_doe"
      token = "john's access token"
@@ -166,7 +166,7 @@ bigtop {
     'hive' {
       name    = 'hive'
       relNotes = 'Apache Hive'
-      version { base = '3.1.2'; pkg = base; release = 2 }
+      version { base = '3.1.2'; pkg = base; release = 3 }
       tarball { destination = "apache-${name}-${version.base}-src.tar.gz"
                 source      = destination }
       url     { download_path = "/$name/$name-${version.base}/"