You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@datasketches.apache.org by le...@apache.org on 2020/01/27 01:37:23 UTC

[incubator-datasketches-characterization] branch master updated: Update CPC Merge Speed and SerDe jobs.

This is an automated email from the ASF dual-hosted git repository.

leerho pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/incubator-datasketches-characterization.git


The following commit(s) were added to refs/heads/master by this push:
     new e48b5cf  Update CPC Merge Speed and SerDe jobs.
e48b5cf is described below

commit e48b5cfbf933161583db3feabef03d1929bfd72c
Author: Lee Rhodes <le...@users.noreply.github.com>
AuthorDate: Sun Jan 26 17:37:13 2020 -0800

    Update CPC Merge Speed and SerDe jobs.
---
 .../datasketches/characterization/cpc/CpcSerDeProfile.java     |  1 +
 src/main/resources/cpc/CpcSerDeJob.conf                        |  4 +++-
 src/main/resources/cpc/CpcUnionUpdateSpeedJob.conf             |  8 ++++----
 src/main/resources/hll/HllSerDeJob.conf                        | 10 +++++-----
 4 files changed, 13 insertions(+), 10 deletions(-)

diff --git a/src/main/java/org/apache/datasketches/characterization/cpc/CpcSerDeProfile.java b/src/main/java/org/apache/datasketches/characterization/cpc/CpcSerDeProfile.java
index a7c67bf..92b09ae 100644
--- a/src/main/java/org/apache/datasketches/characterization/cpc/CpcSerDeProfile.java
+++ b/src/main/java/org/apache/datasketches/characterization/cpc/CpcSerDeProfile.java
@@ -61,6 +61,7 @@ public class CpcSerDeProfile extends BaseSerDeProfile {
 
     stats.serializeTime_nS = stopSerTime_nS - startSerTime_nS;
     stats.deserializeTime_nS = stopDeserTime_nS - startDeserTime_nS;
+    stats.size_bytes = byteArr.length;
   }
 
 }
diff --git a/src/main/resources/cpc/CpcSerDeJob.conf b/src/main/resources/cpc/CpcSerDeJob.conf
index 5e98681..60147d7 100644
--- a/src/main/resources/cpc/CpcSerDeJob.conf
+++ b/src/main/resources/cpc/CpcSerDeJob.conf
@@ -27,7 +27,7 @@ Trials_lgMaxT=16  #Max trials at start (low counts)
 Trials_lgMinT=7  #Min trials at tail (high counts) 
 
 #Trials Speed related
-Trials_lgMinBpU=0   #start the downward slope of trials at this LgU
+Trials_lgMinBpU=4   #start the downward slope of trials at this LgU
 Trials_lgMaxBpU=20  #stop the downward slope of trials at this LgU
 
 # Date-Time Profile
@@ -39,3 +39,5 @@ ReadableDateFormat=yyyy/MM/dd HH:mm:ss z
 #Job Profile
 JobProfile=org.apache.datasketches.characterization.cpc.CpcSerDeProfile
 LgK=11
+# CPC is always serialized in compact (compressed) form.
+# CPC is always deserialized on the heap.
diff --git a/src/main/resources/cpc/CpcUnionUpdateSpeedJob.conf b/src/main/resources/cpc/CpcUnionUpdateSpeedJob.conf
index 3b36faa..e7e7e13 100644
--- a/src/main/resources/cpc/CpcUnionUpdateSpeedJob.conf
+++ b/src/main/resources/cpc/CpcUnionUpdateSpeedJob.conf
@@ -19,16 +19,16 @@
 
 #Uniques Profile
 Trials_lgMinU=0  #The starting # of uniques that is printed at the end.
-Trials_lgMaxU=26 #How high the # uniques go
+Trials_lgMaxU=24 #How high the # uniques go
 Trials_UPPO=16   #The horizontal x-resolution of trials points
 
 # Trials Profile
-Trials_lgMaxT=16 #Max trials at start (low counts)
-Trials_lgMinT=8  #Min trials at tail (high counts) 
+Trials_lgMaxT=14 #Max trials at start (low counts)
+Trials_lgMinT=5  #Min trials at tail (high counts) 
 
 #Trials Speed related
 Trials_lgMinBpU=0  #start the downward slope of trials at this LgU
-Trials_lgMaxBpU=26  #stop the downward slope of trials at this LgU
+Trials_lgMaxBpU=24  #stop the downward slope of trials at this LgU
 
 # Date-Time Profile
 TimeZone=PST
diff --git a/src/main/resources/hll/HllSerDeJob.conf b/src/main/resources/hll/HllSerDeJob.conf
index 9a4adcf..9fa7aab 100644
--- a/src/main/resources/hll/HllSerDeJob.conf
+++ b/src/main/resources/hll/HllSerDeJob.conf
@@ -19,11 +19,11 @@
 
 #Uniques Profile
 Trials_lgMinU=0  #The starting # of uniques that is printed at the end.
-Trials_lgMaxU=24 #How high the # uniques go
+Trials_lgMaxU=20 #How high the # uniques go
 Trials_UPPO=2    #The horizontal x-resolution of trial points, Points Per Octave
 
 # Trials Profile
-Trials_lgMaxT=20  #Max trials at start (low counts)
+Trials_lgMaxT=16  #Max trials at start (low counts)
 Trials_lgMinT=7  #Min trials at tail (high counts) 
 
 #Trials Speed related
@@ -38,9 +38,9 @@ ReadableDateFormat=yyyy/MM/dd HH:mm:ss z
 
 #Job Profile
 JobProfile=org.apache.datasketches.characterization.hll.HllSerDeProfile
-LgK=20
+LgK=12
 HLL_tgtHllType=HLL4
 HLL_direct=false
 HLL_useComposite=false
-HLL_compact=false
-HLL_wrap=true
+HLL_compact=false #whether the serialization is compact or updatable form
+HLL_wrap=true     #whether the deserialize operation is wrap or heapify


---------------------------------------------------------------------
To unsubscribe, e-mail: commits-unsubscribe@datasketches.apache.org
For additional commands, e-mail: commits-help@datasketches.apache.org