You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@datasketches.apache.org by le...@apache.org on 2020/01/27 01:37:23 UTC
[incubator-datasketches-characterization] branch master updated:
Update CPC Merge Speed and SerDe jobs.
This is an automated email from the ASF dual-hosted git repository.
leerho pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/incubator-datasketches-characterization.git
The following commit(s) were added to refs/heads/master by this push:
new e48b5cf Update CPC Merge Speed and SerDe jobs.
e48b5cf is described below
commit e48b5cfbf933161583db3feabef03d1929bfd72c
Author: Lee Rhodes <le...@users.noreply.github.com>
AuthorDate: Sun Jan 26 17:37:13 2020 -0800
Update CPC Merge Speed and SerDe jobs.
---
.../datasketches/characterization/cpc/CpcSerDeProfile.java | 1 +
src/main/resources/cpc/CpcSerDeJob.conf | 4 +++-
src/main/resources/cpc/CpcUnionUpdateSpeedJob.conf | 8 ++++----
src/main/resources/hll/HllSerDeJob.conf | 10 +++++-----
4 files changed, 13 insertions(+), 10 deletions(-)
diff --git a/src/main/java/org/apache/datasketches/characterization/cpc/CpcSerDeProfile.java b/src/main/java/org/apache/datasketches/characterization/cpc/CpcSerDeProfile.java
index a7c67bf..92b09ae 100644
--- a/src/main/java/org/apache/datasketches/characterization/cpc/CpcSerDeProfile.java
+++ b/src/main/java/org/apache/datasketches/characterization/cpc/CpcSerDeProfile.java
@@ -61,6 +61,7 @@ public class CpcSerDeProfile extends BaseSerDeProfile {
stats.serializeTime_nS = stopSerTime_nS - startSerTime_nS;
stats.deserializeTime_nS = stopDeserTime_nS - startDeserTime_nS;
+ stats.size_bytes = byteArr.length;
}
}
diff --git a/src/main/resources/cpc/CpcSerDeJob.conf b/src/main/resources/cpc/CpcSerDeJob.conf
index 5e98681..60147d7 100644
--- a/src/main/resources/cpc/CpcSerDeJob.conf
+++ b/src/main/resources/cpc/CpcSerDeJob.conf
@@ -27,7 +27,7 @@ Trials_lgMaxT=16 #Max trials at start (low counts)
Trials_lgMinT=7 #Min trials at tail (high counts)
#Trials Speed related
-Trials_lgMinBpU=0 #start the downward slope of trials at this LgU
+Trials_lgMinBpU=4 #start the downward slope of trials at this LgU
Trials_lgMaxBpU=20 #stop the downward slope of trials at this LgU
# Date-Time Profile
@@ -39,3 +39,5 @@ ReadableDateFormat=yyyy/MM/dd HH:mm:ss z
#Job Profile
JobProfile=org.apache.datasketches.characterization.cpc.CpcSerDeProfile
LgK=11
+# CPC is always serialized in compact (compressed) form.
+# CPC is always deserialized on the heap.
diff --git a/src/main/resources/cpc/CpcUnionUpdateSpeedJob.conf b/src/main/resources/cpc/CpcUnionUpdateSpeedJob.conf
index 3b36faa..e7e7e13 100644
--- a/src/main/resources/cpc/CpcUnionUpdateSpeedJob.conf
+++ b/src/main/resources/cpc/CpcUnionUpdateSpeedJob.conf
@@ -19,16 +19,16 @@
#Uniques Profile
Trials_lgMinU=0 #The starting # of uniques that is printed at the end.
-Trials_lgMaxU=26 #How high the # uniques go
+Trials_lgMaxU=24 #How high the # uniques go
Trials_UPPO=16 #The horizontal x-resolution of trials points
# Trials Profile
-Trials_lgMaxT=16 #Max trials at start (low counts)
-Trials_lgMinT=8 #Min trials at tail (high counts)
+Trials_lgMaxT=14 #Max trials at start (low counts)
+Trials_lgMinT=5 #Min trials at tail (high counts)
#Trials Speed related
Trials_lgMinBpU=0 #start the downward slope of trials at this LgU
-Trials_lgMaxBpU=26 #stop the downward slope of trials at this LgU
+Trials_lgMaxBpU=24 #stop the downward slope of trials at this LgU
# Date-Time Profile
TimeZone=PST
diff --git a/src/main/resources/hll/HllSerDeJob.conf b/src/main/resources/hll/HllSerDeJob.conf
index 9a4adcf..9fa7aab 100644
--- a/src/main/resources/hll/HllSerDeJob.conf
+++ b/src/main/resources/hll/HllSerDeJob.conf
@@ -19,11 +19,11 @@
#Uniques Profile
Trials_lgMinU=0 #The starting # of uniques that is printed at the end.
-Trials_lgMaxU=24 #How high the # uniques go
+Trials_lgMaxU=20 #How high the # uniques go
Trials_UPPO=2 #The horizontal x-resolution of trial points, Points Per Octave
# Trials Profile
-Trials_lgMaxT=20 #Max trials at start (low counts)
+Trials_lgMaxT=16 #Max trials at start (low counts)
Trials_lgMinT=7 #Min trials at tail (high counts)
#Trials Speed related
@@ -38,9 +38,9 @@ ReadableDateFormat=yyyy/MM/dd HH:mm:ss z
#Job Profile
JobProfile=org.apache.datasketches.characterization.hll.HllSerDeProfile
-LgK=20
+LgK=12
HLL_tgtHllType=HLL4
HLL_direct=false
HLL_useComposite=false
-HLL_compact=false
-HLL_wrap=true
+HLL_compact=false #whether the serialization is compact or updatable form
+HLL_wrap=true #whether the deserialize operation is wrap or heapify
---------------------------------------------------------------------
To unsubscribe, e-mail: commits-unsubscribe@datasketches.apache.org
For additional commands, e-mail: commits-help@datasketches.apache.org