You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@accumulo.apache.org by kt...@apache.org on 2019/07/24 15:19:45 UTC

[accumulo-testing] 01/01: Improve bulk CI docs

This is an automated email from the ASF dual-hosted git repository.

kturner pushed a commit to branch keith-turner-patch-1
in repository https://gitbox.apache.org/repos/asf/accumulo-testing.git

commit c50bd97f90f54bf61ed3f42b4bd32d363126e6dc
Author: Keith Turner <kt...@apache.org>
AuthorDate: Wed Jul 24 11:19:38 2019 -0400

    Improve bulk CI docs
---
 docs/bulk-test.md | 9 +++++++++
 1 file changed, 9 insertions(+)

diff --git a/docs/bulk-test.md b/docs/bulk-test.md
index 17076e7..071cce8 100644
--- a/docs/bulk-test.md
+++ b/docs/bulk-test.md
@@ -30,6 +30,9 @@ for i in $(seq 1 10); do
   ./bin/cingest bulk /tmp/bt/$i
 done
 
+# Optionally, copy data before importing.  This can be useful in debugging problems.
+hadoop distcp hdfs://$NAMENODE/tmp/bt hdfs://$NAMENODE/tmp/bt-copy
+
 for i in $(seq 1 10); do
   (
     echo table ci
@@ -53,6 +56,12 @@ scan -t accumulo.metadata -b ~blip -e ~blip~
 scan -t accumulo.metadata -c loaded
 ```
 
+Additionally, check that no rfiles exist in the source dir.
+
+```bash
+hadoop fs -ls -R /tmp/bt | grep rf
+```
+
 The referenced counts output by `cingest verify` should equal :
 
 ```