You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@accumulo.apache.org by kt...@apache.org on 2019/07/24 15:19:45 UTC
[accumulo-testing] 01/01: Improve bulk CI docs
This is an automated email from the ASF dual-hosted git repository.
kturner pushed a commit to branch keith-turner-patch-1
in repository https://gitbox.apache.org/repos/asf/accumulo-testing.git
commit c50bd97f90f54bf61ed3f42b4bd32d363126e6dc
Author: Keith Turner <kt...@apache.org>
AuthorDate: Wed Jul 24 11:19:38 2019 -0400
Improve bulk CI docs
---
docs/bulk-test.md | 9 +++++++++
1 file changed, 9 insertions(+)
diff --git a/docs/bulk-test.md b/docs/bulk-test.md
index 17076e7..071cce8 100644
--- a/docs/bulk-test.md
+++ b/docs/bulk-test.md
@@ -30,6 +30,9 @@ for i in $(seq 1 10); do
./bin/cingest bulk /tmp/bt/$i
done
+# Optionally, copy data before importing. This can be useful in debugging problems.
+hadoop distcp hdfs://$NAMENODE/tmp/bt hdfs://$NAMENODE/tmp/bt-copy
+
for i in $(seq 1 10); do
(
echo table ci
@@ -53,6 +56,12 @@ scan -t accumulo.metadata -b ~blip -e ~blip~
scan -t accumulo.metadata -c loaded
```
+Additionally, check that no rfiles exist in the source dir.
+
+```bash
+hadoop fs -ls -R /tmp/bt | grep rf
+```
+
The referenced counts output by `cingest verify` should equal :
```