You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@hbase.apache.org by mi...@apache.org on 2016/02/06 02:34:14 UTC

[03/17] hbase-site git commit: Published site at 9c832109458ced70d0db701e7f58ef41b1df0fc7.

http://git-wip-us.apache.org/repos/asf/hbase-site/blob/9bc06f81/xref/org/apache/hadoop/hbase/mapreduce/ImportTsv.html
----------------------------------------------------------------------
diff --git a/xref/org/apache/hadoop/hbase/mapreduce/ImportTsv.html b/xref/org/apache/hadoop/hbase/mapreduce/ImportTsv.html
index f9f6e8a..2420caf 100644
--- a/xref/org/apache/hadoop/hbase/mapreduce/ImportTsv.html
+++ b/xref/org/apache/hadoop/hbase/mapreduce/ImportTsv.html
@@ -101,704 +101,706 @@
 <a class="jxr_linenumber" name="91" href="#91">91</a>    <em class="jxr_comment">// If true, bad lines are logged to stderr. Default: false.</em>
 <a class="jxr_linenumber" name="92" href="#92">92</a>    <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">static</strong> String LOG_BAD_LINES_CONF_KEY = <span class="jxr_string">"importtsv.log.bad.lines"</span>;
 <a class="jxr_linenumber" name="93" href="#93">93</a>    <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">static</strong> String SKIP_LINES_CONF_KEY = <span class="jxr_string">"importtsv.skip.bad.lines"</span>;
-<a class="jxr_linenumber" name="94" href="#94">94</a>    <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">static</strong> String COLUMNS_CONF_KEY = <span class="jxr_string">"importtsv.columns"</span>;
-<a class="jxr_linenumber" name="95" href="#95">95</a>    <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">static</strong> String SEPARATOR_CONF_KEY = <span class="jxr_string">"importtsv.separator"</span>;
-<a class="jxr_linenumber" name="96" href="#96">96</a>    <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">static</strong> String ATTRIBUTE_SEPERATOR_CONF_KEY = <span class="jxr_string">"attributes.seperator"</span>;
-<a class="jxr_linenumber" name="97" href="#97">97</a>    <em class="jxr_comment">//This config is used to propagate credentials from parent MR jobs which launch</em>
-<a class="jxr_linenumber" name="98" href="#98">98</a>    <em class="jxr_comment">//ImportTSV jobs. SEE IntegrationTestImportTsv.</em>
-<a class="jxr_linenumber" name="99" href="#99">99</a>    <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">static</strong> String CREDENTIALS_LOCATION = <span class="jxr_string">"credentials_location"</span>;
-<a class="jxr_linenumber" name="100" href="#100">100</a>   <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">static</strong> String DEFAULT_SEPARATOR = <span class="jxr_string">"\t"</span>;
-<a class="jxr_linenumber" name="101" href="#101">101</a>   <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">static</strong> String DEFAULT_ATTRIBUTES_SEPERATOR = <span class="jxr_string">"=&gt;"</span>;
-<a class="jxr_linenumber" name="102" href="#102">102</a>   <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">static</strong> String DEFAULT_MULTIPLE_ATTRIBUTES_SEPERATOR = <span class="jxr_string">","</span>;
-<a class="jxr_linenumber" name="103" href="#103">103</a>   <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">static</strong> Class DEFAULT_MAPPER = TsvImporterMapper.<strong class="jxr_keyword">class</strong>;
-<a class="jxr_linenumber" name="104" href="#104">104</a>   <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">static</strong> String CREATE_TABLE_CONF_KEY = <span class="jxr_string">"create.table"</span>;
-<a class="jxr_linenumber" name="105" href="#105">105</a>   <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">static</strong> String NO_STRICT_COL_FAMILY = <span class="jxr_string">"no.strict"</span>;
-<a class="jxr_linenumber" name="106" href="#106">106</a>   <em class="jxr_javadoccomment">/**</em>
-<a class="jxr_linenumber" name="107" href="#107">107</a> <em class="jxr_javadoccomment">   * If table didn't exist and was created in dry-run mode, this flag is</em>
-<a class="jxr_linenumber" name="108" href="#108">108</a> <em class="jxr_javadoccomment">   * flipped to delete it when MR ends.</em>
-<a class="jxr_linenumber" name="109" href="#109">109</a> <em class="jxr_javadoccomment">   */</em>
-<a class="jxr_linenumber" name="110" href="#110">110</a>   <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">boolean</strong> DRY_RUN_TABLE_CREATED;
-<a class="jxr_linenumber" name="111" href="#111">111</a> 
-<a class="jxr_linenumber" name="112" href="#112">112</a>   <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">class</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">TsvParser</a> {
-<a class="jxr_linenumber" name="113" href="#113">113</a>     <em class="jxr_javadoccomment">/**</em>
-<a class="jxr_linenumber" name="114" href="#114">114</a> <em class="jxr_javadoccomment">     * Column families and qualifiers mapped to the TSV columns</em>
-<a class="jxr_linenumber" name="115" href="#115">115</a> <em class="jxr_javadoccomment">     */</em>
-<a class="jxr_linenumber" name="116" href="#116">116</a>     <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">final</strong> byte[][] families;
-<a class="jxr_linenumber" name="117" href="#117">117</a>     <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">final</strong> byte[][] qualifiers;
-<a class="jxr_linenumber" name="118" href="#118">118</a> 
-<a class="jxr_linenumber" name="119" href="#119">119</a>     <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">final</strong> byte separatorByte;
-<a class="jxr_linenumber" name="120" href="#120">120</a> 
-<a class="jxr_linenumber" name="121" href="#121">121</a>     <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">int</strong> rowKeyColumnIndex;
-<a class="jxr_linenumber" name="122" href="#122">122</a> 
-<a class="jxr_linenumber" name="123" href="#123">123</a>     <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">int</strong> maxColumnCount;
-<a class="jxr_linenumber" name="124" href="#124">124</a> 
-<a class="jxr_linenumber" name="125" href="#125">125</a>     <em class="jxr_comment">// Default value must be negative</em>
-<a class="jxr_linenumber" name="126" href="#126">126</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">int</strong> DEFAULT_TIMESTAMP_COLUMN_INDEX = -1;
-<a class="jxr_linenumber" name="127" href="#127">127</a> 
-<a class="jxr_linenumber" name="128" href="#128">128</a>     <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">int</strong> timestampKeyColumnIndex = DEFAULT_TIMESTAMP_COLUMN_INDEX;
-<a class="jxr_linenumber" name="129" href="#129">129</a> 
-<a class="jxr_linenumber" name="130" href="#130">130</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">final</strong> String ROWKEY_COLUMN_SPEC = <span class="jxr_string">"HBASE_ROW_KEY"</span>;
-<a class="jxr_linenumber" name="131" href="#131">131</a> 
-<a class="jxr_linenumber" name="132" href="#132">132</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">final</strong> String TIMESTAMPKEY_COLUMN_SPEC = <span class="jxr_string">"HBASE_TS_KEY"</span>;
-<a class="jxr_linenumber" name="133" href="#133">133</a> 
-<a class="jxr_linenumber" name="134" href="#134">134</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">final</strong> String ATTRIBUTES_COLUMN_SPEC = <span class="jxr_string">"HBASE_ATTRIBUTES_KEY"</span>;
-<a class="jxr_linenumber" name="135" href="#135">135</a> 
-<a class="jxr_linenumber" name="136" href="#136">136</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">final</strong> String CELL_VISIBILITY_COLUMN_SPEC = <span class="jxr_string">"HBASE_CELL_VISIBILITY"</span>;
-<a class="jxr_linenumber" name="137" href="#137">137</a> 
-<a class="jxr_linenumber" name="138" href="#138">138</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">final</strong> String CELL_TTL_COLUMN_SPEC = <span class="jxr_string">"HBASE_CELL_TTL"</span>;
-<a class="jxr_linenumber" name="139" href="#139">139</a> 
-<a class="jxr_linenumber" name="140" href="#140">140</a>     <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">int</strong> attrKeyColumnIndex = DEFAULT_ATTRIBUTES_COLUMN_INDEX;
-<a class="jxr_linenumber" name="141" href="#141">141</a> 
-<a class="jxr_linenumber" name="142" href="#142">142</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">int</strong> DEFAULT_ATTRIBUTES_COLUMN_INDEX = -1;
-<a class="jxr_linenumber" name="143" href="#143">143</a> 
-<a class="jxr_linenumber" name="144" href="#144">144</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">int</strong> DEFAULT_CELL_VISIBILITY_COLUMN_INDEX = -1;
-<a class="jxr_linenumber" name="145" href="#145">145</a> 
-<a class="jxr_linenumber" name="146" href="#146">146</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">int</strong> DEFAULT_CELL_TTL_COLUMN_INDEX = -1;
-<a class="jxr_linenumber" name="147" href="#147">147</a> 
-<a class="jxr_linenumber" name="148" href="#148">148</a>     <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">int</strong> cellVisibilityColumnIndex = DEFAULT_CELL_VISIBILITY_COLUMN_INDEX;
-<a class="jxr_linenumber" name="149" href="#149">149</a> 
-<a class="jxr_linenumber" name="150" href="#150">150</a>     <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">int</strong> cellTTLColumnIndex = DEFAULT_CELL_TTL_COLUMN_INDEX;
-<a class="jxr_linenumber" name="151" href="#151">151</a> 
-<a class="jxr_linenumber" name="152" href="#152">152</a>     <em class="jxr_javadoccomment">/**</em>
-<a class="jxr_linenumber" name="153" href="#153">153</a> <em class="jxr_javadoccomment">     * @param columnsSpecification the list of columns to parser out, comma separated.</em>
-<a class="jxr_linenumber" name="154" href="#154">154</a> <em class="jxr_javadoccomment">     * The row key should be the special token TsvParser.ROWKEY_COLUMN_SPEC</em>
-<a class="jxr_linenumber" name="155" href="#155">155</a> <em class="jxr_javadoccomment">     * @param separatorStr</em>
-<a class="jxr_linenumber" name="156" href="#156">156</a> <em class="jxr_javadoccomment">     */</em>
-<a class="jxr_linenumber" name="157" href="#157">157</a>     <strong class="jxr_keyword">public</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">TsvParser</a>(String columnsSpecification, String separatorStr) {
-<a class="jxr_linenumber" name="158" href="#158">158</a>       <em class="jxr_comment">// Configure separator</em>
-<a class="jxr_linenumber" name="159" href="#159">159</a>       byte[] separator = Bytes.toBytes(separatorStr);
-<a class="jxr_linenumber" name="160" href="#160">160</a>       Preconditions.checkArgument(separator.length == 1,
-<a class="jxr_linenumber" name="161" href="#161">161</a>         <span class="jxr_string">"TsvParser only supports single-byte separators"</span>);
-<a class="jxr_linenumber" name="162" href="#162">162</a>       separatorByte = separator[0];
-<a class="jxr_linenumber" name="163" href="#163">163</a> 
-<a class="jxr_linenumber" name="164" href="#164">164</a>       <em class="jxr_comment">// Configure columns</em>
-<a class="jxr_linenumber" name="165" href="#165">165</a>       ArrayList&lt;String&gt; columnStrings = Lists.newArrayList(
-<a class="jxr_linenumber" name="166" href="#166">166</a>         Splitter.on(',').trimResults().split(columnsSpecification));
-<a class="jxr_linenumber" name="167" href="#167">167</a> 
-<a class="jxr_linenumber" name="168" href="#168">168</a>       maxColumnCount = columnStrings.size();
-<a class="jxr_linenumber" name="169" href="#169">169</a>       families = <strong class="jxr_keyword">new</strong> byte[maxColumnCount][];
-<a class="jxr_linenumber" name="170" href="#170">170</a>       qualifiers = <strong class="jxr_keyword">new</strong> byte[maxColumnCount][];
-<a class="jxr_linenumber" name="171" href="#171">171</a> 
-<a class="jxr_linenumber" name="172" href="#172">172</a>       <strong class="jxr_keyword">for</strong> (<strong class="jxr_keyword">int</strong> i = 0; i &lt; columnStrings.size(); i++) {
-<a class="jxr_linenumber" name="173" href="#173">173</a>         String str = columnStrings.get(i);
-<a class="jxr_linenumber" name="174" href="#174">174</a>         <strong class="jxr_keyword">if</strong> (ROWKEY_COLUMN_SPEC.equals(str)) {
-<a class="jxr_linenumber" name="175" href="#175">175</a>           rowKeyColumnIndex = i;
-<a class="jxr_linenumber" name="176" href="#176">176</a>           <strong class="jxr_keyword">continue</strong>;
-<a class="jxr_linenumber" name="177" href="#177">177</a>         }
-<a class="jxr_linenumber" name="178" href="#178">178</a>         <strong class="jxr_keyword">if</strong> (TIMESTAMPKEY_COLUMN_SPEC.equals(str)) {
-<a class="jxr_linenumber" name="179" href="#179">179</a>           timestampKeyColumnIndex = i;
-<a class="jxr_linenumber" name="180" href="#180">180</a>           <strong class="jxr_keyword">continue</strong>;
-<a class="jxr_linenumber" name="181" href="#181">181</a>         }
-<a class="jxr_linenumber" name="182" href="#182">182</a>         <strong class="jxr_keyword">if</strong> (ATTRIBUTES_COLUMN_SPEC.equals(str)) {
-<a class="jxr_linenumber" name="183" href="#183">183</a>           attrKeyColumnIndex = i;
-<a class="jxr_linenumber" name="184" href="#184">184</a>           <strong class="jxr_keyword">continue</strong>;
-<a class="jxr_linenumber" name="185" href="#185">185</a>         }
-<a class="jxr_linenumber" name="186" href="#186">186</a>         <strong class="jxr_keyword">if</strong> (CELL_VISIBILITY_COLUMN_SPEC.equals(str)) {
-<a class="jxr_linenumber" name="187" href="#187">187</a>           cellVisibilityColumnIndex = i;
-<a class="jxr_linenumber" name="188" href="#188">188</a>           <strong class="jxr_keyword">continue</strong>;
-<a class="jxr_linenumber" name="189" href="#189">189</a>         }
-<a class="jxr_linenumber" name="190" href="#190">190</a>         <strong class="jxr_keyword">if</strong> (CELL_TTL_COLUMN_SPEC.equals(str)) {
-<a class="jxr_linenumber" name="191" href="#191">191</a>           cellTTLColumnIndex = i;
-<a class="jxr_linenumber" name="192" href="#192">192</a>           <strong class="jxr_keyword">continue</strong>;
-<a class="jxr_linenumber" name="193" href="#193">193</a>         }
-<a class="jxr_linenumber" name="194" href="#194">194</a>         String[] parts = str.split(<span class="jxr_string">":"</span>, 2);
-<a class="jxr_linenumber" name="195" href="#195">195</a>         <strong class="jxr_keyword">if</strong> (parts.length == 1) {
-<a class="jxr_linenumber" name="196" href="#196">196</a>           families[i] = str.getBytes();
-<a class="jxr_linenumber" name="197" href="#197">197</a>           qualifiers[i] = HConstants.EMPTY_BYTE_ARRAY;
-<a class="jxr_linenumber" name="198" href="#198">198</a>         } <strong class="jxr_keyword">else</strong> {
-<a class="jxr_linenumber" name="199" href="#199">199</a>           families[i] = parts[0].getBytes();
-<a class="jxr_linenumber" name="200" href="#200">200</a>           qualifiers[i] = parts[1].getBytes();
-<a class="jxr_linenumber" name="201" href="#201">201</a>         }
-<a class="jxr_linenumber" name="202" href="#202">202</a>       }
-<a class="jxr_linenumber" name="203" href="#203">203</a>     }
-<a class="jxr_linenumber" name="204" href="#204">204</a> 
-<a class="jxr_linenumber" name="205" href="#205">205</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">boolean</strong> hasTimestamp() {
-<a class="jxr_linenumber" name="206" href="#206">206</a>       <strong class="jxr_keyword">return</strong> timestampKeyColumnIndex != DEFAULT_TIMESTAMP_COLUMN_INDEX;
-<a class="jxr_linenumber" name="207" href="#207">207</a>     }
-<a class="jxr_linenumber" name="208" href="#208">208</a> 
-<a class="jxr_linenumber" name="209" href="#209">209</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getTimestampKeyColumnIndex() {
-<a class="jxr_linenumber" name="210" href="#210">210</a>       <strong class="jxr_keyword">return</strong> timestampKeyColumnIndex;
-<a class="jxr_linenumber" name="211" href="#211">211</a>     }
-<a class="jxr_linenumber" name="212" href="#212">212</a> 
-<a class="jxr_linenumber" name="213" href="#213">213</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">boolean</strong> hasAttributes() {
-<a class="jxr_linenumber" name="214" href="#214">214</a>       <strong class="jxr_keyword">return</strong> attrKeyColumnIndex != DEFAULT_ATTRIBUTES_COLUMN_INDEX;
-<a class="jxr_linenumber" name="215" href="#215">215</a>     }
-<a class="jxr_linenumber" name="216" href="#216">216</a> 
-<a class="jxr_linenumber" name="217" href="#217">217</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">boolean</strong> hasCellVisibility() {
-<a class="jxr_linenumber" name="218" href="#218">218</a>       <strong class="jxr_keyword">return</strong> cellVisibilityColumnIndex != DEFAULT_CELL_VISIBILITY_COLUMN_INDEX;
-<a class="jxr_linenumber" name="219" href="#219">219</a>     }
-<a class="jxr_linenumber" name="220" href="#220">220</a> 
-<a class="jxr_linenumber" name="221" href="#221">221</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">boolean</strong> hasCellTTL() {
-<a class="jxr_linenumber" name="222" href="#222">222</a>       <strong class="jxr_keyword">return</strong> cellTTLColumnIndex != DEFAULT_CELL_VISIBILITY_COLUMN_INDEX;
-<a class="jxr_linenumber" name="223" href="#223">223</a>     }
-<a class="jxr_linenumber" name="224" href="#224">224</a> 
-<a class="jxr_linenumber" name="225" href="#225">225</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getAttributesKeyColumnIndex() {
-<a class="jxr_linenumber" name="226" href="#226">226</a>       <strong class="jxr_keyword">return</strong> attrKeyColumnIndex;
-<a class="jxr_linenumber" name="227" href="#227">227</a>     }
-<a class="jxr_linenumber" name="228" href="#228">228</a> 
-<a class="jxr_linenumber" name="229" href="#229">229</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getCellVisibilityColumnIndex() {
-<a class="jxr_linenumber" name="230" href="#230">230</a>       <strong class="jxr_keyword">return</strong> cellVisibilityColumnIndex;
-<a class="jxr_linenumber" name="231" href="#231">231</a>     }
-<a class="jxr_linenumber" name="232" href="#232">232</a> 
-<a class="jxr_linenumber" name="233" href="#233">233</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getCellTTLColumnIndex() {
-<a class="jxr_linenumber" name="234" href="#234">234</a>       <strong class="jxr_keyword">return</strong> cellTTLColumnIndex;
-<a class="jxr_linenumber" name="235" href="#235">235</a>     }
-<a class="jxr_linenumber" name="236" href="#236">236</a> 
-<a class="jxr_linenumber" name="237" href="#237">237</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getRowKeyColumnIndex() {
-<a class="jxr_linenumber" name="238" href="#238">238</a>       <strong class="jxr_keyword">return</strong> rowKeyColumnIndex;
-<a class="jxr_linenumber" name="239" href="#239">239</a>     }
-<a class="jxr_linenumber" name="240" href="#240">240</a> 
-<a class="jxr_linenumber" name="241" href="#241">241</a>     <strong class="jxr_keyword">public</strong> byte[] getFamily(<strong class="jxr_keyword">int</strong> idx) {
-<a class="jxr_linenumber" name="242" href="#242">242</a>       <strong class="jxr_keyword">return</strong> families[idx];
-<a class="jxr_linenumber" name="243" href="#243">243</a>     }
-<a class="jxr_linenumber" name="244" href="#244">244</a>     <strong class="jxr_keyword">public</strong> byte[] getQualifier(<strong class="jxr_keyword">int</strong> idx) {
-<a class="jxr_linenumber" name="245" href="#245">245</a>       <strong class="jxr_keyword">return</strong> qualifiers[idx];
-<a class="jxr_linenumber" name="246" href="#246">246</a>     }
-<a class="jxr_linenumber" name="247" href="#247">247</a> 
-<a class="jxr_linenumber" name="248" href="#248">248</a>     <strong class="jxr_keyword">public</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">ParsedLine</a> parse(byte[] lineBytes, <strong class="jxr_keyword">int</strong> length)
-<a class="jxr_linenumber" name="249" href="#249">249</a>     <strong class="jxr_keyword">throws</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">BadTsvLineException</a> {
-<a class="jxr_linenumber" name="250" href="#250">250</a>       <em class="jxr_comment">// Enumerate separator offsets</em>
-<a class="jxr_linenumber" name="251" href="#251">251</a>       ArrayList&lt;Integer&gt; tabOffsets = <strong class="jxr_keyword">new</strong> ArrayList&lt;Integer&gt;(maxColumnCount);
-<a class="jxr_linenumber" name="252" href="#252">252</a>       <strong class="jxr_keyword">for</strong> (<strong class="jxr_keyword">int</strong> i = 0; i &lt; length; i++) {
-<a class="jxr_linenumber" name="253" href="#253">253</a>         <strong class="jxr_keyword">if</strong> (lineBytes[i] == separatorByte) {
-<a class="jxr_linenumber" name="254" href="#254">254</a>           tabOffsets.add(i);
-<a class="jxr_linenumber" name="255" href="#255">255</a>         }
-<a class="jxr_linenumber" name="256" href="#256">256</a>       }
-<a class="jxr_linenumber" name="257" href="#257">257</a>       <strong class="jxr_keyword">if</strong> (tabOffsets.isEmpty()) {
-<a class="jxr_linenumber" name="258" href="#258">258</a>         <strong class="jxr_keyword">throw</strong> <strong class="jxr_keyword">new</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">BadTsvLineException</a>(<span class="jxr_string">"No delimiter"</span>);
-<a class="jxr_linenumber" name="259" href="#259">259</a>       }
-<a class="jxr_linenumber" name="260" href="#260">260</a> 
-<a class="jxr_linenumber" name="261" href="#261">261</a>       tabOffsets.add(length);
-<a class="jxr_linenumber" name="262" href="#262">262</a> 
-<a class="jxr_linenumber" name="263" href="#263">263</a>       <strong class="jxr_keyword">if</strong> (tabOffsets.size() &gt; maxColumnCount) {
-<a class="jxr_linenumber" name="264" href="#264">264</a>         <strong class="jxr_keyword">throw</strong> <strong class="jxr_keyword">new</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">BadTsvLineException</a>(<span class="jxr_string">"Excessive columns"</span>);
-<a class="jxr_linenumber" name="265" href="#265">265</a>       } <strong class="jxr_keyword">else</strong> <strong class="jxr_keyword">if</strong> (tabOffsets.size() &lt;= getRowKeyColumnIndex()) {
-<a class="jxr_linenumber" name="266" href="#266">266</a>         <strong class="jxr_keyword">throw</strong> <strong class="jxr_keyword">new</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">BadTsvLineException</a>(<span class="jxr_string">"No row key"</span>);
-<a class="jxr_linenumber" name="267" href="#267">267</a>       } <strong class="jxr_keyword">else</strong> <strong class="jxr_keyword">if</strong> (hasTimestamp()
-<a class="jxr_linenumber" name="268" href="#268">268</a>           &amp;&amp; tabOffsets.size() &lt;= getTimestampKeyColumnIndex()) {
-<a class="jxr_linenumber" name="269" href="#269">269</a>         <strong class="jxr_keyword">throw</strong> <strong class="jxr_keyword">new</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">BadTsvLineException</a>(<span class="jxr_string">"No timestamp"</span>);
-<a class="jxr_linenumber" name="270" href="#270">270</a>       } <strong class="jxr_keyword">else</strong> <strong class="jxr_keyword">if</strong> (hasAttributes() &amp;&amp; tabOffsets.size() &lt;= getAttributesKeyColumnIndex()) {
-<a class="jxr_linenumber" name="271" href="#271">271</a>         <strong class="jxr_keyword">throw</strong> <strong class="jxr_keyword">new</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">BadTsvLineException</a>(<span class="jxr_string">"No attributes specified"</span>);
-<a class="jxr_linenumber" name="272" href="#272">272</a>       } <strong class="jxr_keyword">else</strong> <strong class="jxr_keyword">if</strong> (hasCellVisibility() &amp;&amp; tabOffsets.size() &lt;= getCellVisibilityColumnIndex()) {
-<a class="jxr_linenumber" name="273" href="#273">273</a>         <strong class="jxr_keyword">throw</strong> <strong class="jxr_keyword">new</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">BadTsvLineException</a>(<span class="jxr_string">"No cell visibility specified"</span>);
-<a class="jxr_linenumber" name="274" href="#274">274</a>       } <strong class="jxr_keyword">else</strong> <strong class="jxr_keyword">if</strong> (hasCellTTL() &amp;&amp; tabOffsets.size() &lt;= getCellTTLColumnIndex()) {
-<a class="jxr_linenumber" name="275" href="#275">275</a>         <strong class="jxr_keyword">throw</strong> <strong class="jxr_keyword">new</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">BadTsvLineException</a>(<span class="jxr_string">"No cell TTL specified"</span>);
-<a class="jxr_linenumber" name="276" href="#276">276</a>       }
-<a class="jxr_linenumber" name="277" href="#277">277</a>       <strong class="jxr_keyword">return</strong> <strong class="jxr_keyword">new</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">ParsedLine</a>(tabOffsets, lineBytes);
-<a class="jxr_linenumber" name="278" href="#278">278</a>     }
-<a class="jxr_linenumber" name="279" href="#279">279</a> 
-<a class="jxr_linenumber" name="280" href="#280">280</a>     <strong class="jxr_keyword">class</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">ParsedLine</a> {
-<a class="jxr_linenumber" name="281" href="#281">281</a>       <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">final</strong> ArrayList&lt;Integer&gt; tabOffsets;
-<a class="jxr_linenumber" name="282" href="#282">282</a>       <strong class="jxr_keyword">private</strong> byte[] lineBytes;
-<a class="jxr_linenumber" name="283" href="#283">283</a> 
-<a class="jxr_linenumber" name="284" href="#284">284</a>       <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">ParsedLine</a>(ArrayList&lt;Integer&gt; tabOffsets, byte[] lineBytes) {
-<a class="jxr_linenumber" name="285" href="#285">285</a>         <strong class="jxr_keyword">this</strong>.tabOffsets = tabOffsets;
-<a class="jxr_linenumber" name="286" href="#286">286</a>         <strong class="jxr_keyword">this</strong>.lineBytes = lineBytes;
-<a class="jxr_linenumber" name="287" href="#287">287</a>       }
-<a class="jxr_linenumber" name="288" href="#288">288</a> 
-<a class="jxr_linenumber" name="289" href="#289">289</a>       <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getRowKeyOffset() {
-<a class="jxr_linenumber" name="290" href="#290">290</a>         <strong class="jxr_keyword">return</strong> getColumnOffset(rowKeyColumnIndex);
-<a class="jxr_linenumber" name="291" href="#291">291</a>       }
-<a class="jxr_linenumber" name="292" href="#292">292</a>       <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getRowKeyLength() {
-<a class="jxr_linenumber" name="293" href="#293">293</a>         <strong class="jxr_keyword">return</strong> getColumnLength(rowKeyColumnIndex);
-<a class="jxr_linenumber" name="294" href="#294">294</a>       }
-<a class="jxr_linenumber" name="295" href="#295">295</a> 
-<a class="jxr_linenumber" name="296" href="#296">296</a>       <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">long</strong> getTimestamp(<strong class="jxr_keyword">long</strong> ts) <strong class="jxr_keyword">throws</strong> BadTsvLineException {
-<a class="jxr_linenumber" name="297" href="#297">297</a>         <em class="jxr_comment">// Return ts if HBASE_TS_KEY is not configured in column spec</em>
-<a class="jxr_linenumber" name="298" href="#298">298</a>         <strong class="jxr_keyword">if</strong> (!hasTimestamp()) {
-<a class="jxr_linenumber" name="299" href="#299">299</a>           <strong class="jxr_keyword">return</strong> ts;
-<a class="jxr_linenumber" name="300" href="#300">300</a>         }
-<a class="jxr_linenumber" name="301" href="#301">301</a> 
-<a class="jxr_linenumber" name="302" href="#302">302</a>         String timeStampStr = Bytes.toString(lineBytes,
-<a class="jxr_linenumber" name="303" href="#303">303</a>             getColumnOffset(timestampKeyColumnIndex),
-<a class="jxr_linenumber" name="304" href="#304">304</a>             getColumnLength(timestampKeyColumnIndex));
-<a class="jxr_linenumber" name="305" href="#305">305</a>         <strong class="jxr_keyword">try</strong> {
-<a class="jxr_linenumber" name="306" href="#306">306</a>           <strong class="jxr_keyword">return</strong> Long.parseLong(timeStampStr);
-<a class="jxr_linenumber" name="307" href="#307">307</a>         } <strong class="jxr_keyword">catch</strong> (NumberFormatException nfe) {
-<a class="jxr_linenumber" name="308" href="#308">308</a>           <em class="jxr_comment">// treat this record as bad record</em>
-<a class="jxr_linenumber" name="309" href="#309">309</a>           <strong class="jxr_keyword">throw</strong> <strong class="jxr_keyword">new</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">BadTsvLineException</a>(<span class="jxr_string">"Invalid timestamp "</span> + timeStampStr);
-<a class="jxr_linenumber" name="310" href="#310">310</a>         }
-<a class="jxr_linenumber" name="311" href="#311">311</a>       }
-<a class="jxr_linenumber" name="312" href="#312">312</a> 
-<a class="jxr_linenumber" name="313" href="#313">313</a>       <strong class="jxr_keyword">private</strong> String getAttributes() {
-<a class="jxr_linenumber" name="314" href="#314">314</a>         <strong class="jxr_keyword">if</strong> (!hasAttributes()) {
-<a class="jxr_linenumber" name="315" href="#315">315</a>           <strong class="jxr_keyword">return</strong> <strong class="jxr_keyword">null</strong>;
-<a class="jxr_linenumber" name="316" href="#316">316</a>         } <strong class="jxr_keyword">else</strong> {
-<a class="jxr_linenumber" name="317" href="#317">317</a>           <strong class="jxr_keyword">return</strong> Bytes.toString(lineBytes, getColumnOffset(attrKeyColumnIndex),
-<a class="jxr_linenumber" name="318" href="#318">318</a>               getColumnLength(attrKeyColumnIndex));
-<a class="jxr_linenumber" name="319" href="#319">319</a>         }
-<a class="jxr_linenumber" name="320" href="#320">320</a>       }
-<a class="jxr_linenumber" name="321" href="#321">321</a> 
-<a class="jxr_linenumber" name="322" href="#322">322</a>       <strong class="jxr_keyword">public</strong> String[] getIndividualAttributes() {
-<a class="jxr_linenumber" name="323" href="#323">323</a>         String attributes = getAttributes();
-<a class="jxr_linenumber" name="324" href="#324">324</a>         <strong class="jxr_keyword">if</strong> (attributes != <strong class="jxr_keyword">null</strong>) {
-<a class="jxr_linenumber" name="325" href="#325">325</a>           <strong class="jxr_keyword">return</strong> attributes.split(DEFAULT_MULTIPLE_ATTRIBUTES_SEPERATOR);
-<a class="jxr_linenumber" name="326" href="#326">326</a>         } <strong class="jxr_keyword">else</strong> {
-<a class="jxr_linenumber" name="327" href="#327">327</a>           <strong class="jxr_keyword">return</strong> <strong class="jxr_keyword">null</strong>;
-<a class="jxr_linenumber" name="328" href="#328">328</a>         }
-<a class="jxr_linenumber" name="329" href="#329">329</a>       }
-<a class="jxr_linenumber" name="330" href="#330">330</a> 
-<a class="jxr_linenumber" name="331" href="#331">331</a>       <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getAttributeKeyOffset() {
-<a class="jxr_linenumber" name="332" href="#332">332</a>         <strong class="jxr_keyword">if</strong> (hasAttributes()) {
-<a class="jxr_linenumber" name="333" href="#333">333</a>           <strong class="jxr_keyword">return</strong> getColumnOffset(attrKeyColumnIndex);
-<a class="jxr_linenumber" name="334" href="#334">334</a>         } <strong class="jxr_keyword">else</strong> {
-<a class="jxr_linenumber" name="335" href="#335">335</a>           <strong class="jxr_keyword">return</strong> DEFAULT_ATTRIBUTES_COLUMN_INDEX;
-<a class="jxr_linenumber" name="336" href="#336">336</a>         }
-<a class="jxr_linenumber" name="337" href="#337">337</a>       }
-<a class="jxr_linenumber" name="338" href="#338">338</a> 
-<a class="jxr_linenumber" name="339" href="#339">339</a>       <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getAttributeKeyLength() {
-<a class="jxr_linenumber" name="340" href="#340">340</a>         <strong class="jxr_keyword">if</strong> (hasAttributes()) {
-<a class="jxr_linenumber" name="341" href="#341">341</a>           <strong class="jxr_keyword">return</strong> getColumnLength(attrKeyColumnIndex);
-<a class="jxr_linenumber" name="342" href="#342">342</a>         } <strong class="jxr_keyword">else</strong> {
-<a class="jxr_linenumber" name="343" href="#343">343</a>           <strong class="jxr_keyword">return</strong> DEFAULT_ATTRIBUTES_COLUMN_INDEX;
-<a class="jxr_linenumber" name="344" href="#344">344</a>         }
-<a class="jxr_linenumber" name="345" href="#345">345</a>       }
-<a class="jxr_linenumber" name="346" href="#346">346</a> 
-<a class="jxr_linenumber" name="347" href="#347">347</a>       <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getCellVisibilityColumnOffset() {
-<a class="jxr_linenumber" name="348" href="#348">348</a>         <strong class="jxr_keyword">if</strong> (hasCellVisibility()) {
-<a class="jxr_linenumber" name="349" href="#349">349</a>           <strong class="jxr_keyword">return</strong> getColumnOffset(cellVisibilityColumnIndex);
-<a class="jxr_linenumber" name="350" href="#350">350</a>         } <strong class="jxr_keyword">else</strong> {
-<a class="jxr_linenumber" name="351" href="#351">351</a>           <strong class="jxr_keyword">return</strong> DEFAULT_CELL_VISIBILITY_COLUMN_INDEX;
-<a class="jxr_linenumber" name="352" href="#352">352</a>         }
-<a class="jxr_linenumber" name="353" href="#353">353</a>       }
-<a class="jxr_linenumber" name="354" href="#354">354</a> 
-<a class="jxr_linenumber" name="355" href="#355">355</a>       <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getCellVisibilityColumnLength() {
-<a class="jxr_linenumber" name="356" href="#356">356</a>         <strong class="jxr_keyword">if</strong> (hasCellVisibility()) {
-<a class="jxr_linenumber" name="357" href="#357">357</a>           <strong class="jxr_keyword">return</strong> getColumnLength(cellVisibilityColumnIndex);
-<a class="jxr_linenumber" name="358" href="#358">358</a>         } <strong class="jxr_keyword">else</strong> {
-<a class="jxr_linenumber" name="359" href="#359">359</a>           <strong class="jxr_keyword">return</strong> DEFAULT_CELL_VISIBILITY_COLUMN_INDEX;
-<a class="jxr_linenumber" name="360" href="#360">360</a>         }
-<a class="jxr_linenumber" name="361" href="#361">361</a>       }
-<a class="jxr_linenumber" name="362" href="#362">362</a> 
-<a class="jxr_linenumber" name="363" href="#363">363</a>       <strong class="jxr_keyword">public</strong> String getCellVisibility() {
-<a class="jxr_linenumber" name="364" href="#364">364</a>         <strong class="jxr_keyword">if</strong> (!hasCellVisibility()) {
-<a class="jxr_linenumber" name="365" href="#365">365</a>           <strong class="jxr_keyword">return</strong> <strong class="jxr_keyword">null</strong>;
-<a class="jxr_linenumber" name="366" href="#366">366</a>         } <strong class="jxr_keyword">else</strong> {
-<a class="jxr_linenumber" name="367" href="#367">367</a>           <strong class="jxr_keyword">return</strong> Bytes.toString(lineBytes, getColumnOffset(cellVisibilityColumnIndex),
-<a class="jxr_linenumber" name="368" href="#368">368</a>               getColumnLength(cellVisibilityColumnIndex));
-<a class="jxr_linenumber" name="369" href="#369">369</a>         }
-<a class="jxr_linenumber" name="370" href="#370">370</a>       }
-<a class="jxr_linenumber" name="371" href="#371">371</a> 
-<a class="jxr_linenumber" name="372" href="#372">372</a>       <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getCellTTLColumnOffset() {
-<a class="jxr_linenumber" name="373" href="#373">373</a>         <strong class="jxr_keyword">if</strong> (hasCellTTL()) {
-<a class="jxr_linenumber" name="374" href="#374">374</a>           <strong class="jxr_keyword">return</strong> getColumnOffset(cellTTLColumnIndex);
-<a class="jxr_linenumber" name="375" href="#375">375</a>         } <strong class="jxr_keyword">else</strong> {
-<a class="jxr_linenumber" name="376" href="#376">376</a>           <strong class="jxr_keyword">return</strong> DEFAULT_CELL_TTL_COLUMN_INDEX;
-<a class="jxr_linenumber" name="377" href="#377">377</a>         }
-<a class="jxr_linenumber" name="378" href="#378">378</a>       }
-<a class="jxr_linenumber" name="379" href="#379">379</a> 
-<a class="jxr_linenumber" name="380" href="#380">380</a>       <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getCellTTLColumnLength() {
-<a class="jxr_linenumber" name="381" href="#381">381</a>         <strong class="jxr_keyword">if</strong> (hasCellTTL()) {
-<a class="jxr_linenumber" name="382" href="#382">382</a>           <strong class="jxr_keyword">return</strong> getColumnLength(cellTTLColumnIndex);
-<a class="jxr_linenumber" name="383" href="#383">383</a>         } <strong class="jxr_keyword">else</strong> {
-<a class="jxr_linenumber" name="384" href="#384">384</a>           <strong class="jxr_keyword">return</strong> DEFAULT_CELL_TTL_COLUMN_INDEX;
-<a class="jxr_linenumber" name="385" href="#385">385</a>         }
-<a class="jxr_linenumber" name="386" href="#386">386</a>       }
-<a class="jxr_linenumber" name="387" href="#387">387</a> 
-<a class="jxr_linenumber" name="388" href="#388">388</a>       <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">long</strong> getCellTTL() {
-<a class="jxr_linenumber" name="389" href="#389">389</a>         <strong class="jxr_keyword">if</strong> (!hasCellTTL()) {
-<a class="jxr_linenumber" name="390" href="#390">390</a>           <strong class="jxr_keyword">return</strong> 0;
-<a class="jxr_linenumber" name="391" href="#391">391</a>         } <strong class="jxr_keyword">else</strong> {
-<a class="jxr_linenumber" name="392" href="#392">392</a>           <strong class="jxr_keyword">return</strong> Bytes.toLong(lineBytes, getColumnOffset(cellTTLColumnIndex),
-<a class="jxr_linenumber" name="393" href="#393">393</a>               getColumnLength(cellTTLColumnIndex));
-<a class="jxr_linenumber" name="394" href="#394">394</a>         }
-<a class="jxr_linenumber" name="395" href="#395">395</a>       }
-<a class="jxr_linenumber" name="396" href="#396">396</a> 
-<a class="jxr_linenumber" name="397" href="#397">397</a>       <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getColumnOffset(<strong class="jxr_keyword">int</strong> idx) {
-<a class="jxr_linenumber" name="398" href="#398">398</a>         <strong class="jxr_keyword">if</strong> (idx &gt; 0)
-<a class="jxr_linenumber" name="399" href="#399">399</a>           <strong class="jxr_keyword">return</strong> tabOffsets.get(idx - 1) + 1;
-<a class="jxr_linenumber" name="400" href="#400">400</a>         <strong class="jxr_keyword">else</strong>
-<a class="jxr_linenumber" name="401" href="#401">401</a>           <strong class="jxr_keyword">return</strong> 0;
-<a class="jxr_linenumber" name="402" href="#402">402</a>       }
-<a class="jxr_linenumber" name="403" href="#403">403</a>       <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getColumnLength(<strong class="jxr_keyword">int</strong> idx) {
-<a class="jxr_linenumber" name="404" href="#404">404</a>         <strong class="jxr_keyword">return</strong> tabOffsets.get(idx) - getColumnOffset(idx);
-<a class="jxr_linenumber" name="405" href="#405">405</a>       }
-<a class="jxr_linenumber" name="406" href="#406">406</a>       <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> getColumnCount() {
-<a class="jxr_linenumber" name="407" href="#407">407</a>         <strong class="jxr_keyword">return</strong> tabOffsets.size();
-<a class="jxr_linenumber" name="408" href="#408">408</a>       }
-<a class="jxr_linenumber" name="409" href="#409">409</a>       <strong class="jxr_keyword">public</strong> byte[] getLineBytes() {
-<a class="jxr_linenumber" name="410" href="#410">410</a>         <strong class="jxr_keyword">return</strong> lineBytes;
-<a class="jxr_linenumber" name="411" href="#411">411</a>       }
-<a class="jxr_linenumber" name="412" href="#412">412</a>     }
-<a class="jxr_linenumber" name="413" href="#413">413</a> 
-<a class="jxr_linenumber" name="414" href="#414">414</a>     <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">class</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">BadTsvLineException</a> <strong class="jxr_keyword">extends</strong> Exception {
-<a class="jxr_linenumber" name="415" href="#415">415</a>       <strong class="jxr_keyword">public</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">BadTsvLineException</a>(String err) {
-<a class="jxr_linenumber" name="416" href="#416">416</a>         <strong class="jxr_keyword">super</strong>(err);
-<a class="jxr_linenumber" name="417" href="#417">417</a>       }
-<a class="jxr_linenumber" name="418" href="#418">418</a>       <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">final</strong> <strong class="jxr_keyword">long</strong> serialVersionUID = 1L;
-<a class="jxr_linenumber" name="419" href="#419">419</a>     }
-<a class="jxr_linenumber" name="420" href="#420">420</a> 
-<a class="jxr_linenumber" name="421" href="#421">421</a>     <em class="jxr_javadoccomment">/**</em>
-<a class="jxr_linenumber" name="422" href="#422">422</a> <em class="jxr_javadoccomment">     * Return starting position and length of row key from the specified line bytes.</em>
-<a class="jxr_linenumber" name="423" href="#423">423</a> <em class="jxr_javadoccomment">     * @param lineBytes</em>
-<a class="jxr_linenumber" name="424" href="#424">424</a> <em class="jxr_javadoccomment">     * @param length</em>
-<a class="jxr_linenumber" name="425" href="#425">425</a> <em class="jxr_javadoccomment">     * @return Pair of row key offset and length.</em>
-<a class="jxr_linenumber" name="426" href="#426">426</a> <em class="jxr_javadoccomment">     * @throws BadTsvLineException</em>
-<a class="jxr_linenumber" name="427" href="#427">427</a> <em class="jxr_javadoccomment">     */</em>
-<a class="jxr_linenumber" name="428" href="#428">428</a>     <strong class="jxr_keyword">public</strong> Pair&lt;Integer, Integer&gt; parseRowKey(byte[] lineBytes, <strong class="jxr_keyword">int</strong> length)
-<a class="jxr_linenumber" name="429" href="#429">429</a>         <strong class="jxr_keyword">throws</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">BadTsvLineException</a> {
-<a class="jxr_linenumber" name="430" href="#430">430</a>       <strong class="jxr_keyword">int</strong> rkColumnIndex = 0;
-<a class="jxr_linenumber" name="431" href="#431">431</a>       <strong class="jxr_keyword">int</strong> startPos = 0, endPos = 0;
-<a class="jxr_linenumber" name="432" href="#432">432</a>       <strong class="jxr_keyword">for</strong> (<strong class="jxr_keyword">int</strong> i = 0; i &lt;= length; i++) {
-<a class="jxr_linenumber" name="433" href="#433">433</a>         <strong class="jxr_keyword">if</strong> (i == length || lineBytes[i] == separatorByte) {
-<a class="jxr_linenumber" name="434" href="#434">434</a>           endPos = i - 1;
-<a class="jxr_linenumber" name="435" href="#435">435</a>           <strong class="jxr_keyword">if</strong> (rkColumnIndex++ == getRowKeyColumnIndex()) {
-<a class="jxr_linenumber" name="436" href="#436">436</a>             <strong class="jxr_keyword">if</strong> ((endPos + 1) == startPos) {
-<a class="jxr_linenumber" name="437" href="#437">437</a>               <strong class="jxr_keyword">throw</strong> <strong class="jxr_keyword">new</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">BadTsvLineException</a>(<span class="jxr_string">"Empty value for ROW KEY."</span>);
-<a class="jxr_linenumber" name="438" href="#438">438</a>             }
-<a class="jxr_linenumber" name="439" href="#439">439</a>             <strong class="jxr_keyword">break</strong>;
-<a class="jxr_linenumber" name="440" href="#440">440</a>           } <strong class="jxr_keyword">else</strong> {
-<a class="jxr_linenumber" name="441" href="#441">441</a>             startPos = endPos + 2;
-<a class="jxr_linenumber" name="442" href="#442">442</a>           }
-<a class="jxr_linenumber" name="443" href="#443">443</a>         }
-<a class="jxr_linenumber" name="444" href="#444">444</a>         <strong class="jxr_keyword">if</strong> (i == length) {
-<a class="jxr_linenumber" name="445" href="#445">445</a>           <strong class="jxr_keyword">throw</strong> <strong class="jxr_keyword">new</strong> <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">BadTsvLineException</a>(
-<a class="jxr_linenumber" name="446" href="#446">446</a>               <span class="jxr_string">"Row key does not exist as number of columns in the line"</span>
-<a class="jxr_linenumber" name="447" href="#447">447</a>                   + <span class="jxr_string">" are less than row key position."</span>);
-<a class="jxr_linenumber" name="448" href="#448">448</a>         }
-<a class="jxr_linenumber" name="449" href="#449">449</a>       }
-<a class="jxr_linenumber" name="450" href="#450">450</a>       <strong class="jxr_keyword">return</strong> <strong class="jxr_keyword">new</strong> Pair&lt;Integer, Integer&gt;(startPos, endPos - startPos + 1);
-<a class="jxr_linenumber" name="451" href="#451">451</a>     }
-<a class="jxr_linenumber" name="452" href="#452">452</a>   }
-<a class="jxr_linenumber" name="453" href="#453">453</a> 
-<a class="jxr_linenumber" name="454" href="#454">454</a>   <em class="jxr_javadoccomment">/**</em>
-<a class="jxr_linenumber" name="455" href="#455">455</a> <em class="jxr_javadoccomment">   * Sets up the actual job.</em>
-<a class="jxr_linenumber" name="456" href="#456">456</a> <em class="jxr_javadoccomment">   *</em>
-<a class="jxr_linenumber" name="457" href="#457">457</a> <em class="jxr_javadoccomment">   * @param conf  The current configuration.</em>
-<a class="jxr_linenumber" name="458" href="#458">458</a> <em class="jxr_javadoccomment">   * @param args  The command line parameters.</em>
-<a class="jxr_linenumber" name="459" href="#459">459</a> <em class="jxr_javadoccomment">   * @return The newly created job.</em>
-<a class="jxr_linenumber" name="460" href="#460">460</a> <em class="jxr_javadoccomment">   * @throws IOException When setting up the job fails.</em>
-<a class="jxr_linenumber" name="461" href="#461">461</a> <em class="jxr_javadoccomment">   */</em>
-<a class="jxr_linenumber" name="462" href="#462">462</a>   <strong class="jxr_keyword">protected</strong> <strong class="jxr_keyword">static</strong> Job createSubmittableJob(Configuration conf, String[] args)
-<a class="jxr_linenumber" name="463" href="#463">463</a>       <strong class="jxr_keyword">throws</strong> IOException, ClassNotFoundException {
-<a class="jxr_linenumber" name="464" href="#464">464</a>     Job job = <strong class="jxr_keyword">null</strong>;
-<a class="jxr_linenumber" name="465" href="#465">465</a>     <strong class="jxr_keyword">boolean</strong> isDryRun = conf.getBoolean(DRY_RUN_CONF_KEY, false);
-<a class="jxr_linenumber" name="466" href="#466">466</a>     <strong class="jxr_keyword">try</strong> (Connection connection = ConnectionFactory.createConnection(conf)) {
-<a class="jxr_linenumber" name="467" href="#467">467</a>       <strong class="jxr_keyword">try</strong> (Admin admin = connection.getAdmin()) {
-<a class="jxr_linenumber" name="468" href="#468">468</a>         <em class="jxr_comment">// Support non-XML supported characters</em>
-<a class="jxr_linenumber" name="469" href="#469">469</a>         <em class="jxr_comment">// by re-encoding the passed separator as a Base64 string.</em>
-<a class="jxr_linenumber" name="470" href="#470">470</a>         String actualSeparator = conf.get(SEPARATOR_CONF_KEY);
-<a class="jxr_linenumber" name="471" href="#471">471</a>         <strong class="jxr_keyword">if</strong> (actualSeparator != <strong class="jxr_keyword">null</strong>) {
-<a class="jxr_linenumber" name="472" href="#472">472</a>           conf.set(SEPARATOR_CONF_KEY,
-<a class="jxr_linenumber" name="473" href="#473">473</a>               Base64.encodeBytes(actualSeparator.getBytes()));
-<a class="jxr_linenumber" name="474" href="#474">474</a>         }
-<a class="jxr_linenumber" name="475" href="#475">475</a> 
-<a class="jxr_linenumber" name="476" href="#476">476</a>         <em class="jxr_comment">// See if a non-default Mapper was set</em>
-<a class="jxr_linenumber" name="477" href="#477">477</a>         String mapperClassName = conf.get(MAPPER_CONF_KEY);
-<a class="jxr_linenumber" name="478" href="#478">478</a>         Class mapperClass = mapperClassName != <strong class="jxr_keyword">null</strong>? Class.forName(mapperClassName): DEFAULT_MAPPER;
-<a class="jxr_linenumber" name="479" href="#479">479</a> 
-<a class="jxr_linenumber" name="480" href="#480">480</a>         <a href="../../../../../org/apache/hadoop/hbase/TableName.html">TableName</a> tableName = TableName.valueOf(args[0]);
-<a class="jxr_linenumber" name="481" href="#481">481</a>         Path inputDir = <strong class="jxr_keyword">new</strong> Path(args[1]);
-<a class="jxr_linenumber" name="482" href="#482">482</a>         String jobName = conf.get(JOB_NAME_CONF_KEY,NAME + <span class="jxr_string">"_"</span> + tableName.getNameAsString());
-<a class="jxr_linenumber" name="483" href="#483">483</a>         job = Job.getInstance(conf, jobName);
-<a class="jxr_linenumber" name="484" href="#484">484</a>         job.setJarByClass(mapperClass);
-<a class="jxr_linenumber" name="485" href="#485">485</a>         FileInputFormat.setInputPaths(job, inputDir);
-<a class="jxr_linenumber" name="486" href="#486">486</a>         job.setInputFormatClass(TextInputFormat.<strong class="jxr_keyword">class</strong>);
-<a class="jxr_linenumber" name="487" href="#487">487</a>         job.setMapperClass(mapperClass);
-<a class="jxr_linenumber" name="488" href="#488">488</a>         job.setMapOutputKeyClass(ImmutableBytesWritable.<strong class="jxr_keyword">class</strong>);
-<a class="jxr_linenumber" name="489" href="#489">489</a>         String hfileOutPath = conf.get(BULK_OUTPUT_CONF_KEY);
-<a class="jxr_linenumber" name="490" href="#490">490</a>         String[] columns = conf.getStrings(COLUMNS_CONF_KEY);
-<a class="jxr_linenumber" name="491" href="#491">491</a>         <strong class="jxr_keyword">if</strong>(StringUtils.isNotEmpty(conf.get(CREDENTIALS_LOCATION))) {
-<a class="jxr_linenumber" name="492" href="#492">492</a>           String fileLoc = conf.get(CREDENTIALS_LOCATION);
-<a class="jxr_linenumber" name="493" href="#493">493</a>           Credentials cred = Credentials.readTokenStorageFile(<strong class="jxr_keyword">new</strong> File(fileLoc), conf);
-<a class="jxr_linenumber" name="494" href="#494">494</a>           job.getCredentials().addAll(cred);
-<a class="jxr_linenumber" name="495" href="#495">495</a>         }
-<a class="jxr_linenumber" name="496" href="#496">496</a> 
-<a class="jxr_linenumber" name="497" href="#497">497</a>         <strong class="jxr_keyword">if</strong> (hfileOutPath != <strong class="jxr_keyword">null</strong>) {
-<a class="jxr_linenumber" name="498" href="#498">498</a>           <strong class="jxr_keyword">if</strong> (!admin.tableExists(tableName)) {
-<a class="jxr_linenumber" name="499" href="#499">499</a>             LOG.warn(format(<span class="jxr_string">"Table '%s' does not exist."</span>, tableName));
-<a class="jxr_linenumber" name="500" href="#500">500</a>             <strong class="jxr_keyword">if</strong> (<span class="jxr_string">"yes"</span>.equalsIgnoreCase(conf.get(CREATE_TABLE_CONF_KEY, <span class="jxr_string">"yes"</span>))) {
-<a class="jxr_linenumber" name="501" href="#501">501</a>               <em class="jxr_comment">// TODO: this is backwards. Instead of depending on the existence of a table,</em>
-<a class="jxr_linenumber" name="502" href="#502">502</a>               <em class="jxr_comment">// create a sane splits file for HFileOutputFormat based on data sampling.</em>
-<a class="jxr_linenumber" name="503" href="#503">503</a>               createTable(admin, tableName, columns);
-<a class="jxr_linenumber" name="504" href="#504">504</a>               <strong class="jxr_keyword">if</strong> (isDryRun) {
-<a class="jxr_linenumber" name="505" href="#505">505</a>                 LOG.warn(<span class="jxr_string">"Dry run: Table will be deleted at end of dry run."</span>);
-<a class="jxr_linenumber" name="506" href="#506">506</a>                 <strong class="jxr_keyword">synchronized</strong> (ImportTsv.<strong class="jxr_keyword">class</strong>) {
-<a class="jxr_linenumber" name="507" href="#507">507</a>                   DRY_RUN_TABLE_CREATED = <strong class="jxr_keyword">true</strong>;
-<a class="jxr_linenumber" name="508" href="#508">508</a>                 }
-<a class="jxr_linenumber" name="509" href="#509">509</a>               }
-<a class="jxr_linenumber" name="510" href="#510">510</a>             } <strong class="jxr_keyword">else</strong> {
-<a class="jxr_linenumber" name="511" href="#511">511</a>               String errorMsg =
-<a class="jxr_linenumber" name="512" href="#512">512</a>                   format(<span class="jxr_string">"Table '%s' does not exist and '%s' is set to no."</span>, tableName,
-<a class="jxr_linenumber" name="513" href="#513">513</a>                       CREATE_TABLE_CONF_KEY);
-<a class="jxr_linenumber" name="514" href="#514">514</a>               LOG.error(errorMsg);
-<a class="jxr_linenumber" name="515" href="#515">515</a>               <strong class="jxr_keyword">throw</strong> <strong class="jxr_keyword">new</strong> <a href="../../../../../org/apache/hadoop/hbase/TableNotFoundException.html">TableNotFoundException</a>(errorMsg);
-<a class="jxr_linenumber" name="516" href="#516">516</a>             }
-<a class="jxr_linenumber" name="517" href="#517">517</a>           }
-<a class="jxr_linenumber" name="518" href="#518">518</a>           <strong class="jxr_keyword">try</strong> (Table table = connection.getTable(tableName);
-<a class="jxr_linenumber" name="519" href="#519">519</a>               <a href="../../../../../org/apache/hadoop/hbase/client/RegionLocator.html">RegionLocator</a> regionLocator = connection.getRegionLocator(tableName)) {
-<a class="jxr_linenumber" name="520" href="#520">520</a>             <strong class="jxr_keyword">boolean</strong> noStrict = conf.getBoolean(NO_STRICT_COL_FAMILY, false);
-<a class="jxr_linenumber" name="521" href="#521">521</a>             <em class="jxr_comment">// if no.strict is false then check column family</em>
-<a class="jxr_linenumber" name="522" href="#522">522</a>             <strong class="jxr_keyword">if</strong>(!noStrict) {
-<a class="jxr_linenumber" name="523" href="#523">523</a>               ArrayList&lt;String&gt; unmatchedFamilies = <strong class="jxr_keyword">new</strong> ArrayList&lt;String&gt;();
-<a class="jxr_linenumber" name="524" href="#524">524</a>               Set&lt;String&gt; cfSet = getColumnFamilies(columns);
-<a class="jxr_linenumber" name="525" href="#525">525</a>               <a href="../../../../../org/apache/hadoop/hbase/HTableDescriptor.html">HTableDescriptor</a> tDesc = table.getTableDescriptor();
-<a class="jxr_linenumber" name="526" href="#526">526</a>               <strong class="jxr_keyword">for</strong> (String cf : cfSet) {
-<a class="jxr_linenumber" name="527" href="#527">527</a>                 <strong class="jxr_keyword">if</strong>(tDesc.getFamily(Bytes.toBytes(cf)) == <strong class="jxr_keyword">null</strong>) {
-<a class="jxr_linenumber" name="528" href="#528">528</a>                   unmatchedFamilies.add(cf);
-<a class="jxr_linenumber" name="529" href="#529">529</a>                 }
-<a class="jxr_linenumber" name="530" href="#530">530</a>               }
-<a class="jxr_linenumber" name="531" href="#531">531</a>               <strong class="jxr_keyword">if</strong>(unmatchedFamilies.size() &gt; 0) {
-<a class="jxr_linenumber" name="532" href="#532">532</a>                 ArrayList&lt;String&gt; familyNames = <strong class="jxr_keyword">new</strong> ArrayList&lt;String&gt;();
-<a class="jxr_linenumber" name="533" href="#533">533</a>                 <strong class="jxr_keyword">for</strong> (HColumnDescriptor family : table.getTableDescriptor().getFamilies()) {
-<a class="jxr_linenumber" name="534" href="#534">534</a>                   familyNames.add(family.getNameAsString());
-<a class="jxr_linenumber" name="535" href="#535">535</a>                 }
-<a class="jxr_linenumber" name="536" href="#536">536</a>                 String msg =
-<a class="jxr_linenumber" name="537" href="#537">537</a>                     <span class="jxr_string">"Column Families "</span> + unmatchedFamilies + <span class="jxr_string">" specified in "</span> + COLUMNS_CONF_KEY
-<a class="jxr_linenumber" name="538" href="#538">538</a>                     + <span class="jxr_string">" does not match with any of the table "</span> + tableName
-<a class="jxr_linenumber" name="539" href="#539">539</a>                     + <span class="jxr_string">" column families "</span> + familyNames + <span class="jxr_string">".\n"</span>
-<a class="jxr_linenumber" name="540" href="#540">540</a>                     + <span class="jxr_string">"To disable column family check, use -D"</span> + NO_STRICT_COL_FAMILY
-<a class="jxr_linenumber" name="541" href="#541">541</a>                     + <span class="jxr_string">"=true.\n"</span>;
-<a class="jxr_linenumber" name="542" href="#542">542</a>                 usage(msg);
-<a class="jxr_linenumber" name="543" href="#543">543</a>                 System.exit(-1);
-<a class="jxr_linenumber" name="544" href="#544">544</a>               }
-<a class="jxr_linenumber" name="545" href="#545">545</a>             }
-<a class="jxr_linenumber" name="546" href="#546">546</a>             <strong class="jxr_keyword">if</strong> (mapperClass.equals(TsvImporterTextMapper.<strong class="jxr_keyword">class</strong>)) {
-<a class="jxr_linenumber" name="547" href="#547">547</a>               job.setMapOutputValueClass(Text.<strong class="jxr_keyword">class</strong>);
-<a class="jxr_linenumber" name="548" href="#548">548</a>               job.setReducerClass(TextSortReducer.<strong class="jxr_keyword">class</strong>);
-<a class="jxr_linenumber" name="549" href="#549">549</a>             } <strong class="jxr_keyword">else</strong> {
-<a class="jxr_linenumber" name="550" href="#550">550</a>               job.setMapOutputValueClass(Put.<strong class="jxr_keyword">class</strong>);
-<a class="jxr_linenumber" name="551" href="#551">551</a>               job.setCombinerClass(PutCombiner.<strong class="jxr_keyword">class</strong>);
-<a class="jxr_linenumber" name="552" href="#552">552</a>               job.setReducerClass(PutSortReducer.<strong class="jxr_keyword">class</strong>);
-<a class="jxr_linenumber" name="553" href="#553">553</a>             }
-<a class="jxr_linenumber" name="554" href="#554">554</a>             <strong class="jxr_keyword">if</strong> (!isDryRun) {
-<a class="jxr_linenumber" name="555" href="#555">555</a>               Path outputDir = <strong class="jxr_keyword">new</strong> Path(hfileOutPath);
-<a class="jxr_linenumber" name="556" href="#556">556</a>               FileOutputFormat.setOutputPath(job, outputDir);
-<a class="jxr_linenumber" name="557" href="#557">557</a>               HFileOutputFormat2.configureIncrementalLoad(job, table.getTableDescriptor(),
-<a class="jxr_linenumber" name="558" href="#558">558</a>                   regionLocator);
-<a class="jxr_linenumber" name="559" href="#559">559</a>             }
-<a class="jxr_linenumber" name="560" href="#560">560</a>           }
-<a class="jxr_linenumber" name="561" href="#561">561</a>         } <strong class="jxr_keyword">else</strong> {
-<a class="jxr_linenumber" name="562" href="#562">562</a>           <strong class="jxr_keyword">if</strong> (!admin.tableExists(tableName)) {
-<a class="jxr_linenumber" name="563" href="#563">563</a>             String errorMsg = format(<span class="jxr_string">"Table '%s' does not exist."</span>, tableName);
-<a class="jxr_linenumber" name="564" href="#564">564</a>             LOG.error(errorMsg);
-<a class="jxr_linenumber" name="565" href="#565">565</a>             <strong class="jxr_keyword">throw</strong> <strong class="jxr_keyword">new</strong> <a href="../../../../../org/apache/hadoop/hbase/TableNotFoundException.html">TableNotFoundException</a>(errorMsg);
-<a class="jxr_linenumber" name="566" href="#566">566</a>           }
-<a class="jxr_linenumber" name="567" href="#567">567</a>           <strong class="jxr_keyword">if</strong> (mapperClass.equals(TsvImporterTextMapper.<strong class="jxr_keyword">class</strong>)) {
-<a class="jxr_linenumber" name="568" href="#568">568</a>             usage(TsvImporterTextMapper.<strong class="jxr_keyword">class</strong>.toString()
-<a class="jxr_linenumber" name="569" href="#569">569</a>                 + <span class="jxr_string">" should not be used for non bulkloading case. use "</span>
-<a class="jxr_linenumber" name="570" href="#570">570</a>                 + TsvImporterMapper.<strong class="jxr_keyword">class</strong>.toString()
-<a class="jxr_linenumber" name="571" href="#571">571</a>                 + <span class="jxr_string">" or custom mapper whose value type is Put."</span>);
-<a class="jxr_linenumber" name="572" href="#572">572</a>             System.exit(-1);
-<a class="jxr_linenumber" name="573" href="#573">573</a>           }
-<a class="jxr_linenumber" name="574" href="#574">574</a>           <strong class="jxr_keyword">if</strong> (!isDryRun) {
-<a class="jxr_linenumber" name="575" href="#575">575</a>             <em class="jxr_comment">// No reducers. Just write straight to table. Call initTableReducerJob</em>
-<a class="jxr_linenumber" name="576" href="#576">576</a>             <em class="jxr_comment">// to set up the TableOutputFormat.</em>
-<a class="jxr_linenumber" name="577" href="#577">577</a>             TableMapReduceUtil.initTableReducerJob(tableName.getNameAsString(), <strong class="jxr_keyword">null</strong>, job);
-<a class="jxr_linenumber" name="578" href="#578">578</a>           }
-<a class="jxr_linenumber" name="579" href="#579">579</a>           job.setNumReduceTasks(0);
-<a class="jxr_linenumber" name="580" href="#580">580</a>         }
-<a class="jxr_linenumber" name="581" href="#581">581</a>         <strong class="jxr_keyword">if</strong> (isDryRun) {
-<a class="jxr_linenumber" name="582" href="#582">582</a>           job.setOutputFormatClass(NullOutputFormat.<strong class="jxr_keyword">class</strong>);
-<a class="jxr_linenumber" name="583" href="#583">583</a>           job.getConfiguration().setStrings(<span class="jxr_string">"io.serializations"</span>,
-<a class="jxr_linenumber" name="584" href="#584">584</a>               job.getConfiguration().get(<span class="jxr_string">"io.serializations"</span>),
-<a class="jxr_linenumber" name="585" href="#585">585</a>               MutationSerialization.<strong class="jxr_keyword">class</strong>.getName(), ResultSerialization.<strong class="jxr_keyword">class</strong>.getName(),
-<a class="jxr_linenumber" name="586" href="#586">586</a>               KeyValueSerialization.<strong class="jxr_keyword">class</strong>.getName());
-<a class="jxr_linenumber" name="587" href="#587">587</a>         }
-<a class="jxr_linenumber" name="588" href="#588">588</a>         TableMapReduceUtil.addDependencyJars(job);
-<a class="jxr_linenumber" name="589" href="#589">589</a>         TableMapReduceUtil.addDependencyJars(job.getConfiguration(),
-<a class="jxr_linenumber" name="590" href="#590">590</a>             com.google.common.base.Function.<strong class="jxr_keyword">class</strong> <em class="jxr_comment">/*<em class="jxr_comment"> Guava used by <a href="../../../../../org/apache/hadoop/hbase/mapreduce/ImportTsv.html">TsvParser</a> */</em>);</em>
-<a class="jxr_linenumber" name="591" href="#591">591</a>       }
-<a class="jxr_linenumber" name="592" href="#592">592</a>     }
-<a class="jxr_linenumber" name="593" href="#593">593</a>     <strong class="jxr_keyword">return</strong> job;
-<a class="jxr_linenumber" name="594" href="#594">594</a>   }
-<a class="jxr_linenumber" name="595" href="#595">595</a> 
-<a class="jxr_linenumber" name="596" href="#596">596</a>   <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">void</strong> createTable(<a href="../../../../../org/apache/hadoop/hbase/client/Admin.html">Admin</a> admin, <a href="../../../../../org/apache/hadoop/hbase/TableName.html">TableName</a> tableName, String[] columns)
-<a class="jxr_linenumber" name="597" href="#597">597</a>       <strong class="jxr_keyword">throws</strong> IOException {
-<a class="jxr_linenumber" name="598" href="#598">598</a>     <a href="../../../../../org/apache/hadoop/hbase/HTableDescriptor.html">HTableDescriptor</a> htd = <strong class="jxr_keyword">new</strong> <a href="../../../../../org/apache/hadoop/hbase/HTableDescriptor.html">HTableDescriptor</a>(tableName);
-<a class="jxr_linenumber" name="599" href="#599">599</a>     Set&lt;String&gt; cfSet = getColumnFamilies(columns);
-<a class="jxr_linenumber" name="600" href="#600">600</a>     <strong class="jxr_keyword">for</strong> (String cf : cfSet) {
-<a class="jxr_linenumber" name="601" href="#601">601</a>       <a href="../../../../../org/apache/hadoop/hbase/HColumnDescriptor.html">HColumnDescriptor</a> hcd = <strong class="jxr_keyword">new</strong> <a href="../../../../../org/apache/hadoop/hbase/HColumnDescriptor.html">HColumnDescriptor</a>(Bytes.toBytes(cf));
-<a class="jxr_linenumber" name="602" href="#602">602</a>       htd.addFamily(hcd);
-<a class="jxr_linenumber" name="603" href="#603">603</a>     }
-<a class="jxr_linenumber" name="604" href="#604">604</a>     LOG.warn(format(<span class="jxr_string">"Creating table '%s' with '%s' columns and default descriptors."</span>,
-<a class="jxr_linenumber" name="605" href="#605">605</a>       tableName, cfSet));
-<a class="jxr_linenumber" name="606" href="#606">606</a>     admin.createTable(htd);
-<a class="jxr_linenumber" name="607" href="#607">607</a>   }
-<a class="jxr_linenumber" name="608" href="#608">608</a> 
-<a class="jxr_linenumber" name="609" href="#609">609</a>   <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">void</strong> deleteTable(Configuration conf, String[] args) {
-<a class="jxr_linenumber" name="610" href="#610">610</a>     <a href="../../../../../org/apache/hadoop/hbase/TableName.html">TableName</a> tableName = TableName.valueOf(args[0]);
-<a class="jxr_linenumber" name="611" href="#611">611</a>     <strong class="jxr_keyword">try</strong> (Connection connection = ConnectionFactory.createConnection(conf);
-<a class="jxr_linenumber" name="612" href="#612">612</a>          <a href="../../../../../org/apache/hadoop/hbase/client/Admin.html">Admin</a> admin = connection.getAdmin()) {
-<a class="jxr_linenumber" name="613" href="#613">613</a>       <strong class="jxr_keyword">try</strong> {
-<a class="jxr_linenumber" name="614" href="#614">614</a>         admin.disableTable(tableName);
-<a class="jxr_linenumber" name="615" href="#615">615</a>       } <strong class="jxr_keyword">catch</strong> (TableNotEnabledException e) {
-<a class="jxr_linenumber" name="616" href="#616">616</a>         LOG.debug(<span class="jxr_string">"Dry mode: Table: "</span> + tableName + <span class="jxr_string">" already disabled, so just deleting it."</span>);
-<a class="jxr_linenumber" name="617" href="#617">617</a>       }
-<a class="jxr_linenumber" name="618" href="#618">618</a>       admin.deleteTable(tableName);
-<a class="jxr_linenumber" name="619" href="#619">619</a>     } <strong class="jxr_keyword">catch</strong> (IOException e) {
-<a class="jxr_linenumber" name="620" href="#620">620</a>       LOG.error(format(<span class="jxr_string">"***Dry run: Failed to delete table '%s'.***%n%s"</span>, tableName,
-<a class="jxr_linenumber" name="621" href="#621">621</a>           e.toString()));
-<a class="jxr_linenumber" name="622" href="#622">622</a>       <strong class="jxr_keyword">return</strong>;
-<a class="jxr_linenumber" name="623" href="#623">623</a>     }
-<a class="jxr_linenumber" name="624" href="#624">624</a>     LOG.info(format(<span class="jxr_string">"Dry run: Deleted table '%s'."</span>, tableName));
-<a class="jxr_linenumber" name="625" href="#625">625</a>   }
-<a class="jxr_linenumber" name="626" href="#626">626</a> 
-<a class="jxr_linenumber" name="627" href="#627">627</a>   <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">static</strong> Set&lt;String&gt; getColumnFamilies(String[] columns) {
-<a class="jxr_linenumber" name="628" href="#628">628</a>     Set&lt;String&gt; cfSet = <strong class="jxr_keyword">new</strong> HashSet&lt;String&gt;();
-<a class="jxr_linenumber" name="629" href="#629">629</a>     <strong class="jxr_keyword">for</strong> (String aColumn : columns) {
-<a class="jxr_linenumber" name="630" href="#630">630</a>       <strong class="jxr_keyword">if</strong> (TsvParser.ROWKEY_COLUMN_SPEC.equals(aColumn)
-<a class="jxr_linenumber" name="631" href="#631">631</a>           || TsvParser.TIMESTAMPKEY_COLUMN_SPEC.equals(aColumn)
-<a class="jxr_linenumber" name="632" href="#632">632</a>           || TsvParser.CELL_VISIBILITY_COLUMN_SPEC.equals(aColumn)
-<a class="jxr_linenumber" name="633" href="#633">633</a>           || TsvParser.CELL_TTL_COLUMN_SPEC.equals(aColumn)
-<a class="jxr_linenumber" name="634" href="#634">634</a>           || TsvParser.ATTRIBUTES_COLUMN_SPEC.equals(aColumn))
-<a class="jxr_linenumber" name="635" href="#635">635</a>         <strong class="jxr_keyword">continue</strong>;
-<a class="jxr_linenumber" name="636" href="#636">636</a>       <em class="jxr_comment">// we are only concerned with the first one (in case this is a cf:cq)</em>
-<a class="jxr_linenumber" name="637" href="#637">637</a>       cfSet.add(aColumn.split(<span class="jxr_string">":"</span>, 2)[0]);
-<a class="jxr_linenumber" name="638" href="#638">638</a>     }
-<a class="jxr_linenumber" name="639" href="#639">639</a>     <strong class="jxr_keyword">return</strong> cfSet;
-<a class="jxr_linenumber" name="640" href="#640">640</a>   }
-<a class="jxr_linenumber" name="641" href="#641">641</a> 
-<a class="jxr_linenumber" name="642" href="#642">642</a>   <em class="jxr_comment">/*</em>
-<a class="jxr_linenumber" name="643" href="#643">643</a> <em class="jxr_comment">   * @param errorMsg Error message.  Can be null.</em>
-<a class="jxr_linenumber" name="644" href="#644">644</a> <em class="jxr_comment">   */</em>
-<a class="jxr_linenumber" name="645" href="#645">645</a>   <strong class="jxr_keyword">private</strong> <strong class="jxr_keyword">static</strong> <strong class="jxr_keyword">void</strong> usage(<strong class="jxr_keyword">final</strong> String errorMsg) {
-<a class="jxr_linenumber" name="646" href="#646">646</a>     <strong class="jxr_keyword">if</strong> (errorMsg != <strong class="jxr_keyword">null</strong> &amp;&amp; errorMsg.length() &gt; 0) {
-<a class="jxr_linenumber" name="647" href="#647">647</a>       System.err.println(<span class="jxr_string">"ERROR: "</span> + errorMsg);
-<a class="jxr_linenumber" name="648" href="#648">648</a>     }
-<a class="jxr_linenumber" name="649" href="#649">649</a>     String usage =
-<a class="jxr_linenumber" name="650" href="#650">650</a>       <span class="jxr_string">"Usage: "</span> + NAME + <span class="jxr_string">" -D"</span>+ COLUMNS_CONF_KEY + <span class="jxr_string">"=a,b,c &lt;tablename&gt; &lt;inputdir&gt;\n"</span> +
-<a class="jxr_linenumber" name="651" href="#651">651</a>       <span class="jxr_string">"\n"</span> +
-<a class="jxr_linenumber" name="652" href="#652">652</a>       <span class="jxr_string">"Imports the given input directory of TSV data into the specified table.\n"</span> +
-<a class="jxr_linenumber" name="653" href="#653">653</a>       <span class="jxr_string">"\n"</span> +
-<a class="jxr_linenumber" name="654" href="#654">654</a>       <span class="jxr_string">"The column names of the TSV data must be specified using the -D"</span> + COLUMNS_CONF_KEY + <span class="jxr_string">"\n"</span> +
-<a class="jxr_linenumber" name="655" href="#655">655</a>       <span class="jxr_string">"option. This option takes the form of comma-separated column names, where each\n"</span> +
-<a class="jxr_linenumber" name="656" href="#656">656</a>       <span class="jxr_string">"column name is either a simple column family, or a columnfamily:qualifier. The special\n"</span> +
-<a class="jxr_linenumber" name="657" href="#657">657</a>       <span class="jxr_string">"column name "</span> + TsvParser.ROWKEY_COLUMN_SPEC + <span class="jxr_string">" is used to designate that this column should be used\n"</span> +
-<a class="jxr_linenumber" name="658" href="#658">658</a>       <span class="jxr_string">"as the row key for each imported record. You must specify exactly one column\n"</span> +
-<a class="jxr_linenumber" name="659" href="#659">659</a>       <span class="jxr_string">"to be the row key, and you must specify a column name for every column that exists in the\n"</span> +
-<a class="jxr_linenumber" name="660" href="#660">660</a>       <span class="jxr_string">"input data. Another special column"</span> + TsvParser.TIMESTAMPKEY_COLUMN_SPEC +
-<a class="jxr_linenumber" name="661" href="#661">661</a>       <span class="jxr_string">" designates that this column should be\n"</span> +
-<a class="jxr_linenumber" name="662" href="#662">662</a>       <span class="jxr_string">"used as timestamp for each record. Unlike "</span> + TsvParser.ROWKEY_COLUMN_SPEC + <span class="jxr_string">", "</span> +
-<a class="jxr_linenumber" name="663" href="#663">663</a>       TsvParser.TIMESTAMPKEY_COLUMN_SPEC + <span class="jxr_string">" is optional."</span> + <span class="jxr_string">"\n"</span> +
-<a class="jxr_linenumber" name="664" href="#664">664</a>       <span class="jxr_string">"You must specify at most one column as timestamp key for each imported record.\n"</span> +
-<a class="jxr_linenumber" name="665" href="#665">665</a>       <span class="jxr_string">"Record with invalid timestamps (blank, non-numeric) will be treated as bad record.\n"</span> +
-<a class="jxr_linenumber" name="666" href="#666">666</a>       <span class="jxr_string">"Note: if you use this option, then '"</span> + TIMESTAMP_CONF_KEY + <span class="jxr_string">"' option will be ignored.\n"</span> +
-<a class="jxr_linenumber" name="667" href="#667">667</a>       <span class="jxr_string">"\n"</span> +
-<a class="jxr_linenumber" name="668" href="#668">668</a>       <span class="jxr_string">"Other special columns that can be specified are "</span> + TsvParser.CELL_TTL_COLUMN_SPEC +
-<a class="jxr_linenumber" name="669" href="#669">669</a>       <span class="jxr_string">" and "</span> + TsvParser.CELL_VISIBILITY_COLUMN_SPEC + <span class="jxr_string">".\n"</span> +
-<a class="jxr_linenumber" name="670" href="#670">670</a>       TsvParser.CELL_TTL_COLUMN_SPEC + <span class="jxr_string">" designates that this column will be used "</span> +
-<a class="jxr_linenumber" name="671" href="#671">671</a>       <span class="jxr_string">"as a Cell's Time To Live (TTL) attribute.\n"</span> +
-<a class="jxr_linenumber" name="672" href="#672">672</a>       TsvParser.CELL_VISIBILITY_COLUMN_SPEC + <span class="jxr_string">" designates that this column contains the "</span> +
-<a class="jxr_linenumber" name="673" href="#673">673</a>       <span class="jxr_string">"visibility label expression.\n"</span> +
-<a class="jxr_linenumber" name="674" href="#674">674</a>       <span class="jxr_string">"\n"</span> +
-<a class="jxr_linenumber" name="675" href="#675">675</a>       TsvParser.ATTRIBUTES_COLUMN_SPEC+<span class="jxr_string">" can be used to specify Operation Attributes per record.\n"</span>+
-<a class="jxr_linenumber" name="676" href="#676">676</a>       <span class="jxr_string">" Should be specified as key=&gt;value where "</span>+TsvParser.DEFAULT_ATTRIBUTES_COLUMN_INDEX+ <span class="jxr_string">" is used \n"</span>+
-<a class="jxr_linenumber" name="677" href="#677">677</a>       <span class="jxr_string">" as the seperator.  Note that more than one OperationAttributes can be specified.\n"</span>+
-<a class="jxr_linenumber" name="678" href="#678">678</a>       <span class="jxr_string">"By default importtsv will load data directly into HBase. To instead generate\n"</span> +
-<a class="jxr_linenumber" name="679" href="#679">679</a>       <span class="jxr_string">"HFiles of data to prepare for a bulk data load, pass the option:\n"</span> +
-<a class="jxr_linenumber" name="680" href="#680">680</a>       <span class="jxr_string">"  -D"</span> + BULK_OUTPUT_CONF_KEY + <span class="jxr_string">"=/path/for/output\n"</span> +
-<a class="jxr_linenumber" name="681" href="#681">681</a>       <span class="jxr_string">"  Note: if you do not use this option, then the target table must already exist in HBase\n"</span> +
-<a class="jxr_linenumber" name="682" href="#682">682</a>       <span class="jxr_string">"\n"</span> +
-<a class="jxr_linenumber" name="683" href="#683">683</a>       <span class="jxr_string">"Other options that may be specified with -D include:\n"</span> +
-<a class="jxr_linenumber" name="684" href="#684">684</a>       <span class="jxr_string">"  -D"</span> + DRY_RUN_CONF_KEY + <span class="jxr_string">"=true - Dry run mode. Data is not actually populated into"</span> +
-<a class="jxr_linenumber" name="685" href="#685">685</a>       <span class="jxr_string">" table. If table does not exist, it is created but deleted in the end.\n"</span> +
-<a class="jxr_linenumber" name="686" href="#686">686</a>       <span class="jxr_string">"  -D"</span> + SKIP_LINES_CONF_KEY + <span class="jxr_string">"=false - fail if encountering an invalid line\n"</span> +
-<a class="jxr_linenumber" name="687" href="#687">687</a>       <span class="jxr_string">"  -D"</span> + LOG_BAD_LINES_CONF_KEY + <span class="jxr_string">"=true - logs invalid lines to stderr\n"</span> +
-<a class="jxr_linenumber" name="688" href="#688">688</a>       <span class="jxr_string">"  '-D"</span> + SEPARATOR_CONF_KEY + <span class="jxr_string">"=|' - eg separate on pipes instead of tabs\n"</span> +
-<a class="jxr_linenumber" name="689" href="#689">689</a>       <span class="jxr_string">"  -D"</span> + TIMESTAMP_CONF_KEY + <span class="jxr_string">"=currentTimeAsLong - use the specified timestamp for the import\n"</span> +
-<a class="jxr_linenumber" name="690" href="#690">690</a>       <span class="jxr_string">"  -D"</span> + MAPPER_CONF_KEY + <span class="jxr_string">"=my.Mapper - A user-defined Mapper to use instead of "</span> +
-<a class="jxr_linenumber" name="691" href="#691">691</a>       DEFAULT_MAPPER.getName() + <span class="jxr_string">"\n"</span> +
-<a class="jxr_linenumber" name="692" href="#692">692</a>       <span class="jxr_string">"  -D"</span> + JOB_NAME_CONF_KEY + <span class="jxr_string">"=jobName - use the specified mapreduce job name for the import\n"</span> +
-<a class="jxr_linenumber" name="693" href="#693">693</a>       <span class="jxr_string">"  -D"</span> + CREATE_TABLE_CONF_KEY + <span class="jxr_string">"=no - can be used to avoid creation of table by this tool\n"</span> +
-<a class="jxr_linenumber" name="694" href="#694">694</a>       <span class="jxr_string">"  Note: if you set this to 'no', then the target table must already exist in HBase\n"</span> +
-<a class="jxr_linenumber" name="695" href="#695">695</a>       <span class="jxr_string">"  -D"</span> + NO_STRICT_COL_FAMILY + <span class="jxr_string">"=true - ignore column family check in hbase table. "</span> +
-<a class="jxr_linenumber" name="696" href="#696">696</a>       <span class="jxr_string">"Default is false\n\n"</span> +
-<a class="jxr_linenumber" name="697" href="#697">697</a>       <span class="jxr_string">"For performance consider the following options:\n"</span> +
-<a class="jxr_linenumber" name="698" href="#698">698</a>       <span class="jxr_string">"  -Dmapreduce.map.speculative=false\n"</span> +
-<a class="jxr_linenumber" name="699" href="#699">699</a>       <span class="jxr_string">"  -Dmapreduce.reduce.speculative=false"</span>;
-<a class="jxr_linenumber" name="700" href="#700">700</a> 
-<a class="jxr_linenumber" name="701" href="#701">701</a>     System.err.println(usage);
-<a class="jxr_linenumber" name="702" href="#702">702</a>   }
-<a class="jxr_linenumber" name="703" href="#703">703</a> 
-<a class="jxr_linenumber" name="704" href="#704">704</a>   @Override
-<a class="jxr_linenumber" name="705" href="#705">705</a>   <strong class="jxr_keyword">public</strong> <strong class="jxr_keyword">int</strong> run(String[] args) <strong class="jxr_keyword">throws</strong> Exception {
-<a class="jxr_linenumber" name="706" href="#706">706</a>     <strong class="jxr_keyword">if</strong> (args.length &lt; 2) {
-<a class="jxr_linenumber" name="707" href="#707">707</a>       usage(<span class="jxr_string">"Wrong number of arguments: "</span> + args.length);
-<a class="jxr_linenumber" name="708" href="#708">708</a>       <strong class="jxr_keyword">return</strong> -1;
-<a class="jxr_linenumber" name="709" href="#709">709</a>     }
-<a class="jxr_linenumber" name="710" href="#710">710</a> 
-<a class="jxr_linenumber" name="711" href="#711">711</a>     <em class="jxr_comment">// When MAPPER_CONF_KEY is null, the user wants to use the provided TsvImporterMapper, so</em>
-<a class="jxr_linenumber" name="712" href="#712">712</a>     <em class="jxr_comment">// perform validation on these additional args. When it's not null, user has provided their</em>
-<a class="jxr_linenumber" name="713" href="#713">713</a>     <em class="jxr_comment">// own mapper, thus these validation are not relevant.</em>
-<a class="jxr_linenumber" name="714" href="#714">714</a>     <em class="jxr_comment">// TODO: validation for TsvImporterMapper, not this tool. Move elsewhere.</em>
-<a class="jxr_linenumber" name="715" href="#715">715</a>     <strong class="jxr_keyword">if</strong> (<strong class="jxr_keyword">null</strong> == getConf().get(MAPPER_CONF_KEY)) {
-<a class="jxr_linenumber" name="716" href="#716">716</a>       <em class="jxr_comment">// Make sure columns are specified</em>
-<a class="jxr_linenumber" name="717" href="#717">717</a>       String[] columns = getConf().getStrings(COLUMNS_CONF_KEY);
-<a class="jxr_linenumber" name="718" href="#718">718</a>       <strong class="jxr_keyword">if</strong> (columns == <strong class="jxr_keyword">null</strong>) {
-<a class="jxr_linenumber" name="719" href="#719">719</a>         usage(<span class="jxr_string">"No columns specified. Please specify with -D"</span> +
-<a class="jxr_linenumber" name="720" href="#720">720</a>             COLUMNS_CONF_KEY+<span class="jxr_string">"=..."</span>);
-<a class="jxr_linenumber" name="721" href="#721">721</a>         <strong class="jxr_keyword">return</strong> -1;
-<a class="jxr_linenumber" name="722" href="#722">722</a>       }
-<a class="jxr_linenumber" name="723" href="#723">723</a> 
-<a class="jxr_linenumber" name="724" href="#724">724</a>       <em class="jxr_comment">// Make sure they specify exactly one column as the row key</em>
-<a class="jxr_linenumber" name="725" href="#725">725</a>       <strong class="jxr_keyword">int</strong> rowkeysFound = 0;
-<a class="jxr_linenumber" name="726" href="#726">726</a>       <strong class="jxr_keyword">for</strong> (String col : columns) {
-<a class="jxr_linenumber" name="727" href="#727">727</a>         <strong class="jxr_keyword">if</strong> (col.equals(TsvParser.ROWKEY_COLUMN_SPEC)) rowkeysFound++;
-<a class="jxr_linenumber" name="728" href="#728">728</a>       }
-<a class="jxr_linenumber" name="729" href="#729">729</a>       <strong class="jxr_keyword">if</strong> (rowkeysFound != 1) {
-<a class="jxr_linenumber" name="730" href="#730">730</a>         usage(<span class="jxr_string">"Must specify exactly one column as "</span> + TsvParser.ROWKEY_COLUMN_SPEC);
-<a class="jxr_linenumber" name="731" href="#731">731</a>         <strong class="jxr_keyword">return</strong> -1;
-<a class="jxr_linenumber" name="732" href="#732">732</a>       }
-<a class="jxr_linenumber" name="733" href="#733">733</a> 
-<a class="jxr_linenumber" name="734" href="#734">734</a>       <em class="jxr_comment">// Make sure we have at most one column as the timestamp key</em>
-<a class="jxr_linenumber" name="735" href="#735">735</a>       <strong class="jxr_keyword">int</strong> tskeysFound = 0;
-<a class="jxr_linenumber" name="736" href="#736">736</a>       <strong class="jxr_keyword">for</strong> (String col : columns) {
-<a class="jxr_linenumber" name="737" href="#737">737</a>         <strong class="jxr_keyword">if</strong> (col.equals(TsvParser.TIMESTAMPKEY_COLUMN_SPEC))
-<a class="jxr_linenumber" name="738" href="#738">738</a>           tskeysFound++;
-<a class="jxr_linenumber" name="739" href="#739">739</a>       }
-<a class="jxr_linenumber" name="740" href="#740">740</a>       <strong class="jxr_keyword">if</strong> (tskeysFound &gt; 1) {
-<a class="jxr_linenumber" name="741" href="#741">741</a>         usage(<span class="jxr_string">"Must specify at most one column as "</span>
-<a class="jxr_linenumber" name="742" href="#742">742</a>             + TsvParser.TIMESTAMPKEY_COLUMN_SPEC);
-<a class="jxr_linenumber" name="743" href="#743">743</a>         <strong class="jxr_keyword">return</strong> -1;
-<a class="jxr_linenumber" name="744" href="#744">744</a>       }
-<a class="jxr_linenumber" name="745" href="#745">745</a> 
-<a class="jxr_linenumber" name="746" href="#746">746</a>       <strong class="jxr_keyword">int</strong> attrKeysFound = 0;
-<a class="jxr_linenumber" name="747" href="#747">747</a>       <strong class="jxr_keyword">for</strong> (String col : columns) {
-<a class="jxr_linenumber" name="748" href="#748">748</a>         <strong class="jxr_keyword">if</strong> (col.equals(TsvParser.ATTRIBUTES_COLUMN_SPEC))
-<a class="jxr_linenumber" name="749" href="#749">749</a>           attrKeysFound++;
-<a class="jxr_linenumber" name="750" href="#750">750</a>       }
-<a class="jxr_linenumber" name="751" href="#751">751</a>       <strong class="jxr_keyword">if</strong> (attrKeysFound &gt; 1) {
-<a class="jxr_linenumber" name="752" href="#752">752</a>         usage(<span class="jxr_string">"Must specify at most one column as "</span>
-<a class="jxr_linenumber" name="753" href="#753">753</a>             + TsvParser.ATTRIBUTES_COLUMN_SPEC);
-<a class="jxr_linenumber" nam

<TRUNCATED>