You are viewing a plain text version of this content. The canonical link for it is here.
Posted to oak-commits@jackrabbit.apache.org by re...@apache.org on 2015/10/27 13:45:45 UTC
svn commit: r1710798 - in /jackrabbit/oak/branches/1.2: ./
oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java
Author: reschke
Date: Tue Oct 27 12:45:45 2015
New Revision: 1710798
URL: http://svn.apache.org/viewvc?rev=1710798&view=rev
Log:
OAK-3532: simple tool for dumping RDB tables (ported to 1.2)
Added:
jackrabbit/oak/branches/1.2/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java
- copied, changed from r1709852, jackrabbit/oak/trunk/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java
Modified:
jackrabbit/oak/branches/1.2/ (props changed)
Propchange: jackrabbit/oak/branches/1.2/
------------------------------------------------------------------------------
--- svn:mergeinfo (original)
+++ svn:mergeinfo Tue Oct 27 12:45:45 2015
@@ -1,3 +1,3 @@
/jackrabbit/oak/branches/1.0:1665962
-/jackrabbit/oak/trunk:1672350,1672468,1672537,1672603,1672642,1672644,1672834-1672835,1673351,1673410,1673414-1673415,1673436,1673644,1673662-1673664,1673669,1673695,1673713,1673738,1673787,1673791,1674046,1674065,1674075,1674107,1674228,1674780,1674880,1675054-1675055,1675319,1675332,1675354,1675357,1675382,1675555,1675566,1675593,1676198,1676237,1676407,1676458,1676539,1676670,1676693,1676703,1676725,1677579,1677581,1677609,1677611,1677774,1677788,1677797,1677804,1677806,1677939,1677991,1678023,1678095-1678096,1678124,1678171,1678173,1678211,1678323,1678758,1678938,1678954,1679144,1679165,1679191,1679232,1679235,1679503,1679958,1679961,1680170,1680172,1680182,1680222,1680232,1680236,1680461,1680633,1680643,1680747,1680805-1680806,1680903,1681282,1681767,1681918,1681955,1682042,1682218,1682235,1682437,1682494,1682555,1682855,1682904,1683059,1683089,1683213,1683249,1683259,1683278,1683323,1683687,1683700,1684174-1684175,1684186,1684376,1684442,1684561,1684570,1684601,1684618,1684820
,1684868,1685023,1685075,1685370,1685552,1685589-1685590,1685840,1685964,1685977,1685989,1685999,1686023,1686032,1686097,1686162,1686229,1686234,1686253,1686414,1686780,1686854,1686857,1686971,1687053-1687055,1687175,1687196,1687198,1687220,1687239-1687240,1687301,1687441,1687553,1688089-1688090,1688172,1688179,1688349,1688421,1688436,1688453,1688616,1688622,1688634,1688636,1688817,1689003-1689004,1689008,1689577,1689581,1689623,1689810,1689828,1689831,1689833,1689903,1690017,1690043,1690047,1690057,1690247,1690249,1690634-1690637,1690650,1690669,1690674,1690885,1690941,1691139,1691151,1691159,1691167,1691183,1691188,1691210,1691280,1691307,1691331-1691333,1691345,1691384-1691385,1691401,1691509,1692133-1692134,1692156,1692250,1692274,1692363,1692382,1692478,1692955,1693002,1693030,1693209,1693421,1693525-1693526,1694007,1694393-1694394,1694651,1694653-1694654,1695032,1695050,1695122,1695280,1695299,1695420,1695457,1695482,1695507,1695521,1695540,1696190,1696194,1696242,1696285,1696
375,1696522,1696578,1696759,1696916,1697363,1697373,1697410,1697582,1697589,1697616,1697672,1700191,1700231,1700397,1700403,1700506,1700571,1700727,1700749,1700769,1700775,1701065,1701619,1701733,1701743,1701750,1701768,1701806,1701810,1701814,1701948,1701955,1701959,1701965,1701986,1702014,1702022,1702051,1702241,1702272,1702387,1702405,1702423,1702860,1702942,1702960,1703212,1703382,1703395,1703411,1703428,1703430,1703568,1703592,1703758,1703858,1703878,1704256,1704282,1704285,1704457,1704479,1704490,1704614,1704629,1704636,1704655,1704670,1704886,1705005,1705027,1705043,1705055,1705250,1705268,1705273,1705323,1705677,1705701,1705871,1705992,1706212,1706764,1706772,1707049,1707191,1707435,1708105,1708315,1708546,1708592,1708766,1709012,1710031,1710049,1710559,1710575,1710614,1710637
+/jackrabbit/oak/trunk:1672350,1672468,1672537,1672603,1672642,1672644,1672834-1672835,1673351,1673410,1673414-1673415,1673436,1673644,1673662-1673664,1673669,1673695,1673713,1673738,1673787,1673791,1674046,1674065,1674075,1674107,1674228,1674780,1674880,1675054-1675055,1675319,1675332,1675354,1675357,1675382,1675555,1675566,1675593,1676198,1676237,1676407,1676458,1676539,1676670,1676693,1676703,1676725,1677579,1677581,1677609,1677611,1677774,1677788,1677797,1677804,1677806,1677939,1677991,1678023,1678095-1678096,1678124,1678171,1678173,1678211,1678323,1678758,1678938,1678954,1679144,1679165,1679191,1679232,1679235,1679503,1679958,1679961,1680170,1680172,1680182,1680222,1680232,1680236,1680461,1680633,1680643,1680747,1680805-1680806,1680903,1681282,1681767,1681918,1681955,1682042,1682218,1682235,1682437,1682494,1682555,1682855,1682904,1683059,1683089,1683213,1683249,1683259,1683278,1683323,1683687,1683700,1684174-1684175,1684186,1684376,1684442,1684561,1684570,1684601,1684618,1684820
,1684868,1685023,1685075,1685370,1685552,1685589-1685590,1685840,1685964,1685977,1685989,1685999,1686023,1686032,1686097,1686162,1686229,1686234,1686253,1686414,1686780,1686854,1686857,1686971,1687053-1687055,1687175,1687196,1687198,1687220,1687239-1687240,1687301,1687441,1687553,1688089-1688090,1688172,1688179,1688349,1688421,1688436,1688453,1688616,1688622,1688634,1688636,1688817,1689003-1689004,1689008,1689577,1689581,1689623,1689810,1689828,1689831,1689833,1689903,1690017,1690043,1690047,1690057,1690247,1690249,1690634-1690637,1690650,1690669,1690674,1690885,1690941,1691139,1691151,1691159,1691167,1691183,1691188,1691210,1691280,1691307,1691331-1691333,1691345,1691384-1691385,1691401,1691509,1692133-1692134,1692156,1692250,1692274,1692363,1692382,1692478,1692955,1693002,1693030,1693209,1693421,1693525-1693526,1694007,1694393-1694394,1694651,1694653-1694654,1695032,1695050,1695122,1695280,1695299,1695420,1695457,1695482,1695507,1695521,1695540,1696190,1696194,1696242,1696285,1696
375,1696522,1696578,1696759,1696916,1697363,1697373,1697410,1697582,1697589,1697616,1697672,1700191,1700231,1700397,1700403,1700506,1700571,1700727,1700749,1700769,1700775,1701065,1701619,1701733,1701743,1701750,1701768,1701806,1701810,1701814,1701948,1701955,1701959,1701965,1701986,1702014,1702022,1702051,1702241,1702272,1702387,1702405,1702423,1702860,1702942,1702960,1703212,1703382,1703395,1703411,1703428,1703430,1703568,1703592,1703758,1703858,1703878,1704256,1704282,1704285,1704457,1704479,1704490,1704614,1704629,1704636,1704655,1704670,1704886,1705005,1705027,1705043,1705055,1705250,1705268,1705273,1705323,1705677,1705701,1705871,1705992,1706212,1706764,1706772,1707049,1707191,1707435,1708105,1708315,1708546,1708592,1708766,1709012,1709852,1709978,1710013,1710031,1710049,1710205,1710242,1710559,1710575,1710590,1710614,1710637
/jackrabbit/trunk:1345480
Copied: jackrabbit/oak/branches/1.2/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java (from r1709852, jackrabbit/oak/trunk/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java)
URL: http://svn.apache.org/viewvc/jackrabbit/oak/branches/1.2/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java?p2=jackrabbit/oak/branches/1.2/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java&p1=jackrabbit/oak/trunk/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java&r1=1709852&r2=1710798&rev=1710798&view=diff
==============================================================================
--- jackrabbit/oak/trunk/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java (original)
+++ jackrabbit/oak/branches/1.2/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java Tue Oct 27 12:45:45 2015
@@ -16,39 +16,216 @@
*/
package org.apache.jackrabbit.oak.plugins.document.rdb;
+import java.io.BufferedReader;
+import java.io.File;
+import java.io.FileInputStream;
+import java.io.FileOutputStream;
+import java.io.IOException;
+import java.io.InputStream;
+import java.io.InputStreamReader;
+import java.io.OutputStream;
+import java.io.PrintStream;
+import java.nio.charset.Charset;
import java.sql.Connection;
import java.sql.DriverManager;
import java.sql.ResultSet;
+import java.sql.ResultSetMetaData;
import java.sql.SQLException;
import java.sql.Statement;
+import java.sql.Types;
+import java.util.ArrayList;
import java.util.HashSet;
+import java.util.Set;
+import org.apache.commons.io.IOUtils;
+import org.apache.jackrabbit.oak.commons.json.JsopBuilder;
import org.apache.jackrabbit.oak.plugins.document.Collection;
+import org.apache.jackrabbit.oak.plugins.document.Document;
+import org.apache.jackrabbit.oak.plugins.document.DocumentStoreException;
import org.apache.jackrabbit.oak.plugins.document.NodeDocument;
import org.apache.jackrabbit.oak.plugins.document.memory.MemoryDocumentStore;
+import org.apache.jackrabbit.oak.util.OakVersion;
+/**
+ * Utility for dumping contents from {@link RDBDocumentStore}'s tables.
+ */
public class RDBExport {
- public static void main(String[] args) throws ClassNotFoundException, SQLException {
- String url = null, user = null, pw = null, table = null, query = null;
- RDBDocumentSerializer ser = new RDBDocumentSerializer(new MemoryDocumentStore(), new HashSet<String>());
+ private static final Charset UTF8 = Charset.forName("UTF-8");
+
+ public static void main(String[] args) throws ClassNotFoundException, SQLException, IOException {
+ String url = null, user = null, pw = null, table = "nodes", query = null, dumpfile = null, lobdir = null;
+ boolean asArray = false;
+ PrintStream out = System.out;
+ Set<String> excl = new HashSet<String>();
+ excl.add(Document.ID);
+ RDBDocumentSerializer ser = new RDBDocumentSerializer(new MemoryDocumentStore(), excl);
+
+ String param = null;
try {
- url = args[0];
- user = args[1];
- pw = args[2];
- table = args[3];
- query = args.length >= 5 ? args[4] : null;
+ for (int i = 0; i < args.length; i++) {
+ param = args[i];
+ if ("-u".equals(param) || "--username".equals(param)) {
+ user = args[++i];
+ } else if ("-p".equals(param) || "--password".equals(param)) {
+ pw = args[++i];
+ } else if ("-c".equals(param) || "--collection".equals(param)) {
+ table = args[++i];
+ } else if ("-j".equals(param) || "--jdbc-url".equals(param)) {
+ url = args[++i];
+ } else if ("-q".equals(param) || "--query".equals(param)) {
+ query = args[++i];
+ } else if ("-o".equals(param) || "--out".equals(param)) {
+ OutputStream os = new FileOutputStream(args[++i]);
+ out = new PrintStream(os, true, "UTF-8");
+ } else if ("--from-db2-dump".equals(param)) {
+ dumpfile = args[++i];
+ } else if ("--lobdir".equals(param)) {
+ lobdir = args[++i];
+ } else if ("--jsonArray".equals(param)) {
+ asArray = true;
+ } else if ("--version".equals(param)) {
+ System.out.println(RDBExport.class.getName() + " version " + OakVersion.getVersion());
+ System.exit(0);
+ } else if ("--help".equals(param)) {
+ printHelp();
+ System.exit(0);
+ } else {
+ System.err.println(RDBExport.class.getName() + ": invalid parameter " + args[i]);
+ printUsage();
+ System.exit(2);
+ }
+ }
} catch (IndexOutOfBoundsException ex) {
- System.err.println("Usage: ... " + RDBCreator.class.getName() + " JDBC-URL username password table [query]");
+ System.err.println(RDBExport.class.getName() + ": value missing for parameter " + param);
+ printUsage();
+ System.exit(2);
+ }
+
+ if (dumpfile != null && url != null) {
+ System.err.println(RDBExport.class.getName() + ": must use either dump file or JDBC URL");
+ printUsage();
System.exit(2);
+ } else if (dumpfile != null) {
+ dumpFile(dumpfile, lobdir, asArray, out, ser);
+ } else {
+ dumpJDBC(url, user, pw, table, query, asArray, out, ser);
+ }
+
+ out.flush();
+ out.close();
+ }
+
+ /**
+  * Dumps the rows of a DB2 DEL export file as JSON documents, one document per output line.
+  * <p>
+  * Every input line is split with {@code parseDel}. Fields 0 to 5 are taken as id, modified,
+  * hasbinary, deletedonce, modcount and cmodcount, field 7 as the data string and field 8 as
+  * the reference to the binary data; field 6 is not used. A non-empty binary reference has
+  * all "/" characters removed and is then read from the right as
+  * {@code <file>.<startpos>.<length>}; that byte range is loaded from the named file inside
+  * the LOB directory.
+  * <p>
+  * Rows for which a {@link DocumentStoreException} is raised are reported on
+  * {@code System.err} and skipped. In array mode the output is enclosed in "[" and "]" lines
+  * and a "," is appended to every document except the last one, so that the result is a
+  * well-formed JSON array.
+  *
+  * @param filename name of the DEL export file
+  * @param lobdir   LOB directory, or {@code null} for "lobdir" next to the export file
+  * @param asArray  whether to emit a JSON array instead of one document per line
+  * @param out      stream receiving the JSON
+  * @param ser      serializer used to turn rows into documents
+  * @throws IOException if the export file or a LOB file cannot be read
+  */
+ private static void dumpFile(String filename, String lobdir, boolean asArray, PrintStream out, RDBDocumentSerializer ser)
+         throws IOException {
+     File f = new File(filename);
+     File lobDirectory = lobdir == null ? new File(f.getParentFile(), "lobdir") : new File(lobdir);
+     BufferedReader br = new BufferedReader(new InputStreamReader(new FileInputStream(f), UTF8));
+
+     try {
+         if (asArray) {
+             out.println("[");
+         }
+         // true while the most recently written document still lacks its line terminator;
+         // the terminator (and the array separator) is only written once we know whether
+         // another document follows, which avoids a trailing comma before "]"
+         boolean lineOpen = false;
+         String line = br.readLine();
+         while (line != null) {
+             ArrayList<String> fields = parseDel(line);
+             String id = fields.get(0);
+             String smodified = fields.get(1);
+             String shasbinary = fields.get(2);
+             String sdeletedonce = fields.get(3);
+             String smodcount = fields.get(4);
+             String scmodcount = fields.get(5);
+             String sdata = fields.get(7);
+             String sbdata = fields.get(8);
+
+             byte[] bytes = null;
+             if (sbdata.length() != 0) {
+                 // reference is parsed from the right: <file>.<startpos>.<length>
+                 String lobfile = sbdata.replace("/", "");
+                 int lastdot = lobfile.lastIndexOf('.');
+                 String length = lobfile.substring(lastdot + 1);
+                 lobfile = lobfile.substring(0, lastdot);
+                 lastdot = lobfile.lastIndexOf('.');
+                 String startpos = lobfile.substring(lastdot + 1);
+                 lobfile = lobfile.substring(0, lastdot);
+                 int s = Integer.parseInt(startpos);
+                 int l = Integer.parseInt(length);
+                 InputStream is = new FileInputStream(new File(lobDirectory, lobfile));
+                 try {
+                     bytes = new byte[l];
+                     IOUtils.skip(is, s);
+                     IOUtils.read(is, bytes, 0, l);
+                 } finally {
+                     // release the LOB file even when skipping or reading fails
+                     IOUtils.closeQuietly(is);
+                 }
+             }
+             try {
+                 RDBRow row = new RDBRow(id, "1".equals(shasbinary), "1".equals(sdeletedonce),
+                         smodified.length() == 0 ? 0 : Long.parseLong(smodified), Long.parseLong(smodcount),
+                         Long.parseLong(scmodcount), sdata, bytes);
+                 StringBuilder fulljson = dumpRow(ser, id, row);
+                 if (lineOpen) {
+                     // finish the previous document's line now that a successor exists
+                     out.println(asArray ? "," : "");
+                 }
+                 out.print(fulljson);
+                 lineOpen = true;
+             } catch (DocumentStoreException ex) {
+                 System.err.println("Error: skipping line for ID " + id + " because of " + ex.getMessage());
+             }
+             line = br.readLine();
+         }
+         if (lineOpen) {
+             // last document: line terminator only, no separator
+             out.println();
+         }
+         if (asArray) {
+             out.println("]");
+         }
+     } finally {
+         // closing the reader also closes the underlying file stream
+         IOUtils.closeQuietly(br);
+     }
+ }
+
+ /**
+  * Splits one line of a delimited export file into its field values.
+  * <p>
+  * Fields are separated by ','. A '"' as the very first character of a field opens a quoted
+  * section in which ',' is taken literally and a doubled '"' stands for a single literal
+  * quote character; a single '"' closes the quoted section again. A '"' that appears in an
+  * unquoted field after other characters is kept as is.
+  *
+  * @param line the line to split
+  * @return the field values in order; always contains at least one (possibly empty) entry
+  */
+ private static ArrayList<String> parseDel(String line) {
+ ArrayList<String> result = new ArrayList<String>();
+
+ boolean inQuoted = false;
+ char quotechar = '"';
+ char fielddelim = ',';
+ StringBuilder value = new StringBuilder();
+ for (int i = 0; i < line.length(); i++) {
+ char c = line.charAt(i);
+ if (!inQuoted) {
+ if (c == fielddelim) {
+ // end of field: store what was collected and start over
+ result.add(value.toString());
+ value = new StringBuilder();
+ } else {
+ // a quote only opens a quoted section when nothing was collected for this field yet
+ if (value.length() == 0 && c == quotechar) {
+ inQuoted = true;
+ } else {
+ value.append(c);
+ }
+ }
+ } else {
+ if (c == quotechar) {
+ if (i + 1 != line.length() && line.charAt(i + 1) == quotechar) {
+ // quoted quote char
+ value.append(c);
+ // skip the second quote of the pair
+ i += 1;
+ } else {
+ inQuoted = false;
+ }
+ } else {
+ value.append(c);
+ }
+ }
 }
+ // the last field has no trailing delimiter
+ result.add(value.toString());
+
+ return result;
+ }
+ private static void dumpJDBC(String url, String user, String pw, String table, String query, boolean asArray, PrintStream out,
+ RDBDocumentSerializer ser) throws SQLException {
String driver = RDBJDBCTools.driverForDBType(RDBJDBCTools.jdbctype(url));
try {
Class.forName(driver);
} catch (ClassNotFoundException ex) {
- System.err.println("Attempt to load class " + driver + " failed.");
+ System.err.println(RDBExport.class.getName() + ":attempt to load class " + driver + " failed:" + ex.getMessage());
}
Connection c = DriverManager.getConnection(url, user, pw);
c.setReadOnly(true);
@@ -59,21 +236,89 @@ public class RDBExport {
}
sql += " order by id";
ResultSet rs = stmt.executeQuery(sql);
+
+ if (asArray) {
+ out.println("[");
+ }
+ boolean needComma = asArray;
+ ResultSetMetaData rsm = null;
+ boolean idIsAscii = true;
while (rs.next()) {
- String id = rs.getString(1);
- long modified = rs.getLong(2);
- long modcount = rs.getLong(3);
- long cmodcount = rs.getLong(4);
- long hasBinary = rs.getLong(5);
- long deletedOnce = rs.getLong(6);
- String data = rs.getString(7);
- byte[] bdata = rs.getBytes(8);
+ if (rsm == null) {
+ rsm = rs.getMetaData();
+ idIsAscii = !isBinaryType(rsm.getColumnType(1));
+ }
+ String id = idIsAscii ? rs.getString("ID") : new String(rs.getBytes("ID"), UTF8);
+ long modified = rs.getLong("MODIFIED");
+ long modcount = rs.getLong("MODCOUNT");
+ long cmodcount = rs.getLong("CMODCOUNT");
+ long hasBinary = rs.getLong("HASBINARY");
+ long deletedOnce = rs.getLong("DELETEDONCE");
+ String data = rs.getString("DATA");
+ byte[] bdata = rs.getBytes("BDATA");
+
RDBRow row = new RDBRow(id, hasBinary == 1, deletedOnce == 1, modified, modcount, cmodcount, data, bdata);
- NodeDocument doc = ser.fromRow(Collection.NODES, row);
- System.out.println(ser.asString(doc));
+ StringBuilder fulljson = dumpRow(ser, id, row);
+ if (asArray && needComma && !rs.isLast()) {
+ fulljson.append(",");
+ }
+ out.println(fulljson);
+ needComma = true;
+ }
+ if (asArray) {
+ out.println("]");
}
+ out.close();
rs.close();
stmt.close();
c.close();
}
+
+ /**
+  * Builds the JSON text for one row, with the "_id" member placed first.
+  * <p>
+  * The row is converted with {@code ser.fromRow} for the NODES collection and serialized
+  * with {@code ser.asString}; the first character of that string (presumably the opening
+  * brace of the JSON object) is dropped and replaced by an object start carrying the
+  * escaped id.
+  *
+  * @param ser serializer used for the conversion
+  * @param id  document id to emit as "_id"
+  * @param row the row to convert
+  * @return the assembled JSON text
+  */
+ private static StringBuilder dumpRow(RDBDocumentSerializer ser, String id, RDBRow row) {
+     String serialized = ser.asString(ser.fromRow(Collection.NODES, row));
+     StringBuilder json = new StringBuilder("{\"_id\":\"");
+     JsopBuilder.escape(id, json);
+     json.append("\",").append(serialized.substring(1));
+     return json;
+ }
+
+ /**
+  * Tells whether a {@link Types} constant denotes one of the binary column types
+  * BINARY, VARBINARY or LONGVARBINARY.
+  *
+  * @param sqlType type code as defined in {@link Types}
+  * @return {@code true} for the three binary types, {@code false} for anything else
+  */
+ private static boolean isBinaryType(int sqlType) {
+     switch (sqlType) {
+         case Types.BINARY:
+         case Types.VARBINARY:
+         case Types.LONGVARBINARY:
+             return true;
+         default:
+             return false;
+     }
+ }
+
+ /**
+  * Prints a one-line summary of each supported invocation to {@code System.err}.
+  */
+ private static void printUsage() {
+     System.err.println("Usage: " + RDBExport.class.getName()
+             + " -j/--jdbc-url JDBC-URL [-u/--username username] [-p/--password password] [-c/--collection table] [-q/--query query] [-o/--out file] [--jsonArray]");
+     // the option is spelled in lower case because the argument parser compares
+     // case-sensitively against "--from-db2-dump"
+     System.err.println(
+             "Usage: " + RDBExport.class.getName() + " --from-db2-dump file [--lobdir lobdir] [-o/--out file] [--jsonArray]");
+     System.err.println("Usage: " + RDBExport.class.getName() + " --version");
+     System.err.println("Usage: " + RDBExport.class.getName() + " --help");
+ }
+
+ /**
+  * Prints the description of all command line options to {@code System.err}.
+  */
+ private static void printHelp() {
+     System.err.println("Export Apache OAK RDB data to JSON files");
+     System.err.println("");
+     System.err.println("Generic options:");
+     System.err.println(" --help produce this help message");
+     System.err.println(" --version show version information");
+     System.err.println("");
+     System.err.println("JDBC options:");
+     System.err.println(" -j/--jdbc-url JDBC-URL JDBC URL of database to connect to");
+     System.err.println(" -u/--username username database username");
+     System.err.println(" -p/--password password database password");
+     System.err.println(" -c/--collection table table name (defaults to 'nodes')");
+     System.err.println(" -q/--query query SQL where clause (minus 'where')");
+     System.err.println("");
+     System.err.println("Dump file options:");
+     // lower case, matching the case-sensitive comparison done by the argument parser
+     System.err.println(" --from-db2-dump file name of DB2 DEL export file");
+     System.err.println(" --lobdir dir name of DB2 DEL export file LOB directory");
+     System.err.println(" (defaults to ./lobdir under the dump file)");
+     System.err.println("");
+     System.err.println("Output options:");
+     System.err.println(" -o/--out file Output to name file (instead of stdout)");
+     System.err.println(" --jsonArray Output a JSON array (instead of one JSON doc per line)");
+ }
}