You are viewing a plain text version of this content. The canonical link for it is here.
Posted to oak-commits@jackrabbit.apache.org by re...@apache.org on 2015/10/27 13:45:45 UTC

svn commit: r1710798 - in /jackrabbit/oak/branches/1.2: ./ oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java

Author: reschke
Date: Tue Oct 27 12:45:45 2015
New Revision: 1710798

URL: http://svn.apache.org/viewvc?rev=1710798&view=rev
Log:
OAK-3532: simple tool for dumping RDB tables (ported to 1.2)

Added:
    jackrabbit/oak/branches/1.2/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java
      - copied, changed from r1709852, jackrabbit/oak/trunk/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java
Modified:
    jackrabbit/oak/branches/1.2/   (props changed)

Propchange: jackrabbit/oak/branches/1.2/
------------------------------------------------------------------------------
--- svn:mergeinfo (original)
+++ svn:mergeinfo Tue Oct 27 12:45:45 2015
@@ -1,3 +1,3 @@
 /jackrabbit/oak/branches/1.0:1665962
-/jackrabbit/oak/trunk:1672350,1672468,1672537,1672603,1672642,1672644,1672834-1672835,1673351,1673410,1673414-1673415,1673436,1673644,1673662-1673664,1673669,1673695,1673713,1673738,1673787,1673791,1674046,1674065,1674075,1674107,1674228,1674780,1674880,1675054-1675055,1675319,1675332,1675354,1675357,1675382,1675555,1675566,1675593,1676198,1676237,1676407,1676458,1676539,1676670,1676693,1676703,1676725,1677579,1677581,1677609,1677611,1677774,1677788,1677797,1677804,1677806,1677939,1677991,1678023,1678095-1678096,1678124,1678171,1678173,1678211,1678323,1678758,1678938,1678954,1679144,1679165,1679191,1679232,1679235,1679503,1679958,1679961,1680170,1680172,1680182,1680222,1680232,1680236,1680461,1680633,1680643,1680747,1680805-1680806,1680903,1681282,1681767,1681918,1681955,1682042,1682218,1682235,1682437,1682494,1682555,1682855,1682904,1683059,1683089,1683213,1683249,1683259,1683278,1683323,1683687,1683700,1684174-1684175,1684186,1684376,1684442,1684561,1684570,1684601,1684618,1684820
 ,1684868,1685023,1685075,1685370,1685552,1685589-1685590,1685840,1685964,1685977,1685989,1685999,1686023,1686032,1686097,1686162,1686229,1686234,1686253,1686414,1686780,1686854,1686857,1686971,1687053-1687055,1687175,1687196,1687198,1687220,1687239-1687240,1687301,1687441,1687553,1688089-1688090,1688172,1688179,1688349,1688421,1688436,1688453,1688616,1688622,1688634,1688636,1688817,1689003-1689004,1689008,1689577,1689581,1689623,1689810,1689828,1689831,1689833,1689903,1690017,1690043,1690047,1690057,1690247,1690249,1690634-1690637,1690650,1690669,1690674,1690885,1690941,1691139,1691151,1691159,1691167,1691183,1691188,1691210,1691280,1691307,1691331-1691333,1691345,1691384-1691385,1691401,1691509,1692133-1692134,1692156,1692250,1692274,1692363,1692382,1692478,1692955,1693002,1693030,1693209,1693421,1693525-1693526,1694007,1694393-1694394,1694651,1694653-1694654,1695032,1695050,1695122,1695280,1695299,1695420,1695457,1695482,1695507,1695521,1695540,1696190,1696194,1696242,1696285,1696
 375,1696522,1696578,1696759,1696916,1697363,1697373,1697410,1697582,1697589,1697616,1697672,1700191,1700231,1700397,1700403,1700506,1700571,1700727,1700749,1700769,1700775,1701065,1701619,1701733,1701743,1701750,1701768,1701806,1701810,1701814,1701948,1701955,1701959,1701965,1701986,1702014,1702022,1702051,1702241,1702272,1702387,1702405,1702423,1702860,1702942,1702960,1703212,1703382,1703395,1703411,1703428,1703430,1703568,1703592,1703758,1703858,1703878,1704256,1704282,1704285,1704457,1704479,1704490,1704614,1704629,1704636,1704655,1704670,1704886,1705005,1705027,1705043,1705055,1705250,1705268,1705273,1705323,1705677,1705701,1705871,1705992,1706212,1706764,1706772,1707049,1707191,1707435,1708105,1708315,1708546,1708592,1708766,1709012,1710031,1710049,1710559,1710575,1710614,1710637
+/jackrabbit/oak/trunk:1672350,1672468,1672537,1672603,1672642,1672644,1672834-1672835,1673351,1673410,1673414-1673415,1673436,1673644,1673662-1673664,1673669,1673695,1673713,1673738,1673787,1673791,1674046,1674065,1674075,1674107,1674228,1674780,1674880,1675054-1675055,1675319,1675332,1675354,1675357,1675382,1675555,1675566,1675593,1676198,1676237,1676407,1676458,1676539,1676670,1676693,1676703,1676725,1677579,1677581,1677609,1677611,1677774,1677788,1677797,1677804,1677806,1677939,1677991,1678023,1678095-1678096,1678124,1678171,1678173,1678211,1678323,1678758,1678938,1678954,1679144,1679165,1679191,1679232,1679235,1679503,1679958,1679961,1680170,1680172,1680182,1680222,1680232,1680236,1680461,1680633,1680643,1680747,1680805-1680806,1680903,1681282,1681767,1681918,1681955,1682042,1682218,1682235,1682437,1682494,1682555,1682855,1682904,1683059,1683089,1683213,1683249,1683259,1683278,1683323,1683687,1683700,1684174-1684175,1684186,1684376,1684442,1684561,1684570,1684601,1684618,1684820
 ,1684868,1685023,1685075,1685370,1685552,1685589-1685590,1685840,1685964,1685977,1685989,1685999,1686023,1686032,1686097,1686162,1686229,1686234,1686253,1686414,1686780,1686854,1686857,1686971,1687053-1687055,1687175,1687196,1687198,1687220,1687239-1687240,1687301,1687441,1687553,1688089-1688090,1688172,1688179,1688349,1688421,1688436,1688453,1688616,1688622,1688634,1688636,1688817,1689003-1689004,1689008,1689577,1689581,1689623,1689810,1689828,1689831,1689833,1689903,1690017,1690043,1690047,1690057,1690247,1690249,1690634-1690637,1690650,1690669,1690674,1690885,1690941,1691139,1691151,1691159,1691167,1691183,1691188,1691210,1691280,1691307,1691331-1691333,1691345,1691384-1691385,1691401,1691509,1692133-1692134,1692156,1692250,1692274,1692363,1692382,1692478,1692955,1693002,1693030,1693209,1693421,1693525-1693526,1694007,1694393-1694394,1694651,1694653-1694654,1695032,1695050,1695122,1695280,1695299,1695420,1695457,1695482,1695507,1695521,1695540,1696190,1696194,1696242,1696285,1696
 375,1696522,1696578,1696759,1696916,1697363,1697373,1697410,1697582,1697589,1697616,1697672,1700191,1700231,1700397,1700403,1700506,1700571,1700727,1700749,1700769,1700775,1701065,1701619,1701733,1701743,1701750,1701768,1701806,1701810,1701814,1701948,1701955,1701959,1701965,1701986,1702014,1702022,1702051,1702241,1702272,1702387,1702405,1702423,1702860,1702942,1702960,1703212,1703382,1703395,1703411,1703428,1703430,1703568,1703592,1703758,1703858,1703878,1704256,1704282,1704285,1704457,1704479,1704490,1704614,1704629,1704636,1704655,1704670,1704886,1705005,1705027,1705043,1705055,1705250,1705268,1705273,1705323,1705677,1705701,1705871,1705992,1706212,1706764,1706772,1707049,1707191,1707435,1708105,1708315,1708546,1708592,1708766,1709012,1709852,1709978,1710013,1710031,1710049,1710205,1710242,1710559,1710575,1710590,1710614,1710637
 /jackrabbit/trunk:1345480

Copied: jackrabbit/oak/branches/1.2/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java (from r1709852, jackrabbit/oak/trunk/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java)
URL: http://svn.apache.org/viewvc/jackrabbit/oak/branches/1.2/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java?p2=jackrabbit/oak/branches/1.2/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java&p1=jackrabbit/oak/trunk/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java&r1=1709852&r2=1710798&rev=1710798&view=diff
==============================================================================
--- jackrabbit/oak/trunk/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java (original)
+++ jackrabbit/oak/branches/1.2/oak-core/src/main/java/org/apache/jackrabbit/oak/plugins/document/rdb/RDBExport.java Tue Oct 27 12:45:45 2015
@@ -16,39 +16,216 @@
  */
 package org.apache.jackrabbit.oak.plugins.document.rdb;
 
+import java.io.BufferedReader;
+import java.io.File;
+import java.io.FileInputStream;
+import java.io.FileOutputStream;
+import java.io.IOException;
+import java.io.InputStream;
+import java.io.InputStreamReader;
+import java.io.OutputStream;
+import java.io.PrintStream;
+import java.nio.charset.Charset;
 import java.sql.Connection;
 import java.sql.DriverManager;
 import java.sql.ResultSet;
+import java.sql.ResultSetMetaData;
 import java.sql.SQLException;
 import java.sql.Statement;
+import java.sql.Types;
+import java.util.ArrayList;
 import java.util.HashSet;
+import java.util.Set;
 
+import org.apache.commons.io.IOUtils;
+import org.apache.jackrabbit.oak.commons.json.JsopBuilder;
 import org.apache.jackrabbit.oak.plugins.document.Collection;
+import org.apache.jackrabbit.oak.plugins.document.Document;
+import org.apache.jackrabbit.oak.plugins.document.DocumentStoreException;
 import org.apache.jackrabbit.oak.plugins.document.NodeDocument;
 import org.apache.jackrabbit.oak.plugins.document.memory.MemoryDocumentStore;
+import org.apache.jackrabbit.oak.util.OakVersion;
 
+/**
+ * Utility for dumping contents from {@link RDBDocumentStore}'s tables.
+ */
 public class RDBExport {
 
-    public static void main(String[] args) throws ClassNotFoundException, SQLException {
-        String url = null, user = null, pw = null, table = null, query = null;
-        RDBDocumentSerializer ser = new RDBDocumentSerializer(new MemoryDocumentStore(), new HashSet<String>());
+    private static final Charset UTF8 = Charset.forName("UTF-8");
+
+    public static void main(String[] args) throws ClassNotFoundException, SQLException, IOException {
 
+        String url = null, user = null, pw = null, table = "nodes", query = null, dumpfile = null, lobdir = null;
+        boolean asArray = false;
+        PrintStream out = System.out;
+        Set<String> excl = new HashSet<String>();
+        excl.add(Document.ID);
+        RDBDocumentSerializer ser = new RDBDocumentSerializer(new MemoryDocumentStore(), excl);
+
+        String param = null;
         try {
-            url = args[0];
-            user = args[1];
-            pw = args[2];
-            table = args[3];
-            query = args.length >= 5 ? args[4] : null;
+            for (int i = 0; i < args.length; i++) {
+                param = args[i];
+                if ("-u".equals(param) || "--username".equals(param)) {
+                    user = args[++i];
+                } else if ("-p".equals(param) || "--password".equals(param)) {
+                    pw = args[++i];
+                } else if ("-c".equals(param) || "--collection".equals(param)) {
+                    table = args[++i];
+                } else if ("-j".equals(param) || "--jdbc-url".equals(param)) {
+                    url = args[++i];
+                } else if ("-q".equals(param) || "--query".equals(param)) {
+                    query = args[++i];
+                } else if ("-o".equals(param) || "--out".equals(param)) {
+                    OutputStream os = new FileOutputStream(args[++i]);
+                    out = new PrintStream(os, true, "UTF-8");
+                } else if ("--from-db2-dump".equals(param)) {
+                    dumpfile = args[++i];
+                } else if ("--lobdir".equals(param)) {
+                    lobdir = args[++i];
+                } else if ("--jsonArray".equals(param)) {
+                    asArray = true;
+                } else if ("--version".equals(param)) {
+                    System.out.println(RDBExport.class.getName() + " version " + OakVersion.getVersion());
+                    System.exit(0);
+                } else if ("--help".equals(param)) {
+                    printHelp();
+                    System.exit(0);
+                } else {
+                    System.err.println(RDBExport.class.getName() + ": invalid parameter " + args[i]);
+                    printUsage();
+                    System.exit(2);
+                }
+            }
         } catch (IndexOutOfBoundsException ex) {
-            System.err.println("Usage: ... " + RDBCreator.class.getName() + " JDBC-URL username password table [query]");
+            System.err.println(RDBExport.class.getName() + ": value missing for parameter " + param);
+            printUsage();
+            System.exit(2);
+        }
+
+        if (dumpfile != null && url != null) {
+            System.err.println(RDBExport.class.getName() + ": must use either dump file or JDBC URL");
+            printUsage();
             System.exit(2);
+        } else if (dumpfile != null) {
+            dumpFile(dumpfile, lobdir, asArray, out, ser);
+        } else {
+            dumpJDBC(url, user, pw, table, query, asArray, out, ser);
+        }
+
+        out.flush();
+        out.close();
+    }
+
+    private static void dumpFile(String filename, String lobdir, boolean asArray, PrintStream out, RDBDocumentSerializer ser)
+            throws IOException {
+        File f = new File(filename);
+        File lobDirectory = lobdir == null ? new File(f.getParentFile(), "lobdir") : new File(lobdir);
+        FileInputStream fis = new FileInputStream(f);
+        InputStreamReader ir = new InputStreamReader(fis, UTF8);
+        BufferedReader br = new BufferedReader(ir);
+
+        if (asArray) {
+            out.println("[");
+        }
+        boolean needComma = asArray;
+        String line = br.readLine();
+        while (line != null) {
+            ArrayList<String> fields = parseDel(line);
+            String id = fields.get(0);
+            String smodified = fields.get(1);
+            String shasbinary = fields.get(2);
+            String sdeletedonce = fields.get(3);
+            String smodcount = fields.get(4);
+            String scmodcount = fields.get(5);
+            String sdata = fields.get(7);
+            String sbdata = fields.get(8);
+
+            byte[] bytes = null;
+            if (sbdata.length() != 0) {
+                String lobfile = sbdata.replace("/", "");
+                int lastdot = lobfile.lastIndexOf('.');
+                String length = lobfile.substring(lastdot + 1);
+                lobfile = lobfile.substring(0, lastdot);
+                lastdot = lobfile.lastIndexOf('.');
+                String startpos = lobfile.substring(lastdot + 1);
+                lobfile = lobfile.substring(0, lastdot);
+                int s = Integer.valueOf(startpos);
+                int l = Integer.valueOf(length);
+                File lf = new File(lobDirectory, lobfile);
+                InputStream is = new FileInputStream(lf);
+                bytes = new byte[l];
+                IOUtils.skip(is, s);
+                IOUtils.read(is, bytes, 0, l);
+                IOUtils.closeQuietly(is);
+            }
+            try {
+                RDBRow row = new RDBRow(id, "1".equals(shasbinary), "1".equals(sdeletedonce),
+                        smodified.length() == 0 ? 0 : Long.parseLong(smodified), Long.parseLong(smodcount),
+                        Long.parseLong(scmodcount), sdata, bytes);
+                StringBuilder fulljson = dumpRow(ser, id, row);
+                if (asArray && needComma) {
+                    fulljson.append(",");
+                }
+                out.println(fulljson);
+                needComma = true;
+            } catch (DocumentStoreException ex) {
+                System.err.println("Error: skipping line for ID " + id + " because of " + ex.getMessage());
+            }
+            line = br.readLine();
+        }
+        br.close();
+        if (asArray) {
+            out.println("]");
+        }
+    }
+
+    private static ArrayList<String> parseDel(String line) {
+        ArrayList<String> result = new ArrayList<String>();
+
+        boolean inQuoted = false;
+        char quotechar = '"';
+        char fielddelim = ',';
+        StringBuilder value = new StringBuilder();
+        for (int i = 0; i < line.length(); i++) {
+            char c = line.charAt(i);
+            if (!inQuoted) {
+                if (c == fielddelim) {
+                    result.add(value.toString());
+                    value = new StringBuilder();
+                } else {
+                    if (value.length() == 0 && c == quotechar) {
+                        inQuoted = true;
+                    } else {
+                        value.append(c);
+                    }
+                }
+            } else {
+                if (c == quotechar) {
+                    if (i + 1 != line.length() && line.charAt(i + 1) == quotechar) {
+                        // quoted quote char
+                        value.append(c);
+                        i += 1;
+                    } else {
+                        inQuoted = false;
+                    }
+                } else {
+                    value.append(c);
+                }
+            }
         }
+        result.add(value.toString());
+
+        return result;
+    }
 
+    private static void dumpJDBC(String url, String user, String pw, String table, String query, boolean asArray, PrintStream out,
+            RDBDocumentSerializer ser) throws SQLException {
         String driver = RDBJDBCTools.driverForDBType(RDBJDBCTools.jdbctype(url));
         try {
             Class.forName(driver);
         } catch (ClassNotFoundException ex) {
-            System.err.println("Attempt to load class " + driver + " failed.");
+            System.err.println(RDBExport.class.getName() + ":attempt to load class " + driver + " failed:" + ex.getMessage());
         }
         Connection c = DriverManager.getConnection(url, user, pw);
         c.setReadOnly(true);
@@ -59,21 +236,89 @@ public class RDBExport {
         }
         sql += " order by id";
         ResultSet rs = stmt.executeQuery(sql);
+
+        if (asArray) {
+            out.println("[");
+        }
+        boolean needComma = asArray;
+        ResultSetMetaData rsm = null;
+        boolean idIsAscii = true;
         while (rs.next()) {
-            String id = rs.getString(1);
-            long modified = rs.getLong(2);
-            long modcount = rs.getLong(3);
-            long cmodcount = rs.getLong(4);
-            long hasBinary = rs.getLong(5);
-            long deletedOnce = rs.getLong(6);
-            String data = rs.getString(7);
-            byte[] bdata = rs.getBytes(8);
+            if (rsm == null) {
+                rsm = rs.getMetaData();
+                idIsAscii = !isBinaryType(rsm.getColumnType(1));
+            }
+            String id = idIsAscii ? rs.getString("ID") : new String(rs.getBytes("ID"), UTF8);
+            long modified = rs.getLong("MODIFIED");
+            long modcount = rs.getLong("MODCOUNT");
+            long cmodcount = rs.getLong("CMODCOUNT");
+            long hasBinary = rs.getLong("HASBINARY");
+            long deletedOnce = rs.getLong("DELETEDONCE");
+            String data = rs.getString("DATA");
+            byte[] bdata = rs.getBytes("BDATA");
+
             RDBRow row = new RDBRow(id, hasBinary == 1, deletedOnce == 1, modified, modcount, cmodcount, data, bdata);
-            NodeDocument doc = ser.fromRow(Collection.NODES, row);
-            System.out.println(ser.asString(doc));
+            StringBuilder fulljson = dumpRow(ser, id, row);
+            if (asArray && needComma && !rs.isLast()) {
+                fulljson.append(",");
+            }
+            out.println(fulljson);
+            needComma = true;
+        }
+        if (asArray) {
+            out.println("]");
         }
+        out.close();
         rs.close();
         stmt.close();
         c.close();
     }
+
+    private static StringBuilder dumpRow(RDBDocumentSerializer ser, String id, RDBRow row) {
+        NodeDocument doc = ser.fromRow(Collection.NODES, row);
+        String docjson = ser.asString(doc);
+        StringBuilder fulljson = new StringBuilder();
+        fulljson.append("{\"_id\":\"");
+        JsopBuilder.escape(id, fulljson);
+        fulljson.append("\",");
+        fulljson.append(docjson.substring(1));
+        return fulljson;
+    }
+
+    private static boolean isBinaryType(int sqlType) {
+        return sqlType == Types.VARBINARY || sqlType == Types.BINARY || sqlType == Types.LONGVARBINARY;
+    }
+
+    private static void printUsage() {
+        System.err.println("Usage: " + RDBExport.class.getName()
+                + " -j/--jdbc-url JDBC-URL [-u/--username username] [-p/--password password] [-c/--collection table] [-q/--query query] [-o/--out file] [--jsonArray]");
+        System.err.println(
+                "Usage: " + RDBExport.class.getName() + " --from-DB2-dump file [--lobdir lobdir] [-o/--out file] [--jsonArray]");
+        System.err.println("Usage: " + RDBExport.class.getName() + " --version");
+        System.err.println("Usage: " + RDBExport.class.getName() + " --help");
+    }
+
+    private static void printHelp() {
+        System.err.println("Export Apache OAK RDB data to JSON files");
+        System.err.println("");
+        System.err.println("Generic options:");
+        System.err.println("  --help                             produce this help message");
+        System.err.println("  --version                          show version information");
+        System.err.println("");
+        System.err.println("JDBC options:");
+        System.err.println("  -j/--jdbc-url JDBC-URL             JDBC URL of database to connect to");
+        System.err.println("  -u/--username username             database username");
+        System.err.println("  -p/--password password             database password");
+        System.err.println("  -c/--collection table              table name (defaults to 'nodes')");
+        System.err.println("  -q/--query query                   SQL where clause (minus 'where')");
+        System.err.println("");
+        System.err.println("Dump file options:");
+        System.err.println("  --from-DB2-dump file               name of DB2 DEL export file");
+        System.err.println("  --lobdir dir                       name of DB2 DEL export file LOB directory");
+        System.err.println("                                     (defaults to ./lobdir under the dump file)");
+        System.err.println("");
+        System.err.println("Output options:");
+        System.err.println("  -o/--out file                      Output to name file (instead of stdout)");
+        System.err.println("  --jsonArray                        Output a JSON array (instead of one JSON doc per line)");
+    }
 }