You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@beam.apache.org by ec...@apache.org on 2019/01/14 13:24:11 UTC
[beam] 02/11: Add SerializationDebugger
This is an automated email from the ASF dual-hosted git repository.
echauchot pushed a commit to branch spark-runner_structured-streaming
in repository https://gitbox.apache.org/repos/asf/beam.git
commit 5c9fcd34b7b092c1d2c0935aee06ae1fd412ed30
Author: Etienne Chauchot <ec...@apache.org>
AuthorDate: Fri Jan 11 10:07:23 2019 +0100
Add SerializationDebugger
---
.../utils/SerializationDebugger.java | 130 +++++++++++++++++++++
.../structuredstreaming/utils/package-info.java | 20 ++++
2 files changed, 150 insertions(+)
diff --git a/runners/spark-structured-streaming/src/test/java/org/apache/beam/runners/spark/structuredstreaming/utils/SerializationDebugger.java b/runners/spark-structured-streaming/src/test/java/org/apache/beam/runners/spark/structuredstreaming/utils/SerializationDebugger.java
new file mode 100644
index 0000000..0e47969
--- /dev/null
+++ b/runners/spark-structured-streaming/src/test/java/org/apache/beam/runners/spark/structuredstreaming/utils/SerializationDebugger.java
@@ -0,0 +1,130 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/** Testing utils for spark structured streaming runner. */
+package org.apache.beam.runners.spark.structuredstreaming.utils;
+
+import java.io.IOException;
+import java.io.ObjectOutputStream;
+import java.io.OutputStream;
+import java.lang.reflect.Field;
+import java.util.ArrayList;
+import java.util.List;
+
+/**
+ * Test helper that pinpoints which object in a graph breaks Java serialization.
+ *
+ * <p>The graph is written to a throw-away {@link ObjectOutputStream} that records the chain of
+ * objects currently being serialized. When serialization fails, that chain is reported so the
+ * offending object can be located without bisecting the graph by hand.
+ */
+public class SerializationDebugger {
+
+  /**
+   * Serializes {@code object} with Java serialization, discarding the produced bytes.
+   *
+   * @param object root of the object graph to check
+   * @throws IOException if the debugging stream cannot be created
+   * @throws RuntimeException if serialization fails; the message lists the path from the root
+   *     to the object being written when the failure occurred, and the cause is the original
+   *     exception
+   */
+  public static void testSerialization(Object object) throws IOException {
+    // The stream has to wrap a real OutputStream. The protected no-arg ObjectOutputStream
+    // constructor switches writeObject() over to the empty writeObjectOverride() hook, so
+    // nothing would be serialized and no failure could ever be reported.
+    DebuggingObjectOutputStream out =
+        new DebuggingObjectOutputStream(new DiscardingOutputStream());
+    try {
+      out.writeObject(object);
+    } catch (Exception e) {
+      throw new RuntimeException(
+          "Serialization error. Path to bad object: " + out.getStack(), e);
+    }
+  }
+
+  /** Sink that drops every byte; only the act of serializing matters here. */
+  private static final class DiscardingOutputStream extends OutputStream {
+
+    @Override
+    public void write(int b) {
+      // Intentionally empty.
+    }
+
+    @Override
+    public void write(byte[] b, int off, int len) {
+      // Intentionally empty.
+    }
+  }
+
+  /**
+   * {@link ObjectOutputStream} that tracks the path from the root object to the object currently
+   * being written.
+   */
+  private static class DebuggingObjectOutputStream extends ObjectOutputStream {
+
+    /** The private {@code depth} counter of {@link ObjectOutputStream}, read reflectively. */
+    private static final Field DEPTH_FIELD;
+
+    static {
+      try {
+        DEPTH_FIELD = ObjectOutputStream.class.getDeclaredField("depth");
+        DEPTH_FIELD.setAccessible(true);
+      } catch (NoSuchFieldException e) {
+        throw new AssertionError(e);
+      } catch (RuntimeException e) {
+        // JDKs that strongly encapsulate their internals refuse setAccessible() here.
+        throw new AssertionError(
+            "Cannot access ObjectOutputStream.depth reflectively; the JVM may need"
+                + " --add-opens java.base/java.io=ALL-UNNAMED",
+            e);
+      }
+    }
+
+    /** Objects on the path from the root (index 0) to the object currently being written. */
+    private final List<Object> stack = new ArrayList<Object>();
+
+    /**
+     * Indicates whether or not OOS has tried to write an IOException (presumably as the result
+     * of a serialization error) to the stream.
+     */
+    private boolean broken = false;
+
+    /**
+     * Creates the stream and enables the {@code replaceObject()} hook.
+     *
+     * @param out destination of the serialized bytes
+     * @throws IOException if the stream header cannot be written
+     */
+    public DebuggingObjectOutputStream(OutputStream out) throws IOException {
+      super(out);
+      enableReplaceObject(true);
+    }
+
+    /**
+     * Abuse {@code replaceObject()} as a hook to maintain our stack. The object itself is never
+     * replaced.
+     */
+    @Override
+    protected Object replaceObject(Object o) {
+      // ObjectOutputStream writes serialization exceptions to the stream. Ignore everything
+      // after that so we don't lose the path to a non-serializable object. So long as the user
+      // doesn't write an IOException as the root object, we're OK.
+      int currentDepth = currentDepth();
+      if (o instanceof IOException && currentDepth == 0) {
+        broken = true;
+      }
+      if (!broken) {
+        truncate(currentDepth);
+        stack.add(o);
+      }
+      return o;
+    }
+
+    /** Drops every stack entry at index {@code depth} or deeper. */
+    private void truncate(int depth) {
+      int keep = Math.max(depth, 0);
+      if (stack.size() > keep) {
+        stack.subList(keep, stack.size()).clear();
+      }
+    }
+
+    /** Returns a 0-based depth within the object graph of the current object being serialized. */
+    private int currentDepth() {
+      try {
+        // The JDK counter is 1-based while an object is being written.
+        return DEPTH_FIELD.getInt(this) - 1;
+      } catch (IllegalAccessException e) {
+        throw new AssertionError(e);
+      }
+    }
+
+    /**
+     * Returns the path to the last object serialized. If an exception occurred, this should be
+     * the path to the non-serializable object.
+     */
+    public List<Object> getStack() {
+      return stack;
+    }
+  }
+}
\ No newline at end of file
diff --git a/runners/spark-structured-streaming/src/test/java/org/apache/beam/runners/spark/structuredstreaming/utils/package-info.java b/runners/spark-structured-streaming/src/test/java/org/apache/beam/runners/spark/structuredstreaming/utils/package-info.java
new file mode 100644
index 0000000..3d7da11
--- /dev/null
+++ b/runners/spark-structured-streaming/src/test/java/org/apache/beam/runners/spark/structuredstreaming/utils/package-info.java
@@ -0,0 +1,20 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements. See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership. The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/** Testing utils for spark structured streaming runner. */
+package org.apache.beam.runners.spark.structuredstreaming.utils;