You are viewing a plain text version of this content. The canonical link for it is here.
Posted to user@spark.apache.org by Zeming Yu <ze...@gmail.com> on 2017/05/13 12:21:50 UTC

what does this error mean?

My code runs error free on my local pc. Just tried running the same code on
a ubuntu machine on ec2, and got the error below. Any idea where to start
in terms of debugging?

---------------------------------------------------------------------------Py4JError
                                Traceback (most recent call
last)<ipython-input-21-107cdbd63b26> in <module>()----> 1
output.show(2)
/home/ubuntu/spark-2.1.1-bin-hadoop2.7/python/pyspark/sql/dataframe.py
in show(self, n, truncate)    316         """    317         if
isinstance(truncate, bool) and truncate:--> 318
print(self._jdf.showString(n, 20))    319         else:    320
    print(self._jdf.showString(n, int(truncate)))
/home/ubuntu/anaconda3/lib/python3.5/site-packages/py4j/java_gateway.py
in __call__(self, *args)   1131         answer =
self.gateway_client.send_command(command)   1132         return_value
= get_return_value(-> 1133             answer, self.gateway_client,
self.target_id, self.name)   1134    1135         for temp_arg in
temp_args:
/home/ubuntu/spark-2.1.1-bin-hadoop2.7/python/pyspark/sql/utils.py in
deco(*a, **kw)     61     def deco(*a, **kw):     62         try:--->
63             return f(*a, **kw)     64         except
py4j.protocol.Py4JJavaError as e:     65             s =
e.java_exception.toString()
/home/ubuntu/anaconda3/lib/python3.5/site-packages/py4j/protocol.py in
get_return_value(answer, gateway_client, target_id, name)    325
      raise Py4JError(    326                 "An error occurred while
calling {0}{1}{2}".--> 327                 format(target_id, ".",
name))    328     else:    329         type = answer[1]
Py4JError: An error occurred while calling o648.showString

Re: what does this error mean?

Posted by Zeming Yu <ze...@gmail.com>.
Another error. Anyone have any idea?

this one happens when I tried to convert a spark dataframe to pandas:

---------------------------------------------------------------------------Py4JError
                                Traceback (most recent call
last)/home/ubuntu/spark-2.1.1-bin-hadoop2.7/python/pyspark/sql/dataframe.py
in collect(self)    390         with SCCallSiteSync(self._sc) as
css:--> 391             port = self._jdf.collectToPython()    392
   return list(_load_from_socket(port,
BatchedSerializer(PickleSerializer())))
/home/ubuntu/anaconda3/lib/python3.5/site-packages/py4j/java_gateway.py
in __call__(self, *args)   1132         return_value =
get_return_value(-> 1133             answer, self.gateway_client,
self.target_id, self.name)   1134
/home/ubuntu/spark-2.1.1-bin-hadoop2.7/python/pyspark/sql/utils.py in
deco(*a, **kw)     62         try:---> 63             return f(*a,
**kw)     64         except py4j.protocol.Py4JJavaError as e:
/home/ubuntu/anaconda3/lib/python3.5/site-packages/py4j/protocol.py in
get_return_value(answer, gateway_client, target_id, name)    326
          "An error occurred while calling {0}{1}{2}".--> 327
       format(target_id, ".", name))    328     else:
Py4JError: An error occurred while calling o69.collectToPython

During handling of the above exception, another exception occurred:
IndexError                                Traceback (most recent call
last)/home/ubuntu/anaconda3/lib/python3.5/site-packages/py4j/java_gateway.py
in _get_connection(self)    826         try:--> 827
connection = self.deque.pop()    828         except IndexError:
IndexError: pop from an empty deque

During handling of the above exception, another exception occurred:
ConnectionRefusedError                    Traceback (most recent call
last)/home/ubuntu/anaconda3/lib/python3.5/site-packages/py4j/java_gateway.py
in start(self)    962         try:--> 963
self.socket.connect((self.address, self.port))    964
self.is_connected = True
ConnectionRefusedError: [Errno 111] Connection refused

During handling of the above exception, another exception occurred:
Py4JNetworkError                          Traceback (most recent call
last)<ipython-input-6-f8a4afbd6e4f> in <module>()      7
           'lead_time', 'dep_weekday', 'dep_weeknum',      8
               'days_to_last_holiday', 'days_to_next_holiday',----> 9
                        'duration_minutes', 'stop_minutes').toPandas()
    10 flight_pd.head()
/home/ubuntu/spark-2.1.1-bin-hadoop2.7/python/pyspark/sql/dataframe.py
in toPandas(self)   1583         """   1584         import pandas as
pd-> 1585         return pd.DataFrame.from_records(self.collect(),
columns=self.columns)   1586    1587
##########################################################################################
/home/ubuntu/spark-2.1.1-bin-hadoop2.7/python/pyspark/sql/dataframe.py
in collect(self)    389         """    390         with
SCCallSiteSync(self._sc) as css:--> 391             port =
self._jdf.collectToPython()    392         return
list(_load_from_socket(port, BatchedSerializer(PickleSerializer())))
 393
/home/ubuntu/spark-2.1.1-bin-hadoop2.7/python/pyspark/traceback_utils.py
in __exit__(self, type, value, tb)     76
SCCallSiteSync._spark_stack_depth -= 1     77         if
SCCallSiteSync._spark_stack_depth == 0:---> 78
self._context._jsc.setCallSite(None)
/home/ubuntu/anaconda3/lib/python3.5/site-packages/py4j/java_gateway.py
in __call__(self, *args)   1129             proto.END_COMMAND_PART
1130 -> 1131         answer =
self.gateway_client.send_command(command)   1132         return_value
= get_return_value(   1133             answer, self.gateway_client,
self.target_id, self.name)
/home/ubuntu/anaconda3/lib/python3.5/site-packages/py4j/java_gateway.py
in send_command(self, command, retry, binary)    879          if
`binary` is `True`.    880         """--> 881         connection =
self._get_connection()    882         try:    883             response
= connection.send_command(command)
/home/ubuntu/anaconda3/lib/python3.5/site-packages/py4j/java_gateway.py
in _get_connection(self)    827             connection =
self.deque.pop()    828         except IndexError:--> 829
connection = self._create_connection()    830         return
connection    831
/home/ubuntu/anaconda3/lib/python3.5/site-packages/py4j/java_gateway.py
in _create_connection(self)    833         connection =
GatewayConnection(    834             self.gateway_parameters,
self.gateway_property)--> 835         connection.start()    836
 return connection    837
/home/ubuntu/anaconda3/lib/python3.5/site-packages/py4j/java_gateway.py
in start(self)    968                 "server
({0}:{1})".format(self.address, self.port)    969
logger.exception(msg)--> 970             raise Py4JNetworkError(msg,
e)    971     972     def close(self, reset=False):
Py4JNetworkError: An error occurred while trying to connect to the
Java server (127.0.0.1:34166)


On Sat, May 13, 2017 at 10:21 PM, Zeming Yu <ze...@gmail.com> wrote:

> My code runs error free on my local pc. Just tried running the same code
> on a ubuntu machine on ec2, and got the error below. Any idea where to
> start in terms of debugging?
>
> ---------------------------------------------------------------------------Py4JError                                 Traceback (most recent call last)<ipython-input-21-107cdbd63b26> in <module>()----> 1 output.show(2)
> /home/ubuntu/spark-2.1.1-bin-hadoop2.7/python/pyspark/sql/dataframe.py in show(self, n, truncate)    316         """    317         if isinstance(truncate, bool) and truncate:--> 318             print(self._jdf.showString(n, 20))    319         else:    320             print(self._jdf.showString(n, int(truncate)))
> /home/ubuntu/anaconda3/lib/python3.5/site-packages/py4j/java_gateway.py in __call__(self, *args)   1131         answer = self.gateway_client.send_command(command)   1132         return_value = get_return_value(-> 1133             answer, self.gateway_client, self.target_id, self.name)   1134    1135         for temp_arg in temp_args:
> /home/ubuntu/spark-2.1.1-bin-hadoop2.7/python/pyspark/sql/utils.py in deco(*a, **kw)     61     def deco(*a, **kw):     62         try:---> 63             return f(*a, **kw)     64         except py4j.protocol.Py4JJavaError as e:     65             s = e.java_exception.toString()
> /home/ubuntu/anaconda3/lib/python3.5/site-packages/py4j/protocol.py in get_return_value(answer, gateway_client, target_id, name)    325             raise Py4JError(    326                 "An error occurred while calling {0}{1}{2}".--> 327                 format(target_id, ".", name))    328     else:    329         type = answer[1]
> Py4JError: An error occurred while calling o648.showString
>
>