You are viewing a plain text version of this content. The canonical link for it is here.
Posted to reviews@spark.apache.org by GitBox <gi...@apache.org> on 2019/04/04 11:55:19 UTC

[GitHub] [spark] kiszk commented on issue #24295: [SPARK-26811][SQL][followup] some more document fixes

kiszk commented on issue #24295: [SPARK-26811][SQL][followup] some more document fixes
URL: https://github.com/apache/spark/pull/24295#issuecomment-479866845
 
 
   I think that the following test errors are not related to this PR; all three fail with `UnknownTimeZoneError: 'US/Pacific-New'`.
   
   ```
   ======================================================================
   ERROR: test_create_dataframe_from_pandas_with_timestamp (pyspark.sql.tests.test_dataframe.DataFrameTests)
   ----------------------------------------------------------------------
   Traceback (most recent call last):
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/tests/test_dataframe.py", line 562, in test_create_dataframe_from_pandas_with_timestamp
       df = self.spark.createDataFrame(pdf)
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/session.py", line 763, in createDataFrame
       data = self._convert_from_pandas(data, schema, timezone)
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/session.py", line 506, in _convert_from_pandas
       s = _check_series_convert_timestamps_tz_local(series, timezone)
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/types.py", line 1902, in _check_series_convert_timestamps_tz_local
       return _check_series_convert_timestamps_localize(s, timezone, None)
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/types.py", line 1877, in _check_series_convert_timestamps_localize
       lambda ts: ts.tz_localize(from_tz, ambiguous=False).tz_convert(to_tz).tz_localize(None)
     File "/home/anaconda/lib/python2.7/site-packages/pandas/core/series.py", line 2294, in apply
       mapped = lib.map_infer(values, f, convert=convert_dtype)
     File "pandas/src/inference.pyx", line 1207, in pandas.lib.map_infer (pandas/lib.c:66124)
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/types.py", line 1878, in <lambda>
       if ts is not pd.NaT else pd.NaT)
     File "pandas/tslib.pyx", line 609, in pandas.tslib.Timestamp.tz_localize (pandas/tslib.c:13468)
     File "pandas/tslib.pyx", line 1768, in pandas.tslib.maybe_get_tz (pandas/tslib.c:32362)
     File "/home/anaconda/lib/python2.7/site-packages/pytz/__init__.py", line 178, in timezone
       raise UnknownTimeZoneError(zone)
   UnknownTimeZoneError: 'US/Pacific-New'
   
   ======================================================================
   ERROR: test_create_dateframe_from_pandas_with_dst (pyspark.sql.tests.test_dataframe.DataFrameTests)
   ----------------------------------------------------------------------
   Traceback (most recent call last):
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/tests/test_dataframe.py", line 590, in test_create_dateframe_from_pandas_with_dst
       df = self.spark.createDataFrame(pdf)
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/session.py", line 763, in createDataFrame
       data = self._convert_from_pandas(data, schema, timezone)
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/session.py", line 506, in _convert_from_pandas
       s = _check_series_convert_timestamps_tz_local(series, timezone)
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/types.py", line 1902, in _check_series_convert_timestamps_tz_local
       return _check_series_convert_timestamps_localize(s, timezone, None)
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/types.py", line 1877, in _check_series_convert_timestamps_localize
       lambda ts: ts.tz_localize(from_tz, ambiguous=False).tz_convert(to_tz).tz_localize(None)
     File "/home/anaconda/lib/python2.7/site-packages/pandas/core/series.py", line 2294, in apply
       mapped = lib.map_infer(values, f, convert=convert_dtype)
     File "pandas/src/inference.pyx", line 1207, in pandas.lib.map_infer (pandas/lib.c:66124)
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/types.py", line 1878, in <lambda>
       if ts is not pd.NaT else pd.NaT)
     File "pandas/tslib.pyx", line 609, in pandas.tslib.Timestamp.tz_localize (pandas/tslib.c:13468)
     File "pandas/tslib.pyx", line 1768, in pandas.tslib.maybe_get_tz (pandas/tslib.c:32362)
     File "/home/anaconda/lib/python2.7/site-packages/pytz/__init__.py", line 178, in timezone
       raise UnknownTimeZoneError(zone)
   UnknownTimeZoneError: 'US/Pacific-New'
   
   ======================================================================
   ERROR: test_to_pandas (pyspark.sql.tests.test_dataframe.DataFrameTests)
   ----------------------------------------------------------------------
   Traceback (most recent call last):
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/tests/test_dataframe.py", line 522, in test_to_pandas
       pdf = self._to_pandas()
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/tests/test_dataframe.py", line 517, in _to_pandas
       return df.toPandas()
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/dataframe.py", line 2189, in toPandas
       _check_series_convert_timestamps_local_tz(pdf[field.name], timezone)
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/types.py", line 1891, in _check_series_convert_timestamps_local_tz
       return _check_series_convert_timestamps_localize(s, None, timezone)
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/types.py", line 1877, in _check_series_convert_timestamps_localize
       lambda ts: ts.tz_localize(from_tz, ambiguous=False).tz_convert(to_tz).tz_localize(None)
     File "/home/anaconda/lib/python2.7/site-packages/pandas/core/series.py", line 2294, in apply
       mapped = lib.map_infer(values, f, convert=convert_dtype)
     File "pandas/src/inference.pyx", line 1207, in pandas.lib.map_infer (pandas/lib.c:66124)
     File "/home/jenkins/workspace/SparkPullRequestBuilder/python/pyspark/sql/types.py", line 1878, in <lambda>
       if ts is not pd.NaT else pd.NaT)
     File "pandas/tslib.pyx", line 649, in pandas.tslib.Timestamp.tz_convert (pandas/tslib.c:13923)
     File "pandas/tslib.pyx", line 407, in pandas.tslib.Timestamp.__new__ (pandas/tslib.c:10447)
     File "pandas/tslib.pyx", line 1467, in pandas.tslib.convert_to_tsobject (pandas/tslib.c:27504)
     File "pandas/tslib.pyx", line 1768, in pandas.tslib.maybe_get_tz (pandas/tslib.c:32362)
     File "/home/anaconda/lib/python2.7/site-packages/pytz/__init__.py", line 178, in timezone
       raise UnknownTimeZoneError(zone)
   UnknownTimeZoneError: 'US/Pacific-New'
   ```

----------------------------------------------------------------
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
 
For queries about this service, please contact Infrastructure at:
users@infra.apache.org


With regards,
Apache Git Services

---------------------------------------------------------------------
To unsubscribe, e-mail: reviews-unsubscribe@spark.apache.org
For additional commands, e-mail: reviews-help@spark.apache.org