aboutsummaryrefslogtreecommitdiff
path: root/python/pyspark/sql/readwriter.py
diff options
context:
space:
mode:
Diffstat (limited to 'python/pyspark/sql/readwriter.py')
-rw-r--r--python/pyspark/sql/readwriter.py17
1 files changed, 14 insertions, 3 deletions
diff --git a/python/pyspark/sql/readwriter.py b/python/pyspark/sql/readwriter.py
index dea8bad79e..bf6ac084bb 100644
--- a/python/pyspark/sql/readwriter.py
+++ b/python/pyspark/sql/readwriter.py
@@ -24,6 +24,16 @@ from pyspark.sql.types import *
__all__ = ["DataFrameReader", "DataFrameWriter"]
+def to_str(value):
+ """
+ A wrapper over str() that converts bool values to lower-case strings ('true'/'false')
+ """
+ if isinstance(value, bool):
+ return str(value).lower()
+ else:
+ return str(value)
+
+
class DataFrameReader(object):
"""
Interface used to load a :class:`DataFrame` from external storage systems
@@ -77,7 +87,7 @@ class DataFrameReader(object):
def option(self, key, value):
"""Adds an input option for the underlying data source.
"""
- self._jreader = self._jreader.option(key, value)
+ self._jreader = self._jreader.option(key, to_str(value))
return self
@since(1.4)
@@ -85,7 +95,7 @@ class DataFrameReader(object):
"""Adds input options for the underlying data source.
"""
for k in options:
- self._jreader = self._jreader.option(k, options[k])
+ self._jreader = self._jreader.option(k, to_str(options[k]))
return self
@since(1.4)
@@ -97,7 +107,8 @@ class DataFrameReader(object):
:param schema: optional :class:`StructType` for the input schema.
:param options: all other string options
- >>> df = sqlContext.read.load('python/test_support/sql/parquet_partitioned')
+ >>> df = sqlContext.read.load('python/test_support/sql/parquet_partitioned', opt1=True,
+ ... opt2=1, opt3='str')
>>> df.dtypes
[('name', 'string'), ('year', 'int'), ('month', 'int'), ('day', 'int')]
"""