aboutsummaryrefslogtreecommitdiff
path: root/python/pyspark/sql/functions.py
diff options
context:
space:
mode:
author: Davies Liu <davies@databricks.com> 2015-11-03 13:33:46 -0800
committer: Reynold Xin <rxin@databricks.com> 2015-11-03 13:33:46 -0800
commit: 1d04dc95c0d3caa485936e65b0493bcc9719f27e (patch)
tree: ace98f4fe1c54db7c61d867aade0e4210514f553 /python/pyspark/sql/functions.py
parent: a9676cc7107c5df6c62a58668c4d95ced1238370 (diff)
downloadspark-1d04dc95c0d3caa485936e65b0493bcc9719f27e.tar.gz
spark-1d04dc95c0d3caa485936e65b0493bcc9719f27e.tar.bz2
spark-1d04dc95c0d3caa485936e65b0493bcc9719f27e.zip
[SPARK-11467][SQL] add Python API for stddev/variance
Add Python API for stddev/stddev_pop/stddev_samp/variance/var_pop/var_samp/skewness/kurtosis.
Author: Davies Liu <davies@databricks.com>
Closes #9424 from davies/py_var.
Diffstat (limited to 'python/pyspark/sql/functions.py')
-rw-r--r-- python/pyspark/sql/functions.py 17
1 files changed, 17 insertions, 0 deletions
diff --git a/python/pyspark/sql/functions.py b/python/pyspark/sql/functions.py
index fa04f4cd83..2f7c2f4aac 100644
--- a/python/pyspark/sql/functions.py
+++ b/python/pyspark/sql/functions.py
@@ -122,6 +122,21 @@ _functions_1_4 = {
'bitwiseNOT': 'Computes bitwise not.',
}
+_functions_1_6 = {
+ # aggregate functions
+ "stddev": "Aggregate function: returns the unbiased sample standard deviation of" +
+ " the expression in a group.",
+ "stddev_samp": "Aggregate function: returns the unbiased sample standard deviation of" +
+ " the expression in a group.",
+ "stddev_pop": "Aggregate function: returns population standard deviation of" +
+ " the expression in a group.",
+ "variance": "Aggregate function: returns the population variance of the values in a group.",
+ "var_samp": "Aggregate function: returns the unbiased variance of the values in a group.",
+ "var_pop": "Aggregate function: returns the population variance of the values in a group.",
+ "skewness": "Aggregate function: returns the skewness of the values in a group.",
+ "kurtosis": "Aggregate function: returns the kurtosis of the values in a group."
+}
+
# math functions that take two arguments as input
_binary_mathfunctions = {
'atan2': 'Returns the angle theta from the conversion of rectangular coordinates (x, y) to' +
@@ -172,6 +187,8 @@ for _name, _doc in _binary_mathfunctions.items():
globals()[_name] = since(1.4)(_create_binary_mathfunction(_name, _doc))
for _name, _doc in _window_functions.items():
globals()[_name] = since(1.4)(_create_window_function(_name, _doc))
+for _name, _doc in _functions_1_6.items():
+ globals()[_name] = since(1.6)(_create_function(_name, _doc))
del _name, _doc