From cfca01136bd7443c1d9daf8e8e256635eec20ddc Mon Sep 17 00:00:00 2001
From: Peng <peng.meng@intel.com>
Date: Mon, 22 May 2017 22:42:37 +0800
Subject: [PATCH] [SPARK-20764][ML][PYSPARK] Fix visibility discrepancy with numInstances and degreesOfFreedom in LR and GLR - Python version

## What changes were proposed in this pull request?

SPARK-20097 exposed degreesOfFreedom in LinearRegressionSummary and numInstances in GeneralizedLinearRegressionSummary. The Python API should be updated to reflect these changes.

## How was this patch tested?

Existing unit tests.

Author: Peng <peng.meng@intel.com>

Closes #18062 from mpjlu/spark-20764.
---
 python/pyspark/ml/regression.py | 16 ++++++++++++++++
 1 file changed, 16 insertions(+)

diff --git a/python/pyspark/ml/regression.py b/python/pyspark/ml/regression.py
index 3c3fcc8d9b..2d17f95b0c 100644
--- a/python/pyspark/ml/regression.py
+++ b/python/pyspark/ml/regression.py
@@ -323,6 +323,14 @@ class LinearRegressionSummary(JavaWrapper):
         """
         return self._call_java("numInstances")
 
+    @property
+    @since("2.2.0")
+    def degreesOfFreedom(self):
+        """
+        Degrees of freedom.
+        """
+        return self._call_java("degreesOfFreedom")
+
     @property
     @since("2.0.0")
     def devianceResiduals(self):
@@ -1565,6 +1573,14 @@ class GeneralizedLinearRegressionSummary(JavaWrapper):
         """
         return self._call_java("predictionCol")
 
+    @property
+    @since("2.2.0")
+    def numInstances(self):
+        """
+        Number of instances in DataFrame predictions.
+        """
+        return self._call_java("numInstances")
+
     @property
     @since("2.0.0")
     def rank(self):
-- 
GitLab