sparktk.frame.ops.covariance module
# vim: set encoding=utf-8
# Copyright (c) 2016 Intel Corporation
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
def covariance(self, column_a, column_b):
"""
Calculate covariance for exactly two columns.
Parameters
----------
:param column_a: (str) The name of the column from which to compute the covariance.
:param column_b: (str) The name of the column from which to compute the covariance.
:return: (float) Covariance of the two columns.
Notes
-----
This method applies only to columns containing numerical data.
Examples
--------
Consider Frame *my_frame*, which contains the data
>>> my_frame.inspect()
[#] idnum x1 x2 x3 x4
===============================
[0] 0 1.0 4.0 0.0 -1.0
[1] 1 2.0 3.0 0.0 -1.0
[2] 2 3.0 2.0 1.0 -1.0
[3] 3 4.0 1.0 2.0 -1.0
[4] 4 5.0 0.0 2.0 -1.0
my_frame.covariance computes the covariance on the pair of columns provided.
>>> my_frame.covariance("x1", "x2")
-2.5
>>> my_frame.covariance("x1", "x4")
0.0
>>> my_frame.covariance("x2", "x3")
-1.5
"""
return self._scala.covariance(column_a, column_b)
Functions
def covariance(
self, column_a, column_b)
Calculate covariance for exactly two columns.
Parameters:
column_a | (str): | The name of the column from which to compute the covariance. |
column_b | (str): | The name of the column from which to compute the covariance. |
Returns | (float): | Covariance of the two columns. |
Notes:
This method applies only to columns containing numerical data.
Examples:
Consider Frame my_frame, which contains the data
>>> my_frame.inspect()
[#] idnum x1 x2 x3 x4
===============================
[0] 0 1.0 4.0 0.0 -1.0
[1] 1 2.0 3.0 0.0 -1.0
[2] 2 3.0 2.0 1.0 -1.0
[3] 3 4.0 1.0 2.0 -1.0
[4] 4 5.0 0.0 2.0 -1.0
my_frame.covariance computes the covariance on the pair of columns provided.
>>> my_frame.covariance("x1", "x2")
-2.5
>>> my_frame.covariance("x1", "x4")
0.0
>>> my_frame.covariance("x2", "x3")
-1.5
def covariance(self, column_a, column_b):
"""
Calculate covariance for exactly two columns.
Parameters
----------
:param column_a: (str) The name of the column from which to compute the covariance.
:param column_b: (str) The name of the column from which to compute the covariance.
:return: (float) Covariance of the two columns.
Notes
-----
This method applies only to columns containing numerical data.
Examples
--------
Consider Frame *my_frame*, which contains the data
>>> my_frame.inspect()
[#] idnum x1 x2 x3 x4
===============================
[0] 0 1.0 4.0 0.0 -1.0
[1] 1 2.0 3.0 0.0 -1.0
[2] 2 3.0 2.0 1.0 -1.0
[3] 3 4.0 1.0 2.0 -1.0
[4] 4 5.0 0.0 2.0 -1.0
my_frame.covariance computes the covariance on the pair of columns provided.
>>> my_frame.covariance("x1", "x2")
-2.5
>>> my_frame.covariance("x1", "x4")
0.0
>>> my_frame.covariance("x2", "x3")
-1.5
"""
return self._scala.covariance(column_a, column_b)