timothyrenner · January 30, 2019 15:57
diff --git a/pyspark_udf_definition.py b/pyspark_udf_definition.py
 import numpy as np

 def predict(*features):
     """Score one observation using the model found in the enclosing scope.

     Parameters
     ----------
     *features : float
         The feature values for a single observation, passed as separate
         positional arguments in the order the model expects.

     Returns
     -------
     float
         The model's prediction for the observation, unwrapped from its
         numpy scalar type into a native Python value.
     """
     # Wrapping the argument tuple in a list yields a single-row (1xN) batch.
     single_row = np.array([features])

     # ``model`` is not defined here: it is expected to already be in scope,
     # and Spark serializes and ships it along with this function.
     predictions = model.predict(single_row)

     # Only one row went in, so take the first prediction; ``.item()``
     # converts numpy's scalar type to the native Python equivalent.
     return predictions[0].item()
	import numpy as np

	def predict(*features):
		"""Perform a prediction on the features.

		Parameters
		----------
		*features : float
			The feature values the model needs to make a prediction,
			passed as individual positional arguments.

		Returns
		-------
		float
			The predicted score.
		"""
		# Turn the features into a 1xN numpy array.
		np_features = np.array([features])

		# Assume the model is in scope. Spark will serialize and distribute.
		# Note the conversion from numpy's float type to a native
		# Python float via ``.item()``.
		return model.predict(np_features)[0].item()