public class MvelContextUDFs
extends java.lang.Object
| Modifier and Type | Method and Description |
|---|---|
static boolean |
and(boolean left,
boolean right) |
static java.lang.Double |
cast_double(java.lang.Object input)
Cast the input to double.
|
static java.lang.Float |
cast_float(java.lang.Object input)
Cast the input to float.
|
static java.lang.Integer |
cast_int(java.lang.Object input)
Cast the input to Integer.
|
static java.lang.String |
concat(java.lang.String left,
java.lang.String right)
Concatenate two strings into one.
|
static java.lang.Float |
cosineSimilarity(java.lang.Object obj1,
java.lang.Object obj2) |
static int |
dayofmonth(java.lang.Object input) |
static int |
dayofweek(java.lang.Object input) |
static java.util.Collection<java.lang.Object> |
distinct(java.util.Collection<java.lang.Object> collection) |
static java.lang.Double |
dotProduct(java.lang.Object obj1,
java.lang.Object obj2)
Returns a standard dotProduct of two vector objects.
|
static java.util.Map<java.lang.String,java.lang.Float> |
extract_term_value_from_array(java.util.ArrayList<org.apache.spark.sql.catalyst.expressions.GenericRowWithSchema> array,
java.lang.String termFieldName,
java.lang.String valueFieldName) |
static java.util.Map<java.lang.String,java.lang.Float> |
extract_term_value_from_array(java.util.ArrayList<org.apache.spark.sql.catalyst.expressions.GenericRowWithSchema> array,
java.lang.String termFieldName,
java.lang.String valueFieldName,
java.lang.String filterExpr) |
static java.util.Collection<java.lang.Object> |
flatten(java.util.Collection<? extends java.util.Collection<java.lang.Object>> collection) |
static java.lang.String |
get_data_type(java.lang.Object input)
Get the class type of the input object
WARNING: This is intended only for debugging by users.
|
static java.util.Collection<java.lang.String> |
getTerms(java.lang.Object item) |
static java.util.List<java.lang.String> |
getTopKTerms(java.lang.Object item,
int k)
return an ordered list of terms, based on descending order of corresponding values
|
static java.lang.String |
getTopTerm(java.lang.Object item)
get the term with the highest value (duplicates will be resolved randomly)
|
static int |
hourofday(java.lang.Object input) |
static boolean |
if_else(boolean input,
boolean first,
boolean second) |
static java.lang.Double |
if_else(boolean input,
java.lang.Double first,
java.lang.Double second) |
static java.lang.Float |
if_else(boolean input,
java.lang.Float first,
java.lang.Float second) |
static java.lang.Integer |
if_else(boolean input,
java.lang.Integer first,
java.lang.Integer second) |
static java.lang.String |
if_else(boolean input,
java.lang.String first,
java.lang.String second)
Ternary operator.
|
static boolean |
isNonZero(java.lang.Object vector)
Return true if a feature has at least 1 term with value not zero.
|
static boolean |
isnotnull(java.lang.Object input) |
static boolean |
isnull(java.lang.Object input) |
static boolean |
isPresent(java.lang.Object featureValue)
return true if a feature variable is not null.
|
static boolean |
not(boolean input) |
static boolean |
or(boolean left,
boolean right) |
static void |
registerUDFs(org.mvel2.ParserConfiguration parserConfig) |
static long |
time_duration(java.lang.Object startTime,
java.lang.Object endTime,
java.lang.String outputGranularity) |
static java.lang.Boolean |
toBoolean(java.lang.Object item)
Converts an object to a boolean
|
static java.lang.Object |
toCategorical(java.lang.Object item)
Convert input to categorical feature
Example inputs that can be converted
- Map("a" -> 2.0) returns Map("a" -> 2.0)
- Map("" -> 2.5) returns ("2.5", 1.0)
|
static java.lang.String |
toLowerCase(java.lang.String input)
convert input to lower case string
|
static java.lang.Object |
toNumeric(java.lang.Object item)
Convert input to numeric value
Example inputs that can be converted
- Map("" -> 2.0) returns 2.0
- Map("876" -> 1.0) returns 876
|
static java.lang.String |
toUpperCase(java.lang.String input)
convert input to upper case string
|
public static void registerUDFs(org.mvel2.ParserConfiguration parserConfig)
public static java.lang.String get_data_type(java.lang.Object input)
public static java.lang.Double cast_double(java.lang.Object input)
public static java.lang.Float cast_float(java.lang.Object input)
public static java.lang.Integer cast_int(java.lang.Object input)
public static boolean and(boolean left,
boolean right)
public static boolean or(boolean left,
boolean right)
public static boolean not(boolean input)
public static boolean isnull(java.lang.Object input)
public static boolean isnotnull(java.lang.Object input)
public static java.lang.String concat(java.lang.String left,
java.lang.String right)
public static java.lang.String if_else(boolean input,
java.lang.String first,
java.lang.String second)
public static java.lang.Double if_else(boolean input,
java.lang.Double first,
java.lang.Double second)
public static java.lang.Float if_else(boolean input,
java.lang.Float first,
java.lang.Float second)
public static java.lang.Integer if_else(boolean input,
java.lang.Integer first,
java.lang.Integer second)
public static boolean if_else(boolean input,
boolean first,
boolean second)
public static boolean isNonZero(java.lang.Object vector)
public static boolean isPresent(java.lang.Object featureValue)
public static java.lang.Boolean toBoolean(java.lang.Object item)
public static java.lang.Object toNumeric(java.lang.Object item)
public static java.lang.Object toCategorical(java.lang.Object item)
public static java.util.Collection<java.lang.String> getTerms(java.lang.Object item)
public static java.util.List<java.lang.String> getTopKTerms(java.lang.Object item,
int k)
item - Object that can be converted to Map of string to float
k - integer, if k<0, do reverse order selection, e.g. -1: select bottom first
public static java.lang.String getTopTerm(java.lang.Object item)
item - Object that can be converted to Map of string to float
public static java.util.Collection<java.lang.Object> distinct(java.util.Collection<java.lang.Object> collection)
public static java.util.Collection<java.lang.Object> flatten(java.util.Collection<? extends java.util.Collection<java.lang.Object>> collection)
public static java.lang.Float cosineSimilarity(java.lang.Object obj1,
java.lang.Object obj2)
public static java.lang.Double dotProduct(java.lang.Object obj1,
java.lang.Object obj2)
See also: cosineSimilarity(Object, Object) for normalized dot-product.
public static java.lang.String toLowerCase(java.lang.String input)
input - input string
public static java.lang.String toUpperCase(java.lang.String input)
input - input string
public static long time_duration(java.lang.Object startTime,
java.lang.Object endTime,
java.lang.String outputGranularity)
public static int dayofweek(java.lang.Object input)
public static int dayofmonth(java.lang.Object input)
public static int hourofday(java.lang.Object input)
public static java.util.Map<java.lang.String,java.lang.Float> extract_term_value_from_array(java.util.ArrayList<org.apache.spark.sql.catalyst.expressions.GenericRowWithSchema> array,
java.lang.String termFieldName,
java.lang.String valueFieldName)
public static java.util.Map<java.lang.String,java.lang.Float> extract_term_value_from_array(java.util.ArrayList<org.apache.spark.sql.catalyst.expressions.GenericRowWithSchema> array,
java.lang.String termFieldName,
java.lang.String valueFieldName,
java.lang.String filterExpr)