org.apache.spark.ml.recommendation
Computes the feature probabilities of sparse feature vector columns, using mapPartitions for efficiency and treeReduce to avoid OOM errors on the driver.
The dataframe to aggregate; it must have sparse vector columns starting at column 0
The number of sparse vector columns
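As an illustration of the mapPartitions/treeReduce pattern described above, here is a minimal pure-Python sketch (the library itself is Scala/Spark). It assumes that the "feature probability" of a feature is the fraction of instances in which it is active; the function names and shapes are illustrative, not the actual implementation.

```python
from functools import reduce

def partition_counts(partition, num_features):
    # Per-partition aggregation (the mapPartitions step): count per feature
    # in how many instances it is active, plus the number of instances.
    counts = [0] * num_features
    total = 0
    for active_indices in partition:  # indices of a sparse feature vector
        for i in active_indices:
            counts[i] += 1
        total += 1
    return counts, total

def merge(a, b):
    # Combine two partial aggregates (the treeReduce step); pairwise merging
    # keeps every intermediate result small instead of collecting all
    # partial aggregates on the driver at once.
    (ca, na), (cb, nb) = a, b
    return [x + y for x, y in zip(ca, cb)], na + nb

# Two "partitions" of instances with 4 features in total.
partitions = [[[0, 2], [1, 2]], [[2, 3]]]
counts, total = reduce(merge, [partition_counts(p, 4) for p in partitions])
probs = [c / total for c in counts]  # feature probabilities
```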
Computes the weighted feature probabilities of sparse feature vector columns, using mapPartitions for efficiency and treeReduce to avoid OOM errors on the driver.
The dataframe to aggregate; it must have a double weight column at column 0 and a sparse vector column at column 1
The per-worker mini-batch size. Default: 256
The regularization rate for the latent factor weights. Default: 0.001f
The name of the integer array column containing the itemCol ids of the items to filter from the recommendations. If empty, recommendations are not filtered. Usually the arrays contain the ids of the items of the user.
Default: ""
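The filtering this parameter enables can be sketched in illustrative Python (the function name and data shapes are assumptions, not the library's API):

```python
def filter_recommendations(ranked_items, filter_items, k):
    # Drop the user's filter items from the ranked candidates, keep the top k.
    exclude = set(filter_items)
    return [item for item in ranked_items if item not in exclude][:k]

# Typical use: exclude the items the user already interacted with.
top = filter_recommendations([5, 3, 8, 1, 9], filter_items=[3, 9], k=3)
```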
Fits a GlintFMPairModel on the data set
The data set containing columns (userCol: Int, itemCol: Int, itemFeaturesCol: SparseVector, userctxFeaturesCol: SparseVector) and, if acceptance sampling is used, also samplingCol.
The name of the item id column, holding integers from 0 to the number of items in the training dataset. Default: "itemid"
The name of the item feature column of sparse vectors. Default: "itemfeatures"
The regularization rate for the linear weights. Default: 0.01f
Whether the meta data of the data frame to fit should be loaded from HDFS. This allows skipping the meta data computation stages when fitting on the same data frame with different parameters. Meta data for "crossbatch" and "uniform" sampling is compatible with each other, but "exp" requires its own meta data.
Default: false
The HDFS path to load meta data for the fit data frame from or to save the fitted meta data to. Default: ""
The number of latent factor dimensions (k). Default: 150
The number of parameter servers. Default: 3
The parameter server configuration. Allows for detailed configuration of the parameter servers with the default configuration as fallback. Default: ConfigFactory.empty()
The master host of the running parameter servers. If this is not set, a standalone parameter server cluster is started in this Spark application. Default: ""
The rho value to use for the "exp" sampler. Has to be between 0.0 and 1.0. Default: 1.0
The sampler to use.
"uniform" means sampling negative items uniformly, as originally proposed for BPR.
"exp" means sampling negative items with probability proportional to their exponential popularity distribution, as proposed in LambdaFM.
"crossbatch" means sampling negative items uniformly, but sharing them across the mini-batch with the crossbatch-BPR loss, as proposed in my master's thesis.
Default: "uniform"
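The difference between the samplers can be sketched in illustrative Python. The "exp" weighting below follows the rank-based exponential popularity distribution proposed in LambdaFM, where smaller rho concentrates sampling on popular items; the exact form used by this implementation is an assumption here:

```python
import math, random

def sample_uniform(num_items, rng=random):
    # "uniform": every item is equally likely to be drawn as a negative item.
    return rng.randrange(num_items)

def exp_popularity_probs(num_items, rho):
    # "exp": weight items by an exponential function of their popularity rank
    # (rank 0 = most popular), as in LambdaFM. Smaller rho concentrates the
    # sampling probability mass on the most popular items.
    weights = [math.exp(-(rank + 1) / (num_items * rho))
               for rank in range(num_items)]
    total = sum(weights)
    return [w / total for w in weights]

probs = exp_popularity_probs(num_items=1000, rho=0.3)
# popular items (low ranks) are sampled more often than unpopular ones
```

"crossbatch" draws its negatives uniformly in the same way, but reuses each drawn item as a shared negative for every instance in the mini-batch.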
The name of the column of integers to use for acceptance sampling. If empty, all items are accepted as negative items; otherwise an item is only accepted if there is no interaction between the user and the sampling column value of the item. Usually the sampling column is the same as itemCol, but it may also be another column with an n-to-1 relation from item column value to sampling column value.
Consider the example of playlists with "pid" as user column and tracks with "traid" as item column. Another column "artid" holds the artist of the track. With "traid" as sampling column, only tracks which are not in the playlist are accepted as negative items. With "artid" as sampling column, only tracks whose artists are not in the playlist are accepted as negative items.
Default: ""
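In illustrative Python, the acceptance test for the playlist example above might look like this (names and data shapes are hypothetical, not the library's internals):

```python
def accept_negative(user, item, item_to_sampling_value, user_sampling_values):
    # Accept a sampled negative item only if the user has no interaction
    # with the item's sampling column value.
    return item_to_sampling_value[item] not in user_sampling_values[user]

# Playlist example: items are tracks ("traid"), sampling column is the artist ("artid").
track_artist = {0: "a1", 1: "a1", 2: "a2"}   # traid -> artid
playlist_artists = {"p0": {"a1"}}            # pid -> artids occurring in the playlist
ok_track_1 = accept_negative("p0", 1, track_artist, playlist_artists)  # artist in playlist
ok_track_2 = accept_negative("p0", 2, track_artist, playlist_artists)  # artist not in playlist
```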
Whether the meta data of the fitted data frame should be saved to HDFS. Default: false
The depth to use for treeReduce when computing the meta data. To avoid OOM errors this has to be set sufficiently large, but lower depths might lead to faster runtimes.
The name of the user id column of integers. Default: "userid"
The name of the user and context feature column of sparse vectors. Default: "userctxfeatures"
Distributed pairwise factorization machine / LightFM.
Pairwise factorization machines are trained on implicit-feedback training instances to rank all items that appear in observed user-item training instances above all other items for the user, using Bayesian personalized ranking (BPR).
This is an implementation using Glint parameter servers with custom methods for network-efficient training. A Spark application running the parameter servers has to be started beforehand and the host of the parameter server master passed as a parameter to this implementation; otherwise a standalone parameter server cluster is started within this Spark application.
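To make the BPR objective concrete, here is a minimal SGD step in illustrative Python for a plain matrix-factorization scoring function; the actual model scores pairs with factorization-machine features and applies its updates on the parameter servers, so this is a sketch of the loss, not of the implementation:

```python
import math

def bpr_update(user_vec, pos_vec, neg_vec, lr=0.05, reg=0.001):
    # One SGD step of BPR: push the score of the observed (positive) item
    # above the score of the sampled negative item for this user.
    dot = lambda a, b: sum(x * y for x, y in zip(a, b))
    x_uij = dot(user_vec, pos_vec) - dot(user_vec, neg_vec)
    g = 1.0 / (1.0 + math.exp(x_uij))  # sigmoid(-x_uij), the gradient scale
    for f in range(len(user_vec)):
        u, p, n = user_vec[f], pos_vec[f], neg_vec[f]
        user_vec[f] += lr * (g * (p - n) - reg * u)
        pos_vec[f] += lr * (g * u - reg * p)
        neg_vec[f] += lr * (-g * u - reg * n)
    return x_uij  # score difference before the update

u, p, n = [0.3, -0.1], [0.0, 0.2], [0.2, 0.0]
for _ in range(100):
    last = bpr_update(u, p, n)
```

Repeated updates increase the score difference between the positive and the negative item, which is exactly the ranking property described above.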