Packages

class SmartVectorAssembler extends Transformer

This Transformer creates a needed Dataframe for common ML approaches in Spark MLlib. The resulting Dataframe consists of a column features which is a numeric vector for each entity The other columns are a identifier column like the node id And optional column for label

Linear Supertypes
Transformer, PipelineStage, Logging, Params, Serializable, Serializable, Identifiable, AnyRef, Any
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. SmartVectorAssembler
  2. Transformer
  3. PipelineStage
  4. Logging
  5. Params
  6. Serializable
  7. Serializable
  8. Identifiable
  9. AnyRef
  10. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. All

Instance Constructors

  1. new SmartVectorAssembler()

Value Members

  1. final def !=(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  2. final def ##(): Int
    Definition Classes
    AnyRef → Any
  3. final def $[T](param: Param[T]): T
    Attributes
    protected
    Definition Classes
    Params
  4. final def ==(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  5. var _entityColumn: String
  6. var _featureColumns: List[String]
  7. var _labelColumn: String
  8. var _nullReplacement: Int
  9. var _numericCollapsingStrategy: String
  10. var _stringCollapsingStrategy: String
  11. final def asInstanceOf[T0]: T0
    Definition Classes
    Any
  12. final def clear(param: Param[_]): SmartVectorAssembler.this.type
    Definition Classes
    Params
  13. def clone(): AnyRef
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( ... ) @native()
  14. def copy(extra: ParamMap): Transformer
    Definition Classes
    SmartVectorAssembler → Transformer → PipelineStage → Params
  15. def copyValues[T <: Params](to: T, extra: ParamMap): T
    Attributes
    protected
    Definition Classes
    Params
  16. final def defaultCopy[T <: Params](extra: ParamMap): T
    Attributes
    protected
    Definition Classes
    Params
  17. final def eq(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  18. def equals(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  19. def explainParam(param: Param[_]): String
    Definition Classes
    Params
  20. def explainParams(): String
    Definition Classes
    Params
  21. final def extractParamMap(): ParamMap
    Definition Classes
    Params
  22. final def extractParamMap(extra: ParamMap): ParamMap
    Definition Classes
    Params
  23. def finalize(): Unit
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( classOf[java.lang.Throwable] )
  24. final def get[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  25. final def getClass(): Class[_]
    Definition Classes
    AnyRef → Any
    Annotations
    @native()
  26. final def getDefault[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  27. final def getOrDefault[T](param: Param[T]): T
    Definition Classes
    Params
  28. def getParam(paramName: String): Param[Any]
    Definition Classes
    Params
  29. final def hasDefault[T](param: Param[T]): Boolean
    Definition Classes
    Params
  30. def hasParam(paramName: String): Boolean
    Definition Classes
    Params
  31. def hashCode(): Int
    Definition Classes
    AnyRef → Any
    Annotations
    @native()
  32. def initializeLogIfNecessary(isInterpreter: Boolean, silent: Boolean): Boolean
    Attributes
    protected
    Definition Classes
    Logging
  33. def initializeLogIfNecessary(isInterpreter: Boolean): Unit
    Attributes
    protected
    Definition Classes
    Logging
  34. final def isDefined(param: Param[_]): Boolean
    Definition Classes
    Params
  35. final def isInstanceOf[T0]: Boolean
    Definition Classes
    Any
  36. final def isSet(param: Param[_]): Boolean
    Definition Classes
    Params
  37. def isTraceEnabled(): Boolean
    Attributes
    protected
    Definition Classes
    Logging
  38. def log: Logger
    Attributes
    protected
    Definition Classes
    Logging
  39. def logDebug(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  40. def logDebug(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  41. def logError(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  42. def logError(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  43. def logInfo(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  44. def logInfo(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  45. def logName: String
    Attributes
    protected
    Definition Classes
    Logging
  46. def logTrace(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  47. def logTrace(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  48. def logWarning(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  49. def logWarning(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  50. final def ne(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  51. final def notify(): Unit
    Definition Classes
    AnyRef
    Annotations
    @native()
  52. final def notifyAll(): Unit
    Definition Classes
    AnyRef
    Annotations
    @native()
  53. lazy val params: Array[Param[_]]
    Definition Classes
    Params
  54. final def set(paramPair: ParamPair[_]): SmartVectorAssembler.this.type
    Attributes
    protected
    Definition Classes
    Params
  55. final def set(param: String, value: Any): SmartVectorAssembler.this.type
    Attributes
    protected
    Definition Classes
    Params
  56. final def set[T](param: Param[T], value: T): SmartVectorAssembler.this.type
    Definition Classes
    Params
  57. final def setDefault(paramPairs: ParamPair[_]*): SmartVectorAssembler.this.type
    Attributes
    protected
    Definition Classes
    Params
  58. final def setDefault[T](param: Param[T], value: T): SmartVectorAssembler.this.type
    Attributes
    protected
    Definition Classes
    Params
  59. def setEntityColumn(p: String): SmartVectorAssembler.this.type

    set which columns represents the entity if not set first column is used

    set which columns represents the entity if not set first column is used

    p

    entity columnName as string

    returns

    set transformer

  60. def setFeatureColumns(p: List[String]): SmartVectorAssembler.this.type

    set which columns represents the features, if not set all but label and entity are used

    set which columns represents the features, if not set all but label and entity are used

    p

    label columnName as string

    returns

    set transformer

  61. def setLabelColumn(p: String): SmartVectorAssembler.this.type

    set which columns represents the labl, if not set no label column

    set which columns represents the labl, if not set no label column

    p

    label columnName as string

    returns

    set transformer

  62. val spark: SparkSession
    Attributes
    protected
  63. final def synchronized[T0](arg0: ⇒ T0): T0
    Definition Classes
    AnyRef
  64. def toString(): String
    Definition Classes
    Identifiable → AnyRef → Any
  65. def transform(dataset: Dataset[_]): DataFrame

    transforms a dataframe of query results to a numeric feature vectors and a id and label column

    transforms a dataframe of query results to a numeric feature vectors and a id and label column

    dataset

    dataframe with columns for id features and optional label

    returns

    dataframe with columns id features and optional label where features are numeric vectors which incooperate with mllib

    Definition Classes
    SmartVectorAssembler → Transformer
  66. def transform(dataset: Dataset[_], paramMap: ParamMap): DataFrame
    Definition Classes
    Transformer
    Annotations
    @Since( "2.0.0" )
  67. def transform(dataset: Dataset[_], firstParamPair: ParamPair[_], otherParamPairs: ParamPair[_]*): DataFrame
    Definition Classes
    Transformer
    Annotations
    @Since( "2.0.0" ) @varargs()
  68. def transformSchema(schema: StructType): StructType
    Definition Classes
    SmartVectorAssembler → PipelineStage
  69. def transformSchema(schema: StructType, logging: Boolean): StructType
    Attributes
    protected
    Definition Classes
    PipelineStage
    Annotations
    @DeveloperApi()
  70. val uid: String
    Definition Classes
    SmartVectorAssembler → Identifiable
  71. def validateEntityColumn(cols: Seq[String]): Unit

    Validate set column to check if we need fallback to first column if not set and if set if it is in available cols

    Validate set column to check if we need fallback to first column if not set and if set if it is in available cols

    cols

    the available columns

  72. def validateFeatureColumns(cols: Seq[String]): Unit

    validate the feature columns if feature columns are set, check if those are in avaiable columns if not raise exception if not set determine feature columns by all columns minus the label and entty column

  73. def validateLabelColumn(cols: Seq[String]): Unit

    validate if label is in available columns

    validate if label is in available columns

    cols

    the avaiable columns

  74. final def wait(): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  75. final def wait(arg0: Long, arg1: Int): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( ... )
  76. final def wait(arg0: Long): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( ... ) @native()

Inherited from Transformer

Inherited from PipelineStage

Inherited from Logging

Inherited from Params

Inherited from Serializable

Inherited from Serializable

Inherited from Identifiable

Inherited from AnyRef

Inherited from Any

Ungrouped