Skip to content

Commit

Permalink
more doc for Transformer
Browse files Browse the repository at this point in the history
  • Loading branch information
mengxr committed Nov 11, 2014
1 parent 4306ed4 commit ad678e9
Show file tree
Hide file tree
Showing 3 changed files with 18 additions and 4 deletions.
4 changes: 3 additions & 1 deletion mllib/src/main/scala/org/apache/spark/ml/Model.scala
Original file line number Diff line number Diff line change
Expand Up @@ -20,7 +20,9 @@ package org.apache.spark.ml
import org.apache.spark.ml.param.ParamMap

/**
* A fitted model.
* A fitted model, i.e., a [[Transformer]] produced by an [[Estimator]].
*
* @tparam M model type
*/
abstract class Model[M <: Model[M]] extends Transformer {
/**
Expand Down
2 changes: 1 addition & 1 deletion mllib/src/main/scala/org/apache/spark/ml/Pipeline.scala
Original file line number Diff line number Diff line change
Expand Up @@ -34,7 +34,7 @@ abstract class PipelineStage extends Serializable with Logging {
def transform(schema: StructType, paramMap: ParamMap): StructType

/**
* Drives the output schema from the input schema and parameters, optionally with logging.
* Derives the output schema from the input schema and parameters, optionally with logging.
*/
protected def transform(schema: StructType, paramMap: ParamMap, logging: Boolean): StructType = {
if (logging) {
Expand Down
16 changes: 14 additions & 2 deletions mllib/src/main/scala/org/apache/spark/ml/Transformer.scala
Original file line number Diff line number Diff line change
Expand Up @@ -48,20 +48,32 @@ abstract class Transformer extends PipelineStage with Params {
}

/**
* Transforms the dataset with provided parameter map as additional parameters.
* @param dataset input dataset
* @param paramMap additional parameters, overwrite embedded params
* @return transformed dataset
*/
def transform(dataset: SchemaRDD, paramMap: ParamMap): SchemaRDD

// Java-friendly versions of transform.

/**
* Java-friendly variant of `transform` that accepts optional param pairs.
*
* Unwraps the underlying dataset via `schemaRDD`, delegates to the varargs overload of
* `transform` on it, and converts the result back with `toJavaSchemaRDD`.
*
* @param dataset input dataset
* @param paramPairs optional list of param pairs, overwrite embedded params
* @return transformed dataset
*/
@varargs
def transform(dataset: JavaSchemaRDD, paramPairs: ParamPair[_]*): JavaSchemaRDD = {
  val transformed = transform(dataset.schemaRDD, paramPairs: _*)
  transformed.toJavaSchemaRDD
}

/**
* Java-friendly variant of `transform` that accepts a parameter map.
*
* Unwraps the underlying dataset via `schemaRDD`, delegates to the overload of `transform`
* taking a parameter map, and converts the result back with `toJavaSchemaRDD`.
*
* @param dataset input dataset
* @param paramMap additional parameters, overwrite embedded params
* @return transformed dataset
*/
def transform(dataset: JavaSchemaRDD, paramMap: ParamMap): JavaSchemaRDD = {
  val transformed = transform(dataset.schemaRDD, paramMap)
  transformed.toJavaSchemaRDD
}
Expand Down

0 comments on commit ad678e9

Please sign in to comment.