org.apache.spark.ml.Predictor<FeaturesType,Learner,M>

org.apache.spark.ml.regression.Regressor<Vector,AFTSurvivalRegression,AFTSurvivalRegressionModel>

org.apache.spark.ml.regression.AFTSurvivalRegression

All Implemented Interfaces: Serializable, org.apache.spark.internal.Logging, Params, HasAggregationDepth, HasFeaturesCol, HasFitIntercept, HasLabelCol, HasMaxBlockSizeInMB, HasMaxIter, HasPredictionCol, HasTol, PredictorParams, AFTSurvivalRegressionParams, DefaultParamsWritable, Identifiable, MLWritable

public class AFTSurvivalRegression extends Regressor<Vector,AFTSurvivalRegression,AFTSurvivalRegressionModel> implements AFTSurvivalRegressionParams, DefaultParamsWritable, org.apache.spark.internal.Logging

Fit a parametric survival regression model known as the accelerated failure time (AFT) model (see Accelerated failure time model (Wikipedia)), based on the Weibull distribution of the survival time.

Since 3.1.0, it supports stacking instances into blocks and using GEMV for better performance. If param maxBlockSizeInMB is left at its default value of 0.0, a block size of 1.0 MB is used.

See Also:

Serialized Form

Nested Class Summary

Nested classes/interfaces inherited from interface org.apache.spark.internal.Logging
org.apache.spark.internal.Logging.LogStringContext, org.apache.spark.internal.Logging.SparkShellLoggingFilter
Constructor Summary

Constructors

Constructor

Description

AFTSurvivalRegression()

AFTSurvivalRegression(String uid)
Method Summary

Modifier and Type

Method

Description

final IntParam

aggregationDepth()

Param for suggested depth for treeAggregate (>= 2).

final Param<String>

censorCol()

Param for censor column name.

AFTSurvivalRegression

copy(ParamMap extra)

Creates a copy of this instance with the same UID and some extra params.

final BooleanParam

fitIntercept()

Param for whether to fit an intercept term.

static AFTSurvivalRegression

load(String path)

final DoubleParam

maxBlockSizeInMB()

Param for Maximum memory in MB for stacking input data into blocks.

final IntParam

maxIter()

Param for maximum number of iterations (>= 0).

final DoubleArrayParam

quantileProbabilities()

Param for quantile probabilities array.

final Param<String>

quantilesCol()

Param for quantiles column name.

static MLReader<T>

read()

AFTSurvivalRegression

setAggregationDepth(int value)

Suggested depth for treeAggregate (greater than or equal to 2).

AFTSurvivalRegression

setCensorCol(String value)

AFTSurvivalRegression

setFitIntercept(boolean value)

Set if we should fit the intercept. Default is true.

AFTSurvivalRegression

setMaxBlockSizeInMB(double value)

Sets the value of param maxBlockSizeInMB().

AFTSurvivalRegression

setMaxIter(int value)

Set the maximum number of iterations.

AFTSurvivalRegression

setQuantileProbabilities(double[] value)

AFTSurvivalRegression

setQuantilesCol(String value)

AFTSurvivalRegression

setTol(double value)

Set the convergence tolerance of iterations.

final DoubleParam

tol()

Param for the convergence tolerance for iterative algorithms (>= 0).

StructType

transformSchema(StructType schema)

Check transform validity and derive the output schema from the input schema.

String

uid()

An immutable unique ID for the object and its derivatives.

Methods inherited from class org.apache.spark.ml.Predictor
featuresCol, fit, labelCol, predictionCol, setFeaturesCol, setLabelCol, setPredictionCol

Methods inherited from class org.apache.spark.ml.Estimator
fit, fit, fit, fit

Methods inherited from class org.apache.spark.ml.PipelineStage
params

Methods inherited from class java.lang.Object
equals, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait

Methods inherited from interface org.apache.spark.ml.regression.AFTSurvivalRegressionParams
getCensorCol, getQuantileProbabilities, getQuantilesCol, hasQuantilesCol, validateAndTransformSchema

Methods inherited from interface org.apache.spark.ml.util.DefaultParamsWritable
write

Methods inherited from interface org.apache.spark.ml.param.shared.HasAggregationDepth
getAggregationDepth

Methods inherited from interface org.apache.spark.ml.param.shared.HasFeaturesCol
featuresCol, getFeaturesCol

Methods inherited from interface org.apache.spark.ml.param.shared.HasFitIntercept
getFitIntercept

Methods inherited from interface org.apache.spark.ml.param.shared.HasLabelCol
getLabelCol, labelCol

Methods inherited from interface org.apache.spark.ml.param.shared.HasMaxBlockSizeInMB
getMaxBlockSizeInMB

Methods inherited from interface org.apache.spark.ml.param.shared.HasMaxIter
getMaxIter

Methods inherited from interface org.apache.spark.ml.param.shared.HasPredictionCol
getPredictionCol, predictionCol

Methods inherited from interface org.apache.spark.ml.param.shared.HasTol
getTol

Methods inherited from interface org.apache.spark.ml.util.Identifiable
toString

Methods inherited from interface org.apache.spark.internal.Logging
initializeForcefully, initializeLogIfNecessary, initializeLogIfNecessary, initializeLogIfNecessary$default$2, isTraceEnabled, log, logDebug, logDebug, logDebug, logDebug, logError, logError, logError, logError, logInfo, logInfo, logInfo, logInfo, logName, LogStringContext, logTrace, logTrace, logTrace, logTrace, logWarning, logWarning, logWarning, logWarning, org$apache$spark$internal$Logging$$log_, org$apache$spark$internal$Logging$$log__$eq, withLogContext

Methods inherited from interface org.apache.spark.ml.util.MLWritable
save

Methods inherited from interface org.apache.spark.ml.param.Params
clear, copyValues, defaultCopy, defaultParamMap, explainParam, explainParams, extractParamMap, extractParamMap, get, getDefault, getOrDefault, getParam, hasDefault, hasParam, isDefined, isSet, onParamChange, paramMap, params, set, set, set, setDefault, setDefault, shouldOwn

Methods inherited from interface org.apache.spark.ml.PredictorParams
validateAndTransformSchema

Constructor Details
- AFTSurvivalRegression
  
  public AFTSurvivalRegression(String uid)
- AFTSurvivalRegression
  
  public AFTSurvivalRegression()
Method Details
- load
  
  public static AFTSurvivalRegression load(String path)
- read
  
  public static MLReader<T> read()
- censorCol
  
  public final Param<String> censorCol()
  
  Description copied from interface: AFTSurvivalRegressionParams
  
  Param for censor column name. The value of this column can be 0 or 1. If the value is 1, the event has occurred (i.e., the observation is uncensored); otherwise it is censored.
  
  Specified by:
  
  censorCol in interface AFTSurvivalRegressionParams
  
  Returns:
  
  (undocumented)
- quantileProbabilities
  
  public final DoubleArrayParam quantileProbabilities()
  
  Description copied from interface: AFTSurvivalRegressionParams
  
  Param for quantile probabilities array. Values of the quantile probabilities array should be in the range (0, 1) and the array should be non-empty.
  
  Specified by:
  
  quantileProbabilities in interface AFTSurvivalRegressionParams
  
  Returns:
  
  (undocumented)
- quantilesCol
  
  public final Param<String> quantilesCol()
  
  Description copied from interface: AFTSurvivalRegressionParams
  
  Param for quantiles column name. This column will output quantiles of corresponding quantileProbabilities if it is set.
  
  Specified by:
  
  quantilesCol in interface AFTSurvivalRegressionParams
  
  Returns:
  
  (undocumented)
- maxBlockSizeInMB
  
  public final DoubleParam maxBlockSizeInMB()
  
  Description copied from interface: HasMaxBlockSizeInMB
  
  Param for Maximum memory in MB for stacking input data into blocks. Data is stacked within partitions. If this value is larger than the remaining data size in a partition, it is adjusted to the data size. The default of 0.0 means an optimal value is chosen, which depends on the specific algorithm. Must be >= 0.
  
  Specified by:
  
  maxBlockSizeInMB in interface HasMaxBlockSizeInMB
  
  Returns:
  
  (undocumented)
- aggregationDepth
  
  public final IntParam aggregationDepth()
  
  Description copied from interface: HasAggregationDepth
  
  Param for suggested depth for treeAggregate (>= 2).
  
  Specified by:
  
  aggregationDepth in interface HasAggregationDepth
  
  Returns:
  
  (undocumented)
- fitIntercept
  
  public final BooleanParam fitIntercept()
  
  Description copied from interface: HasFitIntercept
  
  Param for whether to fit an intercept term.
  
  Specified by:
  
  fitIntercept in interface HasFitIntercept
  
  Returns:
  
  (undocumented)
- tol
  
  public final DoubleParam tol()
  
  Description copied from interface: HasTol
  
  Param for the convergence tolerance for iterative algorithms (>= 0).
  
  Specified by:
  
  tol in interface HasTol
  
  Returns:
  
  (undocumented)
- maxIter
  
  public final IntParam maxIter()
  
  Description copied from interface: HasMaxIter
  
  Param for maximum number of iterations (>= 0).
  
  Specified by:
  
  maxIter in interface HasMaxIter
  
  Returns:
  
  (undocumented)
- uid
  
  public String uid()
  
  Description copied from interface: Identifiable
  
  An immutable unique ID for the object and its derivatives.
  
  Specified by:
  
  uid in interface Identifiable
  
  Returns:
  
  (undocumented)
- setCensorCol
  
  public AFTSurvivalRegression setCensorCol(String value)
- setQuantileProbabilities
  
  public AFTSurvivalRegression setQuantileProbabilities(double[] value)
- setQuantilesCol
  
  public AFTSurvivalRegression setQuantilesCol(String value)
- setFitIntercept
  
  public AFTSurvivalRegression setFitIntercept(boolean value)
  
  Set if we should fit the intercept. Default is true.
  
  Parameters:
  
  value - (undocumented)
  
  Returns:
  
  (undocumented)
- setMaxIter
  
  public AFTSurvivalRegression setMaxIter(int value)
  
  Set the maximum number of iterations. Default is 100.
  
  Parameters:
  
  value - (undocumented)
  
  Returns:
  
  (undocumented)
- setTol
  
  public AFTSurvivalRegression setTol(double value)
  
  Set the convergence tolerance of iterations. A smaller value leads to higher accuracy at the cost of more iterations. Default is 1E-6.
  
  Parameters:
  
  value - (undocumented)
  
  Returns:
  
  (undocumented)
- setAggregationDepth
  
  public AFTSurvivalRegression setAggregationDepth(int value)
  
  Suggested depth for treeAggregate (greater than or equal to 2). If the dimensions of features or the number of partitions are large, this param could be adjusted to a larger size. Default is 2.
  
  Parameters:
  
  value - (undocumented)
  
  Returns:
  
  (undocumented)
- setMaxBlockSizeInMB
  
  public AFTSurvivalRegression setMaxBlockSizeInMB(double value)
  
  Sets the value of param maxBlockSizeInMB(). Default is 0.0, in which case a block size of 1.0 MB is chosen.
  
  Parameters:
  
  value - (undocumented)
  
  Returns:
  
  (undocumented)
- transformSchema
  
  public StructType transformSchema(StructType schema)
  
  Description copied from class: PipelineStage
  
  Check transform validity and derive the output schema from the input schema.
  We check validity for interactions between parameters during transformSchema and raise an exception if any parameter value is invalid. Parameter value checks which do not depend on other parameters are handled by Param.validate().
  Typical implementation should first conduct verification on schema change and parameter validity, including complex parameter interaction checks.
  
  Overrides:
  
  transformSchema in class Predictor<Vector,AFTSurvivalRegression,AFTSurvivalRegressionModel>
  
  Parameters:
  
  schema - (undocumented)
  
  Returns:
  
  (undocumented)
- copy
  
  public AFTSurvivalRegression copy(ParamMap extra)
  
  Description copied from interface: Params
  
  Creates a copy of this instance with the same UID and some extra params. Subclasses should implement this method and set the return type properly. See defaultCopy().
  
  Specified by:
  
  copy in interface Params
  
  Specified by:
  
  copy in class Predictor<Vector,AFTSurvivalRegression,AFTSurvivalRegressionModel>
  
  Parameters:
  
  extra - (undocumented)
  
  Returns:
  
  (undocumented)

Class AFTSurvivalRegression

Nested Class Summary

Nested classes/interfaces inherited from interface org.apache.spark.internal.Logging

Constructor Summary

Method Summary

Methods inherited from class org.apache.spark.ml.Predictor

Methods inherited from class org.apache.spark.ml.Estimator

Methods inherited from class org.apache.spark.ml.PipelineStage

Methods inherited from class java.lang.Object

Methods inherited from interface org.apache.spark.ml.regression.AFTSurvivalRegressionParams

Methods inherited from interface org.apache.spark.ml.util.DefaultParamsWritable

Methods inherited from interface org.apache.spark.ml.param.shared.HasAggregationDepth

Methods inherited from interface org.apache.spark.ml.param.shared.HasFeaturesCol

Methods inherited from interface org.apache.spark.ml.param.shared.HasFitIntercept

Methods inherited from interface org.apache.spark.ml.param.shared.HasLabelCol

Methods inherited from interface org.apache.spark.ml.param.shared.HasMaxBlockSizeInMB

Methods inherited from interface org.apache.spark.ml.param.shared.HasMaxIter

Methods inherited from interface org.apache.spark.ml.param.shared.HasPredictionCol

Methods inherited from interface org.apache.spark.ml.param.shared.HasTol

Methods inherited from interface org.apache.spark.ml.util.Identifiable

Methods inherited from interface org.apache.spark.internal.Logging

Methods inherited from interface org.apache.spark.ml.util.MLWritable

Methods inherited from interface org.apache.spark.ml.param.Params

Methods inherited from interface org.apache.spark.ml.PredictorParams

Constructor Details

AFTSurvivalRegression

AFTSurvivalRegression

Method Details

load

read

censorCol

quantileProbabilities

quantilesCol

maxBlockSizeInMB

aggregationDepth

fitIntercept

tol

maxIter

uid

setCensorCol

setQuantileProbabilities

setQuantilesCol

setFitIntercept

setMaxIter

setTol

setAggregationDepth

setMaxBlockSizeInMB

transformSchema

copy