Skip to content

Commit

Permalink
DistriOptimizerV2 argument (intel-analytics#3003)
Browse files Browse the repository at this point in the history
* call DistriOptimizerV2
  • Loading branch information
Le-Zheng authored May 27, 2020
1 parent 79d67c8 commit 9d82101
Show file tree
Hide file tree
Showing 3 changed files with 102 additions and 29 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -37,6 +37,14 @@ sealed trait EngineType
case object MklBlas extends EngineType
case object MklDnn extends EngineType

/**
 * Identifies which distributed optimizer implementation should be used.
 *
 * The trait is sealed, so every implementation is declared in this file and
 * pattern matches over it can be checked for exhaustiveness by the compiler.
 */
sealed trait OptimizerVersion

// First-generation optimizer; this is the default when nothing is configured.
case object OptimizerV1 extends OptimizerVersion
// Second-generation optimizer (DistriOptimizerV2).
case object OptimizerV2 extends OptimizerVersion


object Engine {

Expand Down Expand Up @@ -215,6 +223,18 @@ object Engine {
}
}

/**
 * Currently selected optimizer version.
 *
 * Notice: set the system property `bigdl.optimizerVersion` to choose the version.
 * The property value is compared case-insensitively (lower-cased with Locale.ROOT);
 * when the property is not set, OptimizerV1 is used. Any other value makes
 * initialisation fail with an IllegalArgumentException.
 */
private var optimizerVersion: OptimizerVersion = {
  val requested = System.getProperty("bigdl.optimizerVersion", "optimizerv1")
  requested.toLowerCase(Locale.ROOT) match {
    case "optimizerv2" => OptimizerV2
    case "optimizerv1" => OptimizerV1
    // The binder is deliberately not named after the field to avoid shadowing it.
    case unknown => throw new IllegalArgumentException(s"Unknown type $unknown")
  }
}

// Thread pool for default use
@volatile private var _default: ThreadPool = null

Expand Down Expand Up @@ -314,6 +334,19 @@ object Engine {
nodeNum = n
}

/**
 * Replace the optimizer version that was picked up at initialisation.
 *
 * This method should only be used for test purpose.
 *
 * @param optimizerVersion the optimizer version to select from now on
 */
private[bigdl] def setOptimizerVersion(optimizerVersion: OptimizerVersion): Unit =
  this.optimizerVersion = optimizerVersion

/**
 * @return the optimizer version currently selected
 */
private[bigdl] def getOptimizerVersion(): OptimizerVersion = optimizerVersion

/**
* This method should only be used for test purpose.
*
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -27,6 +27,7 @@ import com.intel.analytics.bigdl.parameters.{ConstantClippingProcessor,
import com.intel.analytics.bigdl.tensor.TensorNumericMath.TensorNumeric
import com.intel.analytics.bigdl.utils._
import com.intel.analytics.bigdl.visualization.{TrainSummary, ValidationSummary}
import com.intel.analytics.bigdl.utils.Engine
import org.apache.log4j.Logger
import org.apache.spark.rdd.RDD

Expand Down Expand Up @@ -611,13 +612,24 @@ object Optimizer {
val _featurePaddingParam = if (featurePaddingParam != null) Some(featurePaddingParam) else None
val _labelPaddingParam = if (labelPaddingParam != null) Some(labelPaddingParam) else None

new DistriOptimizer[T](
_model = model,
_dataset = (DataSet.rdd(sampleRDD) ->
SampleToMiniBatch(batchSize, _featurePaddingParam, _labelPaddingParam))
.toDistributed(),
_criterion = criterion
).asInstanceOf[Optimizer[T, MiniBatch[T]]]
Engine.getOptimizerVersion() match {
case OptimizerV1 =>
new DistriOptimizer[T](
_model = model,
_dataset = (DataSet.rdd(sampleRDD) ->
SampleToMiniBatch(batchSize, _featurePaddingParam, _labelPaddingParam))
.toDistributed(),
_criterion = criterion
).asInstanceOf[Optimizer[T, MiniBatch[T]]]
case OptimizerV2 =>
new DistriOptimizerV2[T](
_model = model,
_dataset = (DataSet.rdd(sampleRDD) ->
SampleToMiniBatch(batchSize, _featurePaddingParam, _labelPaddingParam))
.toDistributed(),
_criterion = criterion
).asInstanceOf[Optimizer[T, MiniBatch[T]]]
}
}


Expand All @@ -640,13 +652,24 @@ object Optimizer {
batchSize: Int,
miniBatchImpl: MiniBatch[T]
)(implicit ev: TensorNumeric[T]): Optimizer[T, MiniBatch[T]] = {
new DistriOptimizer[T](
_model = model,
_dataset = (DataSet.rdd(sampleRDD) ->
SampleToMiniBatch(miniBatchImpl, batchSize, None))
.toDistributed(),
_criterion = criterion
).asInstanceOf[Optimizer[T, MiniBatch[T]]]
Engine.getOptimizerVersion() match {
case OptimizerV1 =>
new DistriOptimizer[T](
_model = model,
_dataset = (DataSet.rdd(sampleRDD) ->
SampleToMiniBatch(miniBatchImpl, batchSize, None))
.toDistributed(),
_criterion = criterion
).asInstanceOf[Optimizer[T, MiniBatch[T]]]
case OptimizerV2 =>
new DistriOptimizerV2[T](
_model = model,
_dataset = (DataSet.rdd(sampleRDD) ->
SampleToMiniBatch(miniBatchImpl, batchSize, None))
.toDistributed(),
_criterion = criterion
).asInstanceOf[Optimizer[T, MiniBatch[T]]]
}
}

/**
Expand All @@ -664,11 +687,20 @@ object Optimizer {
)(implicit ev: TensorNumeric[T]): Optimizer[T, D] = {
dataset match {
case d: DistributedDataSet[_] =>
new DistriOptimizer[T](
_model = model,
_dataset = d.toDistributed().asInstanceOf[DistributedDataSet[MiniBatch[T]]],
_criterion = criterion
).asInstanceOf[Optimizer[T, D]]
Engine.getOptimizerVersion() match {
case OptimizerV1 =>
new DistriOptimizer[T](
_model = model,
_dataset = d.toDistributed().asInstanceOf[DistributedDataSet[MiniBatch[T]]],
_criterion = criterion
).asInstanceOf[Optimizer[T, D]]
case OptimizerV2 =>
new DistriOptimizerV2[T](
_model = model,
_dataset = d.toDistributed().asInstanceOf[DistributedDataSet[MiniBatch[T]]],
_criterion = criterion
).asInstanceOf[Optimizer[T, D]]
}
case d: LocalDataSet[_] =>
new LocalOptimizer[T](
model = model,
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -2351,12 +2351,11 @@ class PythonBigDL[T: ClassTag](implicit ev: TensorNumeric[T]) extends Serializab
endTrigger: Trigger,
batchSize: Int): Optimizer[T, MiniBatch[T]] = {
val sampleRDD = toJSample(trainingRdd)

val optimizer = new DistriOptimizer(
_model = model,
_dataset = batching(DataSet.rdd(sampleRDD), batchSize)
val optimizer = Optimizer(
model = model,
dataset = batching(DataSet.rdd(sampleRDD), batchSize)
.asInstanceOf[DistributedDataSet[MiniBatch[T]]],
_criterion = criterion
criterion = criterion
).asInstanceOf[Optimizer[T, MiniBatch[T]]]
enrichOptimizer(optimizer, endTrigger, optimMethod.asScala.toMap)
}
Expand All @@ -2368,11 +2367,10 @@ class PythonBigDL[T: ClassTag](implicit ev: TensorNumeric[T]) extends Serializab
endTrigger: Trigger,
batchSize: Int): Optimizer[T, MiniBatch[T]] = {
val dataSet = trainDataSet -> ImageFeatureToMiniBatch[T](batchSize)

val optimizer = new DistriOptimizer(
_model = model,
_dataset = dataSet.asInstanceOf[DistributedDataSet[MiniBatch[T]]],
_criterion = criterion
val optimizer = Optimizer(
model = model,
dataset = dataSet.asInstanceOf[DistributedDataSet[MiniBatch[T]]],
criterion = criterion
).asInstanceOf[Optimizer[T, MiniBatch[T]]]
enrichOptimizer(optimizer, endTrigger, optimMethod.asScala.toMap)
}
Expand Down Expand Up @@ -2516,6 +2514,16 @@ class PythonBigDL[T: ClassTag](implicit ev: TensorNumeric[T]) extends Serializab
Array(Engine.nodeNumber(), Engine.coreNumber())
}

/**
 * Select the optimizer version from its string name.
 *
 * The name is matched case-insensitively. It is lower-cased with Locale.ROOT so
 * that the outcome does not depend on the JVM default locale (a Turkish default
 * locale, for instance, maps 'I' to a dotless 'ı' and would never match).
 *
 * @param version "OptimizerV1" or "OptimizerV2", in any letter case
 * @throws IllegalArgumentException if `version` is null or not a recognised name
 */
def setOptimizerVersion(version: String): Unit = {
  require(version != null, "optimizer version must not be null")
  val selected = version.toLowerCase(java.util.Locale.ROOT) match {
    case "optimizerv1" => OptimizerV1
    case "optimizerv2" => OptimizerV2
    // Fail with a descriptive error instead of an opaque scala.MatchError.
    case _ =>
      throw new IllegalArgumentException(
        s"Unknown optimizer version '$version', expected 'OptimizerV1' or 'OptimizerV2'")
  }
  Engine.setOptimizerVersion(selected)
}

/**
 * @return the `toString` of the optimizer version currently held by Engine
 */
def getOptimizerVersion(): String = Engine.getOptimizerVersion().toString

def setWeights(model: AbstractModule[Activity, Activity, T], weights: JList[JTensor]): Unit = {
val weightTensor = weights.asScala.toArray.map(toTensor(_))
Expand Down

0 comments on commit 9d82101

Please sign in to comment.