Skip to content

Commit 6fca645

Browse files
committed
[OPS] Fixed a bug in the beam search decoder.
1 parent 61f3490 commit 6fca645

File tree

2 files changed

+12
-9
lines changed

2 files changed

+12
-9
lines changed

modules/api/src/main/scala/org/platanios/tensorflow/api/core/types/package.scala

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -17,6 +17,8 @@ package org.platanios.tensorflow.api.core
1717

1818
import org.tensorflow.framework.DataType._
1919

20+
import scala.annotation.implicitNotFound
21+
2022
/**
2123
* @author Emmanouil Antonios Platanios
2224
*/
@@ -73,6 +75,7 @@ package object types {
7375

7476
//region Type Traits
7577

78+
@implicitNotFound(msg = "Cannot prove that ${T} is a supported TensorFlow data type.")
7679
trait TF[T] {
7780
@inline def dataType: org.platanios.tensorflow.api.core.types.DataType[T]
7881
}

modules/api/src/main/scala/org/platanios/tensorflow/api/ops/seq2seq/decoders/BeamSearchDecoder.scala

Lines changed: 9 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -155,12 +155,12 @@ class BeamSearchDecoder[T: TF, State: OutputStructure, StateShape](
155155
val initialState = BeamSearchDecoder.BeamSearchDecoderState[State](
156156
modelState = processedInitialCellState,
157157
logProbabilities = Basic.oneHot[Float, Int](
158-
indices = Basic.zeros[Int, Int](batchSize.expandDims(0)),
158+
indices = Basic.zeros[Int](batchSize.expandDims(0)),
159159
depth = beamWidth,
160160
onValue = Basic.zeros[Float](Shape()),
161161
offValue = Basic.constant(Float.MinValue)),
162162
finished = finished,
163-
sequenceLengths = Basic.zeros[Int, Int](Basic.stack[Int](Seq(batchSize, beamWidth))))
163+
sequenceLengths = Basic.zeros[Int](Basic.stack[Int](Seq(batchSize, beamWidth))))
164164
(finished, beginInput, initialState)
165165
}
166166
}
@@ -183,8 +183,8 @@ class BeamSearchDecoder[T: TF, State: OutputStructure, StateShape](
183183
BeamSearchDecoder.MaybeTensorConverter(
184184
BeamSearchDecoder.MergeBatchBeamsConverter(batchSize, beamWidth)))
185185
val mergedNextTuple = cell(Tuple(mergedInput, mergedCellState))
186-
val nextTupleOutput = BeamSearchDecoder.SplitBatchBeamsConverter(batchSize, beamWidth)(
187-
mergedNextTuple.output, Some(mergedNextTuple.output.shape(1 ::)))
186+
val nextTupleOutput = outputLayer(BeamSearchDecoder.SplitBatchBeamsConverter(batchSize, beamWidth)(
187+
mergedNextTuple.output, Some(mergedNextTuple.output.shape(1 ::))))
188188
val nextTupleState = evOutputToShapeState.map(
189189
mergedNextTuple.state, Some(cell.stateShape),
190190
BeamSearchDecoder.MaybeTensorConverter(
@@ -199,15 +199,15 @@ class BeamSearchDecoder[T: TF, State: OutputStructure, StateShape](
199199

200200
// Calculate the total log probabilities for the new hypotheses (final shape = [batchSize, beamWidth, vocabSize]).
201201
val stepLogProbabilities = BeamSearchDecoder.maskLogProbabilities(
202-
NN.logSoftmax(nextTupleOutput.castTo[Float]), endToken, previouslyFinished)
202+
NN.logSoftmax(nextTupleOutput.toFloat), endToken, previouslyFinished)
203203
val totalLogProbabilities = state.logProbabilities.expandDims(Output.constant[Int](2)) + stepLogProbabilities
204204

205205
// Calculate the continuation lengths by adding to all continuing search states.
206206
val vocabSize = {
207207
if (nextTupleOutput.shape(-1) != -1)
208208
Basic.constant(nextTupleOutput.shape(-1))
209209
else
210-
Basic.shape(nextTupleOutput).castTo[Int].slice(-1)
210+
Basic.shape(nextTupleOutput).toInt.slice(-1)
211211
}
212212

213213
var lengthsToAdd = Basic.oneHot[Int, Int](
@@ -221,7 +221,7 @@ class BeamSearchDecoder[T: TF, State: OutputStructure, StateShape](
221221
predictionLengths.expandDims(2))
222222

223223
// Calculate the scores for each search state.
224-
val scores = lengthPenalty(totalLogProbabilities, newPredictionLengths).castTo[Float]
224+
val scores = lengthPenalty(totalLogProbabilities, newPredictionLengths).toFloat
225225

226226
// During the first time step we only consider the initial search state.
227227
val scoresFlat = Basic.reshape(scores, Basic.stack[Int](Seq(batchSize, -1)))
@@ -240,8 +240,8 @@ class BeamSearchDecoder[T: TF, State: OutputStructure, StateShape](
240240
rangeSize = vocabSize * beamWidth,
241241
gatherShape = Seq(-1),
242242
name = "NextBeamLogProbabilities")
243-
val nextPredictedIDs = Math.mod(wordIndices, vocabSize, name = "NextBeamPredictedIDs").castTo[Int]
244-
val nextParentIDs = Math.divide(wordIndices, vocabSize, name = "NextBeamParentIDs").castTo[Int]
243+
val nextPredictedIDs = Math.mod(wordIndices, vocabSize, name = "NextBeamPredictedIDs").toInt
244+
val nextParentIDs = Math.divide(wordIndices, vocabSize, name = "NextBeamParentIDs").toInt
245245

246246
// Append the new IDs to the current predictions.
247247
val gatheredFinished = BeamSearchDecoder.gather(

0 commit comments

Comments (0)