Convert Catch/Gym examples to the new Layers API (#112)

brettkoonce · rxwei · commit 9e3ac1208ab7 · 2019-04-18T18:56:27.000-07:00
diff --git a/Catch/catch.swift b/Catch/catch.swift
@@ -44,13 +44,16 @@ protocol Agent: AnyObject {
 }
 
 struct Model: Layer {
+    typealias Input = Tensor<Float>
+    typealias Output = Tensor<Float>
+
     var layer1 = Dense<Float>(inputSize: 3, outputSize: 50, activation: sigmoid,
                               generator: &rng)
     var layer2 = Dense<Float>(inputSize: 50, outputSize: 3, activation: sigmoid,
                               generator: &rng)
 
     @differentiable
-    func applied(to input: Tensor<Float>) -> Tensor<Float> {
+    func call(_ input: Input) -> Output {
         return input.sequenced(through: layer1, layer2)
     }
 }
@@ -59,11 +62,11 @@ class CatchAgent: Agent {
     typealias Action = CatchAction
 
     var model: Model = Model()
-    let optimizer: Adam<Model, Float>
+    let optimizer: Adam<Model>
     var previousReward: Reward
 
     init(initialReward: Reward, learningRate: Float) {
-        optimizer = Adam(learningRate: learningRate)
+        optimizer = Adam(for: model, learningRate: learningRate)
         previousReward = initialReward
     }
 }
diff --git a/Gym/CartPole.swift b/Gym/CartPole.swift
@@ -37,6 +37,9 @@ fileprivate extension Optional {
 
 /// A simple two layer dense net.
 struct Net: Layer {
+    typealias Input = Tensor<Float>
+    typealias Output = Tensor<Float>
+
     var l1, l2: Dense<Float>
 
     init(observationSize: Int, hiddenSize: Int, actionCount: Int) {
@@ -48,7 +51,7 @@ struct Net: Layer {
     }
 
     @differentiable
-    func applied(to input: Tensor<Float>) -> Tensor<Float> {
+    func call(_ input: Input) -> Output {
         return input.sequenced(through: l1, l2)
     }
 }
@@ -132,7 +135,7 @@ func nextBatch(
         while true {
             let observationPython = Tensor<Double>(numpy: observationNumpy).unwrapped()
             let actionProbabilities =
-              softmax(net.applied(to: Tensor(observationPython).reshaped(to: [1, 4])))
+              softmax(net(Tensor(observationPython).reshaped(to: [1, 4])))
             let actionProbabilitiesPython = actionProbabilities[0].makeNumpyArray()
             let len = Python.len(actionProbabilitiesPython)
             assert(actionCount == Int(Python.len(actionProbabilitiesPython)))
@@ -169,7 +172,7 @@ let actionCount = Int(env.action_space.n).unwrapped()
 var net = Net(observationSize: Int(observationSize), hiddenSize: hiddenSize, actionCount: actionCount)
 // SGD optimizer reaches convergence with ~125 mini batches, while Adam uses ~25.
 // let optimizer = SGD<Net, Float>(learningRate: 0.1, momentum: 0.9)
-let optimizer = Adam<Net, Float>(learningRate: 0.01)
+let optimizer = Adam(for: net, learningRate: 0.01)
 var batchIndex = 0
 Context.local.learningPhase = .training
 while true {
@@ -181,7 +184,7 @@ while true {
       episodes: episodes, actionCount: actionCount)
 
     let gradients = gradient(at: net) { model -> Tensor<Float> in
-        let logits = model.applied(to: input)
+        let logits = model(input)
         let loss = softmaxCrossEntropy(logits: logits, probabilities: target)
         print("loss is \(loss)")
         return loss

Original file line number	Diff line number	Diff line change
`@@ -44,13 +44,16 @@ protocol Agent: AnyObject {`
`44`	`44`	`}`
`45`	`45`
`46`	`46`	`struct Model: Layer {`
	`47`	`+ typealias Input = Tensor<Float>`
	`48`	`+ typealias Output = Tensor<Float>`
	`49`	`+`
`47`	`50`	`var layer1 = Dense<Float>(inputSize: 3, outputSize: 50, activation: sigmoid,`
`48`	`51`	`generator: &rng)`
`49`	`52`	`var layer2 = Dense<Float>(inputSize: 50, outputSize: 3, activation: sigmoid,`
`50`	`53`	`generator: &rng)`
`51`	`54`
`52`	`55`	`@differentiable`
`53`		`- func applied(to input: Tensor<Float>) -> Tensor<Float> {`
	`56`	`+ func call(_ input: Input) -> Output {`
`54`	`57`	`return input.sequenced(through: layer1, layer2)`
`55`	`58`	`}`
`56`	`59`	`}`
`@@ -59,11 +62,11 @@ class CatchAgent: Agent {`
`59`	`62`	`typealias Action = CatchAction`
`60`	`63`
`61`	`64`	`var model: Model = Model()`
`62`		`- let optimizer: Adam<Model, Float>`
	`65`	`+ let optimizer: Adam<Model>`
`63`	`66`	`var previousReward: Reward`
`64`	`67`
`65`	`68`	`init(initialReward: Reward, learningRate: Float) {`
`66`		`- optimizer = Adam(learningRate: learningRate)`
	`69`	`+ optimizer = Adam(for: model, learningRate: learningRate)`
`67`	`70`	`previousReward = initialReward`
`68`	`71`	`}`
`69`	`72`	`}`