Add MNIST test.

dan-zheng · dan-zheng · commit 731ce402ce0b · 2019-01-22T17:58:32.000-08:00
diff --git a/Package.swift b/Package.swift
@@ -20,23 +20,20 @@ import PackageDescription
 let package = Package(
     name: "DeepLearning",
     products: [
-        // Products define the executables and libraries produced by a package, and make them visible to other packages.
         .library(
             name: "DeepLearning",
             targets: ["DeepLearning"]),
     ],
-    dependencies: [
-        // Dependencies declare other packages that this package depends on.
-        // .package(url: /* package url */, from: "1.0.0"),
-    ],
+    dependencies: [],
     targets: [
-        // Targets are the basic building blocks of a package. A target can define a module or a test suite.
-        // Targets can depend on other targets in this package, and on products in packages which this package depends on.
         .target(
             name: "DeepLearning",
             dependencies: []),
         .testTarget(
             name: "DeepLearningTests",
             dependencies: ["DeepLearning"]),
+        .testTarget(
+            name: "MNIST",
+            dependencies: ["DeepLearning"]),
     ]
 )
diff --git a/Tests/DeepLearningTests/TrivialModelTests.swift b/Tests/DeepLearningTests/TrivialModelTests.swift
@@ -24,8 +24,8 @@ final class TrivialModelTests: XCTestCase {
                 l2 = Dense<Float>(inputSize: hiddenSize, outputSize: 1)
             }
             func applied(to input: Tensor<Float>) -> Tensor<Float> {
-                let h1 = sigmoid(l1.applied(to: input))
-                return sigmoid(l2.applied(to: h1))
+                let h1 = relu(l1.applied(to: input))
+                return relu(l2.applied(to: h1))
             }
         }
         let optimizer = SGD<Classifier, Float>(learningRate: 0.02)
@@ -35,11 +35,9 @@ final class TrivialModelTests: XCTestCase {
         for _ in 0..<1000 {
             let (loss, 𝛁model) = classifier.valueWithGradient { classifier -> Tensor<Float> in
                 let ŷ = classifier.applied(to: x)
-                return (y - ŷ).squared().mean()
+                return meanSquaredError(predicted: ŷ, expected: y)
             }
-            print(loss)
-            optimizer.update(&classifier.allDifferentiableVariables,
-                             along: 𝛁model)
+            optimizer.update(&classifier.allDifferentiableVariables, along: 𝛁model)
         }
         print(classifier.applied(to: [[0, 0], [0, 1], [1, 0], [1, 1]]))
     }
diff --git a/Tests/DeepLearningTests/XCTestManifests.swift b/Tests/DeepLearningTests/XCTestManifests.swift
@@ -17,7 +17,8 @@ import XCTest
 #if !os(macOS)
 public func allTests() -> [XCTestCaseEntry] {
     return [
-        testCase(DeepLearningTests.allTests),
+        testCase(TrivialModelTests.allTests),
+        testCase(MNISTTests.allTests),
     ]
 }
 #endif
diff --git a/Tests/MNIST/MNIST.swift b/Tests/MNIST/MNIST.swift
@@ -0,0 +1,124 @@
+// Copyright 2018 The TensorFlow Authors. All Rights Reserved.
+//
+// Licensed under the Apache License, Version 2.0 (the "License");
+// you may not use this file except in compliance with the License.
+// You may obtain a copy of the License at
+//
+//     http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+import XCTest
+import Python
+@testable import DeepLearning
+
+// Python modules obtained through the `Python` interop module imported above.
+// `gzip` opens the compressed data files; `np` (NumPy) decodes their raw bytes.
+let gzip = Python.import("gzip")
+let np = Python.import("numpy")
+
+/// Reads a gzip-compressed image file and returns its pixels as floats.
+///
+/// The first 16 bytes of the decompressed data are skipped; the remaining bytes are read as
+/// `uint8`, converted to `float32` and divided by 255, so every returned value lies in `[0, 1]`.
+///
+/// - Parameter filename: Path of the gzip file, passed to Python's `gzip.open`.
+/// - Returns: All pixel values as one flat array.
+/// - Precondition: The NumPy result must be convertible to `[Float]`; otherwise the process
+///   stops with a message naming the file.
+func readImagesFile(_ filename: String) -> [Float] {
+    let file = gzip.open(filename, "rb").read()
+    // NOTE(review): offset 16 presumably skips the IDX3 header (magic number, image count,
+    // row count, column count) — confirm against the file format.
+    let data = np.frombuffer(file, dtype: np.uint8, offset: 16)
+    let array = data.astype(np.float32) / 255
+    // Fail with a diagnosable message instead of a bare force-unwrap crash.
+    guard let pixels = [Float](numpyArray: array) else {
+        fatalError("Could not convert image data from '\(filename)' to [Float].")
+    }
+    return pixels
+}
+
+/// Reads a gzip-compressed label file and returns its labels as 32-bit integers.
+///
+/// The first 8 bytes of the decompressed data are skipped; the remaining bytes are read as
+/// `uint8` and widened to `int32`.
+///
+/// - Parameter filename: Path of the gzip file, passed to Python's `gzip.open`.
+/// - Returns: One label per remaining byte, in file order.
+/// - Precondition: The NumPy result must be convertible to `[Int32]`; otherwise the process
+///   stops with a message naming the file.
+func readLabelsFile(_ filename: String) -> [Int32] {
+    let file = gzip.open(filename, "rb").read()
+    // NOTE(review): offset 8 presumably skips the IDX1 header (magic number, label count) —
+    // confirm against the file format.
+    let data = np.frombuffer(file, dtype: np.uint8, offset: 8)
+    let array = data.astype(np.int32)
+    // Fail with a diagnosable message instead of a bare force-unwrap crash.
+    guard let labels = [Int32](numpyArray: array) else {
+        fatalError("Could not convert label data from '\(filename)' to [Int32].")
+    }
+    return labels
+}
+
+/// Reads MNIST images and labels from specified file paths.
+///
+/// - Parameters:
+///   - imagesFile: Path of the gzip image file, forwarded to `readImagesFile`.
+///   - labelsFile: Path of the gzip label file, forwarded to `readLabelsFile`.
+/// - Returns: `images` shaped `[labelCount, pixelCount / labelCount]` (one row of pixels per
+///   label) and `labels` built directly from the label array.
+/// - Precondition: The label file is not empty and the pixel count is a multiple of the
+///   label count.
+func readMNIST(imagesFile: String, labelsFile: String)
+    -> (images: Tensor<Float>, labels: Tensor<Int32>) {
+    print("Reading data.")
+    let images = readImagesFile(imagesFile)
+    let labels = readLabelsFile(labelsFile)
+
+    // Guard the integer division below: an empty label file would otherwise trap on a
+    // division by zero, and a ragged pixel count would silently truncate the row width.
+    precondition(!labels.isEmpty, "Label file '\(labelsFile)' contains no labels.")
+    precondition(images.count % labels.count == 0,
+                 "Pixel count \(images.count) is not a multiple of label count \(labels.count).")
+    let rowCount = Int32(labels.count)
+    let columnCount = Int32(images.count) / rowCount
+
+    print("Constructing data tensors.")
+    // `readImagesFile` already divides every pixel by 255. Dividing again here would squash
+    // the inputs into [0, 1/255], so the scalars are used as returned.
+    let imagesTensor = Tensor(shape: [rowCount, columnCount], scalars: images)
+    let labelsTensor = Tensor(labels)
+    return (imagesTensor, labelsTensor)
+}
+
+/// A two-layer dense classifier: 784 inputs, a hidden layer of configurable width, 10 outputs.
+struct MNISTClassifier: Layer {
+    var l1: Dense<Float>
+    var l2: Dense<Float>
+
+    /// Creates a classifier whose hidden layer has `hiddenSize` units.
+    init(hiddenSize: Int) {
+        self.l1 = Dense<Float>(inputSize: 784, outputSize: hiddenSize)
+        self.l2 = Dense<Float>(inputSize: hiddenSize, outputSize: 10)
+    }
+
+    /// Applies `l1` followed by `sigmoid`, then `l2` followed by `logSoftmax`.
+    func applied(to input: Tensor<Float>) -> Tensor<Float> {
+        let hiddenActivations = sigmoid(l1.applied(to: input))
+        let outputScores = l2.applied(to: hiddenActivations)
+        return logSoftmax(outputScores)
+    }
+}
+
+/// Trains `MNISTClassifier` on the MNIST training files and prints per-epoch accuracy and loss.
+final class MNISTTests: XCTestCase {
+    /// Loads the training data, then runs minibatch training with `RMSProp`, printing the
+    /// accuracy and loss after every epoch.
+    ///
+    /// The test makes no assertions; it passes as long as training runs to completion.
+    func testMNIST() {
+        // Get training data.
+        // NOTE(review): these are bare file names, presumably resolved against the working
+        // directory of the test run — confirm that the ".gz" files are present there.
+        let (images, numericLabels) = readMNIST(imagesFile: "train-images-idx3-ubyte.gz",
+                                                labelsFile: "train-labels-idx1-ubyte.gz")
+        let labels = Tensor<Float>(oneHotAtIndices: numericLabels, depth: 10)
+
+        // Hyper-parameters. Declared before the optimizer so `learningRate` is actually used
+        // instead of being duplicated as a literal.
+        let epochCount = 20
+        let minibatchSize: Int32 = 10
+        let learningRate: Float = 0.2
+
+        let batchSize = images.shape[0]
+        let optimizer = RMSProp<MNISTClassifier, Float>(learningRate: learningRate)
+        var classifier = MNISTClassifier(hiddenSize: 30)
+
+        // Training loop.
+        print("Begin training for \(epochCount) epochs.")
+
+        /// Returns the `index`-th run of `minibatchSize` consecutive rows of `x`.
+        func minibatch<Scalar>(_ x: Tensor<Scalar>, index: Int32) -> Tensor<Scalar> {
+            let start = index * minibatchSize
+            return x[start..<start+minibatchSize]
+        }
+
+        // Half-open range: exactly `epochCount` passes, matching the message printed above.
+        for epoch in 0..<epochCount {
+            // Store information for printing accuracy and loss.
+            var correctPredictions = 0
+            var totalLoss: Float = 0
+
+            // Integer division: rows beyond the last full minibatch are not visited.
+            let iterationCount = batchSize / minibatchSize
+            for i in 0..<iterationCount {
+                let images = minibatch(images, index: i)
+                let numericLabels = minibatch(numericLabels, index: i)
+                let labels = minibatch(labels, index: i)
+
+                let (loss, 𝛁model) = classifier.valueWithGradient { classifier -> Tensor<Float> in
+                    let ŷ = classifier.applied(to: images)
+
+                    // Update number of correct predictions.
+                    let correctlyPredicted = ŷ.argmax(squeezingAxis: 1) .== numericLabels
+                    correctPredictions += Int(Tensor<Int32>(correctlyPredicted).sum().scalarized())
+
+                    // NOTE(review): the divisor 10 equals both `minibatchSize` and the class
+                    // count — confirm which one is intended before changing either.
+                    return -(labels * ŷ).sum() / Tensor(10)
+                }
+                optimizer.update(&classifier.allDifferentiableVariables, along: 𝛁model)
+                totalLoss += loss.scalarized()
+            }
+            // NOTE(review): `totalLoss` sums one value per minibatch but is divided by the
+            // number of examples — confirm the intended normalisation of the printed loss.
+            print("""
+                [Epoch \(epoch)] \
+                Accuracy: \(correctPredictions)/\(batchSize) \
+                (\(Float(correctPredictions) / Float(batchSize)))\t\
+                Loss: \(totalLoss / Float(batchSize))
+                """)
+        }
+        print("Done training MNIST.")
+    }
+
+    static var allTests = [
+        ("testMNIST", testMNIST),
+    ]
+}
diff --git a/Tests/MNIST/train-images-idx3-ubyte b/Tests/MNIST/train-images-idx3-ubyte
diff --git a/Tests/MNIST/train-labels-idx1-ubyte b/Tests/MNIST/train-labels-idx1-ubyte

Original file line number	Diff line number	Diff line change
`@@ -24,8 +24,8 @@ final class TrivialModelTests: XCTestCase {`
`24`	`24`	`l2 = Dense<Float>(inputSize: hiddenSize, outputSize: 1)`
`25`	`25`	`}`
`26`	`26`	`func applied(to input: Tensor<Float>) -> Tensor<Float> {`
`27`		`- let h1 = sigmoid(l1.applied(to: input))`
`28`		`- return sigmoid(l2.applied(to: h1))`
	`27`	`+ let h1 = relu(l1.applied(to: input))`
	`28`	`+ return relu(l2.applied(to: h1))`
`29`	`29`	`}`
`30`	`30`	`}`
`31`	`31`	`let optimizer = SGD<Classifier, Float>(learningRate: 0.02)`
`@@ -35,11 +35,9 @@ final class TrivialModelTests: XCTestCase {`
`35`	`35`	`for _ in 0..<1000 {`
`36`	`36`	`let (loss, 𝛁model) = classifier.valueWithGradient { classifier -> Tensor<Float> in`
`37`	`37`	`let ŷ = classifier.applied(to: x)`
`38`		`- return (y - ŷ).squared().mean()`
	`38`	`+ return meanSquaredError(predicted: ŷ, expected: y)`
`39`	`39`	`}`
`40`		`- print(loss)`
`41`		`- optimizer.update(&classifier.allDifferentiableVariables,`
`42`		`- along: 𝛁model)`
	`40`	`+ optimizer.update(&classifier.allDifferentiableVariables, along: 𝛁model)`
`43`	`41`	`}`
`44`	`42`	`print(classifier.applied(to: [[0, 0], [0, 1], [1, 0], [1, 1]]))`
`45`	`43`	`}`
Original file line number	Diff line number	Diff line change
`@@ -17,7 +17,8 @@ import XCTest`
`17`	`17`	`#if !os(macOS)`
`18`	`18`	`public func allTests() -> [XCTestCaseEntry] {`
`19`	`19`	`return [`
`20`		`- testCase(DeepLearningTests.allTests),`
	`20`	`+ testCase(TrivialModelTests.allTests),`
	`21`	`+ testCase(MNISTTests.allTests),`
`21`	`22`	`]`
`22`	`23`	`}`
`23`	`24`	`#endif`