Digits MNist implemented, the CNN version is blocked on a backprop implementation and digits. Waiting on updates to Tensorflow.Net
fsprojects · Jun 2, 2019 · d853018 · d853018 · Oceania2018 · Jul 15, 2019
1 parent 9a8077b
commit d853018
Show file tree

Hide file tree

Showing 9 changed files with 644 additions and 6 deletions.
diff --git a/RunTest2/MNist.fs b/RunTest2/MNist.fs
@@ -0,0 +1,217 @@
+module MNist
+
+//#I __SOURCE_DIRECTORY__
+//#r "netstandard"
+//#I "../tests/bin/Debug/net461/"
+//#r "TensorFlow.FSharp.dll"
+//#r "ArrayFire.dll"
+//#r "TensorFlow.Net.dll"
+//#r "NumSharp.Core.dll"
+//#r "TensorFlow.FSharp.Tests.dll"
+//#r "ICSharpCode.SharpZipLib.dll"
+//#r "System.IO.Compression.dll"
+//#r "System.IO.Compression.FileSystem.dll"
+////#r "System.IO.Compression.Brotli.dll"
+//#r "System.IO.Compression.ZipFile.dll"
+//#r "System.Runtime.Extensions.dll"
+//
+
+open System
+open System.IO
+open System.IO.Compression
+
+open System.Net
+open System.Linq
+open System.Threading
+open System.Threading.Tasks
+open Tensorflow
+open NumSharp
+
+/// Helpers for unpacking downloaded archives.
+type Compress() = 
+    /// Decompresses the gzip file `gzipFileName` into `targetDir`.
+    /// The output file is named after the archive with its last extension removed
+    /// (e.g. "train-images-idx3-ubyte.gz" -> "train-images-idx3-ubyte").
+    /// The archive is read fully into memory and inflated in a single call.
+    static member ExtractGZip(gzipFileName : string, targetDir : string) =
+        let fnOut = Path.Combine(targetDir, Path.GetFileNameWithoutExtension(gzipFileName))
+        // No separate FileStream is opened here: ReadAllBytes manages its own handle,
+        // so nothing is left open while the output is being written.
+        let inflated = Ionic.Zlib.GZipStream.UncompressBuffer(File.ReadAllBytes(gzipFileName))
+        File.WriteAllBytes(fnOut, inflated)
+
+    /// Extracts the zip archive `gzArchiveName` into `destFolder` unless a marker file
+    /// "<archive-base-name>.bin" already exists there. The marker is created only after
+    /// a successful extraction. Progress dots are printed while the extraction runs.
+    /// Raises AggregateException (from Task.Wait) if the extraction fails.
+    static member UnZip(gzArchiveName : string, destFolder : string) =
+        let flag = gzArchiveName.Split(Path.DirectorySeparatorChar).Last().Split('.').First() + ".bin"
+        let flagPath = Path.Combine(destFolder, flag)
+        if not(File.Exists(flagPath)) then
+            printfn "Extracting."
+            let task = Task.Run(fun () -> ZipFile.ExtractToDirectory(gzArchiveName, destFolder))
+            while (not task.IsCompleted) do
+                Thread.Sleep(200)
+                Console.Write(".")
+            // IsCompleted is also true for faulted tasks; Wait() surfaces the failure
+            // so the marker below is never written for a broken extraction.
+            task.Wait()
+            // Dispose the stream returned by File.Create so the marker file is not left locked.
+            File.Create(flagPath).Dispose()
+            printfn ""
+            printfn "Extracting is complete"
+
+/// Minimal blocking HTTP download helper.
+type Web() =
+    /// Downloads `url` into `destDir`, creating the directory if needed.
+    /// `destFileName` defaults to the last '/'-separated segment of the URL.
+    /// Returns false (and downloads nothing) when the target file already exists,
+    /// true after a successful download. Progress dots are printed while waiting.
+    /// Raises AggregateException (from Task.Wait) if the download fails.
+    /// TODO: make this more idiomatic F#.
+    static member Download(url : string, destDir : string, ?destFileName : string) = 
+        // URLs are always '/'-separated; Path.DirectorySeparatorChar is '\' on Windows
+        // and would yield the whole URL as the file name there.
+        let destFileName = defaultArg destFileName (url.Split('/').Last())
+        Directory.CreateDirectory(destDir) |> ignore
+        let relativeFilePath = Path.Combine(destDir, destFileName)
+        if File.Exists(relativeFilePath) then
+            printfn "%s already exists." destFileName
+            false
+        else 
+            use wc = new WebClient()
+            printfn "Downloading %s" relativeFilePath
+            let download = Task.Run(fun () -> wc.DownloadFile(url, relativeFilePath))
+            while (not download.IsCompleted) do
+                Thread.Sleep(1000)
+                Console.Write(".")
+            printfn ""
+            // IsCompleted is true for faulted tasks too; observe the outcome before
+            // reporting success.
+            try
+                download.Wait()
+            with _ ->
+                // Best effort: drop any partial file so the next call does not
+                // mistake it for a finished download.
+                if File.Exists(relativeFilePath) then File.Delete(relativeFilePath)
+                reraise()
+            printfn "Downloaded %s" relativeFilePath
+            true
+
+
+/// One MNIST split (images plus labels) held in memory, with mini-batch iteration.
+/// On construction the images are reshaped to (shape[0], shape[1] * shape[2]), cast to
+/// `dtype` and multiplied by 1/255; the labels are cast to `dtype`.
+/// NOTE(review): the `reshape` argument is accepted but not consulted — images are always flattened.
+type DataSet(images : NDArray, labels : NDArray, dtype : TF_DataType, reshape : bool) = 
+    let _num_examples = images.shape.[0]
+    let images = images.reshape(images.shape.[0], images.shape.[1] * images.shape.[2])
+    let mutable _images = np.multiply(images.astype(dtype.as_numpy_datatype()), NDArray.op_Implicit(1.0f / 255.f))
+    let mutable _labels = labels.astype(dtype.as_numpy_datatype())
+    let mutable _epochs_completed = 0
+    let mutable _index_in_epoch = 0
+
+    /// Current (possibly shuffled) image matrix, one row per example.
+    member this.Images = _images
+    /// Current (possibly shuffled) labels, row-aligned with `Images`.
+    member this.Labels = _labels
+    /// Number of times `next_batch` has rolled over the end of the data.
+    member this.EpochsCompleted = _epochs_completed
+    /// Position of the next unread example within the current epoch.
+    member this.IndexInEpoch = _index_in_epoch
+    /// Number of examples in this split.
+    member this.NumExamples = _num_examples
+
+    /// Returns the next `(images, labels)` batch.
+    /// `shuffle` (default true) permutes the data before the first batch and at every epoch rollover.
+    /// `fake_data` is accepted for signature compatibility and is not used.
+    /// When fewer than `batch_size` examples remain, the epoch counter is advanced and the
+    /// batch is taken from the start of the new epoch; it then contains only
+    /// `batch_size - remaining` examples (the leftover tail of the old epoch is not included).
+    member this.next_batch(batch_size : int, ?fake_data : bool, ?shuffle : bool) = 
+        let fake_data = defaultArg fake_data false
+        let shuffle = defaultArg shuffle true
+        let start = _index_in_epoch
+        // Apply one random permutation to images and labels so rows stay aligned.
+        let applyShuffle() = 
+            let perm0 = np.arange(_num_examples)
+            np.random.shuffle(perm0)
+            _images <- _images.[perm0]
+            _labels <- _labels.[perm0]
+
+        // Shuffle once before the very first batch.
+        if _epochs_completed = 0 && start = 0 && shuffle then applyShuffle()
+
+        // Go to the next epoch
+        if start + batch_size > _num_examples then
+            // Finished epoch
+            _epochs_completed <- _epochs_completed + 1
+
+            // Number of examples that were still unread in the finished epoch
+            let rest_num_examples = _num_examples - start
+            if shuffle then applyShuffle()
+
+            _index_in_epoch <- batch_size - rest_num_examples
+            let _end = _index_in_epoch
+            let rows = np.arange(0, _end)
+            // The second component must come from the labels (it previously returned the images twice).
+            (_images.[rows], _labels.[rows])
+        else
+            _index_in_epoch <- _index_in_epoch + batch_size
+            let _end = _index_in_epoch
+            (_images.[np.arange(start,_end)],_labels.[np.arange(start,_end)])
+
+
+/// The three MNIST splits bundled together.
+type Datasets =
+    { /// Split used for fitting the model.
+      train : DataSet
+      /// Split held out from the training files for validation.
+      validation : DataSet
+      /// Split built from the t10k test files.
+      test : DataSet }
+
+
+// Re-doing the dataset program
+[<AutoOpen>]
+module Dataset = 
+
+    /// Base URL the MNIST archives are fetched from when no `source_url` is supplied.
+    let DEFAULT_SOURCE_URL = "https://storage.googleapis.com/cvdf-datasets/mnist/"
+    /// Archive name of the training images.
+    let TRAIN_IMAGES = "train-images-idx3-ubyte.gz"
+    /// Archive name of the training labels.
+    let TRAIN_LABELS = "train-labels-idx1-ubyte.gz"
+    /// Archive name of the test images.
+    let TEST_IMAGES = "t10k-images-idx3-ubyte.gz"
+    /// Archive name of the test labels.
+    let TEST_LABELS = "t10k-labels-idx1-ubyte.gz"
+    /// Reads the next four bytes of `bytestream` as a big-endian unsigned 32-bit integer.
+    /// Raises EndOfStreamException when fewer than four bytes are available.
+    let private _read32(bytestream : FileStream) =  
+        let buffer = Array.zeroCreate<byte> (sizeof<uint32>)
+        // Stream.Read may return fewer bytes than requested, so keep reading until the
+        // buffer is full or the stream ends.
+        let mutable filled = 0
+        let mutable atEnd = false
+        while filled < buffer.Length && not atEnd do
+            let n = bytestream.Read(buffer, filled, buffer.Length - filled)
+            if n = 0 then atEnd <- true else filled <- filled + n
+        if filled < buffer.Length then
+            raise (EndOfStreamException(sprintf "Expected %i header bytes but only %i were available" buffer.Length filled))
+        // Assemble the value most-significant byte first (same byte order as the ">u4" dtype).
+        (uint32 buffer.[0] <<< 24) ||| (uint32 buffer.[1] <<< 16) ||| (uint32 buffer.[2] <<< 8) ||| uint32 buffer.[3]
+    /// Converts a vector of byte class labels into a (num_labels x num_classes) matrix
+    /// created with np.zeros, where row i holds 1.0 in the column given by label i.
+    /// Raises ArgumentException when a label is not below `num_classes`.
+    let dense_to_one_hot(labels_dense : NDArray, num_classes : int) =
+        let num_labels = labels_dense.shape.[0]
+        let labels_one_hot = np.zeros(num_labels, num_classes)
+        for row in 0 .. num_labels - 1 do
+            let col = int(labels_dense.Data<byte>(row))
+            // Fail with a clear message instead of writing outside the row.
+            if col >= num_classes then
+                raise (ArgumentException(sprintf "Label %i at row %i is out of range for %i classes" col row num_classes))
+            labels_one_hot.SetData(1.0, row,col)
+        labels_one_hot
+
+    /// Downloads, unpacks and parses the MNIST IDX files into `DataSet` values.
+    type MNistDataset() =
+        /// Fills `buffer` completely from `stream`; raises EndOfStreamException naming
+        /// `file` if the stream ends first. Stream.Read may legitimately return short counts.
+        static member private read_fully(stream : FileStream, buffer : byte[], file : string) =
+            let mutable filled = 0
+            let mutable atEnd = false
+            while filled < buffer.Length && not atEnd do
+                let n = stream.Read(buffer, filled, buffer.Length - filled)
+                if n = 0 then atEnd <- true else filled <- filled + n
+            if filled < buffer.Length then
+                raise <| EndOfStreamException(sprintf "Unexpected end of file in %s: expected %i bytes, got %i" file buffer.Length filled)
+
+        /// Parses an uncompressed MNIST image file and returns a uint8 array of shape
+        /// (num_images, rows, cols, 1). When `limit` is given, at most that many images are read.
+        /// Raises ValueError when the magic number is not 2051.
+        static member extract_images(file : string, ?limit : int) : NDArray =
+            use bytestream = new FileStream(file, FileMode.Open, FileAccess.Read)
+            let magic = _read32(bytestream)
+            if magic <> 2051u then raise <| ValueError(sprintf "Invalid magic number %i in MNIST image file %s" magic file)
+            let declared = int(_read32(bytestream))
+            // Honour the optional cap on the number of examples.
+            let num_images =
+                match limit with
+                | Some n -> max 0 (min n declared)
+                | None -> declared
+            let rows = int(_read32(bytestream))
+            let cols = int(_read32(bytestream))
+            let buf = Array.zeroCreate<byte> (rows * cols * num_images)
+            MNistDataset.read_fully(bytestream, buf, file)
+            let data = np.frombuffer(buf, np.uint8)
+            data.reshape(num_images, rows, cols, 1)
+
+        /// Parses an uncompressed MNIST label file. Returns the uint8 label vector, or its
+        /// one-hot encoding with `num_classes` columns (default 10) when `one_hot` is true.
+        /// When `limit` is given, at most that many labels are read.
+        /// Raises ValueError when the magic number is not 2049.
+        static member extract_labels(file : string, ?one_hot : bool, ?num_classes : int, ?limit : int) : NDArray =
+            let one_hot = defaultArg one_hot false
+            let num_classes = defaultArg num_classes 10
+            use bytestream = new FileStream(file, FileMode.Open, FileAccess.Read)
+            let magic = _read32(bytestream)
+            if magic <> 2049u then raise <| ValueError(sprintf "Invalid magic number %i in MNIST label file %s" magic file)
+            let declared = int(_read32(bytestream))
+            let num_images =
+                match limit with
+                | Some n -> max 0 (min n declared)
+                | None -> declared
+            let buf = Array.zeroCreate<byte> (num_images)
+            MNistDataset.read_fully(bytestream, buf, file)
+            let labels = np.frombuffer(buf, np.uint8)
+            if one_hot then dense_to_one_hot(labels,num_classes)
+            else labels
+
+        /// Ensures the four MNIST archives exist in `train_dir` (downloading from `source_url`
+        /// when missing), unpacks them, and builds the train / validation / test splits.
+        /// The first `validation_size` training examples (default 5000) become the validation
+        /// split; the remaining ones become the training split.
+        /// `train_size` / `test_size` cap how many examples are read from the respective files.
+        /// Raises ArgumentException when `validation_size` is not smaller than `train_size`
+        /// or does not fit the number of training examples actually loaded.
+        static member read_data_sets(train_dir : string, 
+                                     ?one_hot : bool, 
+                                     ?dtype : TF_DataType,
+                                     ?reshape : bool,
+                                     ?validation_size : int,
+                                     ?train_size : int,
+                                     ?test_size : int,
+                                     ?source_url) =
+            let one_hot = defaultArg one_hot false
+            let dtype   = defaultArg dtype TF_DataType.TF_FLOAT
+            let reshape = defaultArg reshape true
+            let validation_size = defaultArg validation_size 5000
+            let source_url = defaultArg source_url DEFAULT_SOURCE_URL
+            train_size |> Option.iter (fun train_size -> 
+                if validation_size >= train_size then raise <| ArgumentException("Validation set should be smaller than training set"))
+            Web.Download(source_url + TRAIN_IMAGES, train_dir, TRAIN_IMAGES) |> ignore
+            Compress.ExtractGZip(Path.Combine(train_dir, TRAIN_IMAGES), train_dir)
+            let train_images = MNistDataset.extract_images(Path.Combine(train_dir, TRAIN_IMAGES.Split('.').[0]), ?limit = train_size)
+
+            Web.Download(source_url + TRAIN_LABELS, train_dir, TRAIN_LABELS) |> ignore
+            Compress.ExtractGZip(Path.Combine(train_dir, TRAIN_LABELS), train_dir)
+            let train_labels = MNistDataset.extract_labels(Path.Combine(train_dir, TRAIN_LABELS.Split('.').[0]), one_hot = one_hot, ?limit = train_size)
+
+            Web.Download(source_url + TEST_IMAGES, train_dir, TEST_IMAGES) |> ignore
+            Compress.ExtractGZip(Path.Combine(train_dir, TEST_IMAGES), train_dir)
+            let test_images = MNistDataset.extract_images(Path.Combine(train_dir, TEST_IMAGES.Split('.').[0]), ?limit = test_size)
+
+            Web.Download(source_url + TEST_LABELS, train_dir, TEST_LABELS) |> ignore
+            Compress.ExtractGZip(Path.Combine(train_dir, TEST_LABELS), train_dir)
+            let test_labels = MNistDataset.extract_labels(Path.Combine(train_dir, TEST_LABELS.Split('.').[0]), one_hot = one_hot, ?limit = test_size)
+
+            let _end = train_images.shape.[0]
+            if validation_size < 0 || validation_size > _end then
+                raise <| ArgumentException(sprintf "Validation size should be between 0 and %i. Received: %i." _end validation_size)
+            // Rows [0, validation_size) form the validation split ...
+            let validation_images = train_images.[np.arange(validation_size)]
+            let validation_labels = train_labels.[np.arange(validation_size)]
+            // ... and rows [validation_size, _end) form the training split, so the two never overlap.
+            let train_images = train_images.[np.arange(validation_size, _end)]
+            let train_labels = train_labels.[np.arange(validation_size, _end)]
+
+            let train = new DataSet(train_images, train_labels, dtype, reshape)
+            let validation = new DataSet(validation_images, validation_labels, dtype, reshape)
+            let test = new DataSet(test_images, test_labels, dtype, reshape)
+            {train = train; validation = validation; test = test}
+
+
+
+
diff --git a/RunTest2/Program.fs b/RunTest2/Program.fs
@@ -141,5 +141,6 @@ let main argv =
     //FFStyle.run("starry_night")
     //FFStyle.run("wave")
     //Classifier.run()
-    NeuralStyleTransferDSL.run()
+    //NeuralStyleTransferDSL.run()
+    let mnist = MNist.Dataset.MNistDataset.read_data_sets("mnist2",one_hot = true, validation_size = 5000)
     0 
diff --git a/RunTest2/RunModels.fsproj b/RunTest2/RunModels.fsproj
@@ -13,12 +13,14 @@
     <PackageReference Include="Google.Protobuf" Version="3.7.0" />
     <PackageReference Include="Ionic.Zlib.Core" Version="1.0.0" />
     <PackageReference Include="HDF.PInvoke.NETStandard" Version="1.10.200" />
+    <PackageReference Include="TensorFlow.NET" Version="0.8.0" />
     <PackageReference Update="FSharp.Core" Version="4.6.2" />
     <PackageReference Include="System.Runtime" Version="4.3.1" />
     <PackageReference Include="System.Runtime.InteropServices" Version="4.3.0" />
   </ItemGroup>
 
   <ItemGroup>
+    <Compile Include="MNist.fs" />
     <Compile Include="NeuralStyleTransferDSL.fs" />
     <Compile Include="..\tests\FFStyleVGG.fs" Link="FFStyleVGG.fs" />
     <None Include="..\..\TensorFlow.NET\src\TensorFlowNET.Core\bin\Debug\netstandard2.0\tensorflow.dll" Link="tensorflow.dll">
@@ -29,7 +31,6 @@
   </ItemGroup>
 
   <ItemGroup>
-    <ProjectReference Include="..\..\TensorFlow.NET\src\TensorFlowNET.Core\TensorFlowNET.Core.csproj" />
     <ProjectReference Include="..\src\TensorFlow.FSharp\TensorFlow.FSharp.fsproj" />
   </ItemGroup>
 

diff --git a/Tensorflow.FSharp.sln b/Tensorflow.FSharp.sln
@@ -13,6 +13,8 @@ Project("{F2A71F9B-5D33-465A-A702-920D77279786}") = "RunModels", "RunTest2\RunMo
 EndProject
 Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "TensorFlowNET.Core", "..\TensorFlow.NET\src\TensorFlowNET.Core\TensorFlowNET.Core.csproj", "{B6E797FD-F117-418C-9FE2-51A538541DE7}"
 EndProject
+Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "TensorFlowNET.Examples", "..\TensorFlow.NET\test\TensorFlowNET.Examples\TensorFlowNET.Examples.csproj", "{B9F05C84-551B-4695-A597-C5F1F01FA992}"
+EndProject
 Global
 	GlobalSection(SolutionConfigurationPlatforms) = preSolution
 		Debug|Any CPU = Debug|Any CPU
@@ -39,6 +41,10 @@ Global
 		{B6E797FD-F117-418C-9FE2-51A538541DE7}.Debug|Any CPU.Build.0 = Debug|Any CPU
 		{B6E797FD-F117-418C-9FE2-51A538541DE7}.Release|Any CPU.ActiveCfg = Release|Any CPU
 		{B6E797FD-F117-418C-9FE2-51A538541DE7}.Release|Any CPU.Build.0 = Release|Any CPU
+		{B9F05C84-551B-4695-A597-C5F1F01FA992}.Debug|Any CPU.ActiveCfg = Debug|Any CPU
+		{B9F05C84-551B-4695-A597-C5F1F01FA992}.Debug|Any CPU.Build.0 = Debug|Any CPU
+		{B9F05C84-551B-4695-A597-C5F1F01FA992}.Release|Any CPU.ActiveCfg = Release|Any CPU
+		{B9F05C84-551B-4695-A597-C5F1F01FA992}.Release|Any CPU.Build.0 = Release|Any CPU
 	EndGlobalSection
 	GlobalSection(SolutionProperties) = preSolution
 		HideSolutionNode = FALSE

diff --git a/src/TensorFlow.FSharp/Tensorflow.FSharp.fsproj b/src/TensorFlow.FSharp/Tensorflow.FSharp.fsproj
@@ -20,6 +20,7 @@
     <PackageReference Include="Google.Protobuf" Version="3.7.0" />
     <PackageReference Include="Ionic.Zlib.Core" Version="1.0.0" />
     <PackageReference Include="HDF.PInvoke.NETStandard" Version="1.10.200" />
+    <PackageReference Include="TensorFlow.NET" Version="0.8.0" />
     <PackageReference Update="FSharp.Core" Version="4.6.2" />
     <PackageReference Include="System.Runtime" Version="4.3.1" />
     <PackageReference Include="System.Runtime.InteropServices" Version="4.3.0" />
@@ -34,9 +35,5 @@
     <Compile Include="FM.fs" />
   </ItemGroup>
 
-  <ItemGroup>
-    <ProjectReference Include="..\..\..\TensorFlow.NET\src\TensorFlowNET.Core\TensorFlowNET.Core.csproj" />
-  </ItemGroup>
-
 </Project>
 
diff --git a/tests/MNist.fsx b/tests/MNist.fsx
@@ -0,0 +1,100 @@
+#I __SOURCE_DIRECTORY__
+#r "netstandard"
+#I "../tests/bin/Debug/net461/"
+#r "TensorFlow.FSharp.dll"
+#r "TensorFlow.Net.dll"
+#r "NumSharp.Core.dll"
+#r "TensorFlow.FSharp.Tests.dll"
+#r "ICSharpCode.SharpZipLib.dll"
+#r "System.IO.Compression.dll"
+#r "System.IO.Compression.FileSystem.dll"
+//#r "System.IO.Compression.Brotli.dll"
+#r "System.IO.Compression.ZipFile.dll"
+#r "System.Runtime.Extensions.dll"
+#load "MNistDataset.fsx"
+
+// TODO needs better random initializers that draw from a normal
+// TODO tf.get_variable is not implemented
+// TODO get_gradient_function Conv2D is not implemented
+// TODO implement dropout
+
+open System
+open System.IO
+open System.IO.Compression
+open System.Net
+open System.Linq
+open System.Threading
+open System.Threading.Tasks
+open Tensorflow
+open Tensorflow.Operations
+open NumSharp
+open ICSharpCode.SharpZipLib.Core
+open ICSharpCode.SharpZipLib.GZip
+open MNistDataset
+
+// Load (downloading if necessary) MNIST into the "mnist2" directory with one-hot labels,
+// reserving 5000 training examples for validation.
+let mnist = MNistDataset.read_data_sets("mnist2",one_hot = true, validation_size = 5000)
+
+// Graph inputs: a batch of flattened images (784 values per row) and the matching
+// 10-column label rows; -1 leaves the batch dimension unspecified.
+let xtr = tf.placeholder(tf.float32, TensorShape(-1, 784))
+let ytr = tf.placeholder(tf.float32, TensorShape(-1, 10))
+
+/// Draws an array of the given shape with np.random.randn and converts it to single precision.
+let getRandom(shape:int[]) = 
+    let samples = np.random.randn(shape)
+    samples.astype(typeof<single>)
+
+/// Two-layer fully connected network: 784 -> 32 (ReLU) -> 10 (sigmoid).
+/// `xtr` is the input tensor; the result is the 10-column output tensor.
+let basicModel(xtr) : Tensor = 
+    let b = tf.Variable(getRandom([|32|]), name = "bias",dtype = TF_DataType.TF_FLOAT)
+    let W = tf.Variable(getRandom([|784;32|]), name = "weight")
+    let res =  gen_ops.relu(tf.matmul(xtr , (W._AsTensor())) + (b._AsTensor()))
+    // Second layer: the graph names now match the roles (they were swapped:
+    // the bias was registered as "weight2" and the weight matrix as "bias2").
+    let b1 = tf.Variable(getRandom([|10|]), name = "bias2",dtype = TF_DataType.TF_FLOAT)
+    let W1 = tf.Variable(getRandom([|32;10|]), name = "weight2")
+    tf.sigmoid(tf.matmul(res, (W1._AsTensor())) + (b1._AsTensor()))
+
+
+/// Convolutional network over 28x28x1 inputs in NHWC layout:
+/// two 5x5 convolutions with stride 2 and SAME padding (32 then 64 filters, each followed by ReLU),
+/// a 1024-unit dense layer with ReLU, and a 10-unit dense layer with ReLU.
+let cnnModel(xtr) : Tensor= 
+    // Restore the image layout from the flattened rows.
+    let image = gen_ops.reshape(xtr,tf.constant([|-1;28;28;1|]))
+    let c1f = tf.Variable(getRandom([|5;5;1;32|]),name = "c1f")
+    let conv1 = gen_ops.relu(gen_ops.conv2d(image,c1f._AsTensor(),[|1;2;2;1|],"SAME",data_format="NHWC"))
+    let c2f = tf.Variable(getRandom([|5;5;32;64|]),name = "c2f")
+    let conv2 = gen_ops.relu(gen_ops.conv2d(conv1,c2f._AsTensor(),[|1;2;2;1|],"SAME",data_format="NHWC"))
+    // Flatten the feature maps for the dense layers.
+    let flat = tf.reshape(conv2,[|-1;7*7*64|])
+    let denseW = tf.Variable(getRandom([|7*7*64;1024|]), name = "weight1")
+    let denseB = tf.Variable(getRandom([|1024|]), name = "bias1")
+    let hidden = gen_ops.relu(tf.matmul(flat, (denseW._AsTensor())) + (denseB._AsTensor()))
+    let outW = tf.Variable(getRandom([|1024;10|]), name = "weight2")
+    let outB = tf.Variable(getRandom([|10|]), name = "bias2")
+    gen_ops.relu(tf.matmul(hidden, (outW._AsTensor())) + (outB._AsTensor()))
+
+
+// Upper bound of the batch loop inside `train` (the loop runs from 0 to this value inclusive).
+let batches = 1000
+// Progress is evaluated and printed every `display_step` batches.
+let display_step = 100
+
+/// Wraps every (key, value) pair of `xs` in a FeedItem and returns them as an array.
+let toItems(xs : ('a*'b) seq) =
+    xs
+    |> Seq.map (fun (key, value) -> FeedItem(key, value))
+    |> Seq.toArray
+
+// Build the model graph on the image placeholder; swap the commented line in to use the CNN instead.
+let output = basicModel(xtr)
+//let output = cnnModel(xtr)
+
+let sess = tf.Session()
+
+// Loss is the first element of the softmax-cross-entropy op's result tuple,
+// computed from the model output and the label placeholder.
+let (loss,_) = gen_ops.softmax_cross_entropy_with_logits(output,ytr).ToTuple()
+// Gradient-descent training op with learning rate 0.1.
+let optimizer = tf.train.GradientDescentOptimizer(0.1f).minimize(loss)
+// Run the global variable initializer once before training.
+let init = tf.global_variables_initializer()
+sess.run(init)
+
+/// Runs the batch loop (indices 0 .. batches inclusive): each step fetches a 64-example
+/// batch and runs `optimizer` on it. Every `display_step` steps it evaluates `res` on the
+/// test images and prints the batch cost and the test accuracy.
+let train(res,loss,optimizer,batches,display_step) =
+    // Fraction of rows whose arg-max column index is the same in both arrays.
+    let getAccuracy(xs : NDArray,ys : NDArray) = 
+        let hits =
+            Seq.zip (np.argmax(xs,1).Data<int32>()) (np.argmax(ys,1).Data<int32>())
+            |> Seq.filter (fun (expected, predicted) -> expected = predicted)
+            |> Seq.length
+        (float hits / float xs.shape.[0])
+    for epoch in 0 .. batches do
+        let (x,y) = mnist.train.next_batch(64)
+        // next_batch can hand back a batch of unexpected shape (observed: y as [|4;784|]);
+        // such batches are skipped.
+        if y.shape = [|64;10|] then
+            let feed = [(xtr,x);(ytr,y)] |> toItems
+            sess.run(optimizer,feed) |> ignore
+            let step = epoch + 1
+            if step % display_step = 0 then
+                let ts = sess.run(res,FeedItem(xtr,mnist.test.Images))
+                let accuracy = getAccuracy(mnist.test.Labels, ts)
+                let c = sess.run(loss,feed)
+                printfn "Batch: %i cost=%f accuracy =%f " step (c.Data<float32>().[0]) accuracy
+
+// Repeat the whole batch loop 11 times (0..10 is inclusive) on the same graph and session.
+for _ in 0..10 do
+    train(output,loss,optimizer,batches,display_step)