Starting NN library (#11)

* Starting NN library - Added "sigmoidCrossEntropyWithLogits" - Ported across a single test
2025-05-09 05:46:44 +02:00 · 2016-10-28 12:05:27 +11:00 · 2016-10-28 12:05:27 +11:00 · b2795d7518
commit b2795d7518
parent 03a3a6d086
5 changed files with 254 additions and 0 deletions
--- a/stack.yaml
+++ b/stack.yaml
@ -10,6 +10,7 @@ packages:
 - tensorflow-mnist
 - tensorflow-mnist-input-data
 - tensorflow-queue
+- tensorflow-nn

 extra-deps:
 # proto-lens is not yet in Stackage.
--- a/tensorflow-nn/Setup.hs
+++ b/tensorflow-nn/Setup.hs
@ -0,0 +1,3 @@
+import Distribution.Simple
+
+main = defaultMain
--- a/tensorflow-nn/src/TensorFlow/NN.hs
+++ b/tensorflow-nn/src/TensorFlow/NN.hs
@ -0,0 +1,87 @@
+-- Copyright 2016 TensorFlow authors.
+--
+-- Licensed under the Apache License, Version 2.0 (the "License");
+-- you may not use this file except in compliance with the License.
+-- You may obtain a copy of the License at
+--
+--     http://www.apache.org/licenses/LICENSE-2.0
+--
+-- Unless required by applicable law or agreed to in writing, software
+-- distributed under the License is distributed on an "AS IS" BASIS,
+-- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+-- See the License for the specific language governing permissions and
+-- limitations under the License.
+
+{-# LANGUAGE DataKinds #-}
+{-# LANGUAGE OverloadedStrings #-}
+
+module TensorFlow.NN
+    ( sigmoidCrossEntropyWithLogits
+    ) where
+
+import Prelude hiding           ( log
+                                , exp
+                                )
+import TensorFlow.Build         ( Build(..)
+                                , render
+                                , withNameScope
+                                )
+import TensorFlow.GenOps.Core   ( greaterEqual
+                                , select
+                                , log
+                                , exp
+                                )
+import TensorFlow.Tensor        ( Tensor(..)
+                                , Value(..)
+                                )
+import TensorFlow.Types         ( TensorType(..)
+                                , OneOf
+                                )
+import TensorFlow.Ops           ( zerosLike
+                                , add
+                                )
+
+-- | Computes sigmoid cross entropy given `logits`.
+--
+-- Measures the probability error in discrete classification tasks in which each
+-- class is independent and not mutually exclusive.  For instance, one could
+-- perform multilabel classification where a picture can contain both an elephant
+-- and a dog at the same time.
+--
+-- For brevity, let `x = logits`, `z = targets`.  The logistic loss is
+--
+--        z * -log(sigmoid(x)) + (1 - z) * -log(1 - sigmoid(x))
+--      = z * -log(1 / (1 + exp(-x))) + (1 - z) * -log(exp(-x) / (1 + exp(-x)))
+--      = z * log(1 + exp(-x)) + (1 - z) * (-log(exp(-x)) + log(1 + exp(-x)))
+--      = z * log(1 + exp(-x)) + (1 - z) * (x + log(1 + exp(-x))
+--      = (1 - z) * x + log(1 + exp(-x))
+--      = x - x * z + log(1 + exp(-x))
+--
+--  For x < 0, to avoid overflow in exp(-x), we reformulate the above
+--
+--        x - x * z + log(1 + exp(-x))
+--      = log(exp(x)) - x * z + log(1 + exp(-x))
+--      = - x * z + log(1 + exp(x))
+--
+--  Hence, to ensure stability and avoid overflow, the implementation uses this
+--  equivalent formulation
+--
+--      max(x, 0) - x * z + log(1 + exp(-abs(x)))
+--
+--  `logits` and `targets` must have the same type and shape.
+sigmoidCrossEntropyWithLogits
+  :: (OneOf '[Float, Double] a, TensorType a, Num a)
+     => Tensor Value a          -- ^ __logits__
+     -> Tensor Value a          -- ^ __targets__
+     -> Build (Tensor Value a)
+sigmoidCrossEntropyWithLogits logits targets = do
+    logits' <- render logits
+    targets' <- render targets
+    let zeros = zerosLike logits'
+        cond = logits' `greaterEqual` zeros
+        relu_logits = select cond logits' zeros
+        neg_abs_logits = select cond (-logits') logits'
+    withNameScope "logistic_loss" $ do
+        left  <- render $ relu_logits - logits' * targets'
+        right <- render $ log (1 + exp neg_abs_logits)
+        withNameScope "sigmoid_add" $ render $ left `add` right
--- a/tensorflow-nn/tensorflow-nn.cabal
+++ b/tensorflow-nn/tensorflow-nn.cabal
@ -0,0 +1,44 @@
+name:                tensorflow-nn
+version:             0.1.0.0
+synopsis:            Friendly layer around TensorFlow bindings.
+description:         Please see README.md
+homepage:            https://github.com/tensorflow/haskell#readme
+license:             Apache
+author:              TensorFlow authors
+maintainer:          tensorflow-haskell@googlegroups.com
+copyright:           Google Inc.
+category:            Machine Learning
+build-type:          Simple
+cabal-version:       >=1.22
+
+library
+  hs-source-dirs:   src
+  exposed-modules: TensorFlow.NN
+  build-depends:  base >= 4.7 && < 5
+                , tensorflow-core-ops == 0.1.*
+                , tensorflow == 0.1.*
+                , tensorflow-ops == 0.1.*
+  default-language:    Haskell2010
+
+
+Test-Suite NNTest
+  default-language: Haskell2010
+  type: exitcode-stdio-1.0
+  main-is: NNTest.hs
+  hs-source-dirs: tests
+  build-depends: HUnit
+               , QuickCheck
+               , base
+               , tensorflow
+               , tensorflow-ops
+               , tensorflow-nn
+               , google-shim
+               , test-framework
+               , test-framework-hunit
+               , test-framework-quickcheck2
+               , vector
+
+
+source-repository head
+  type:     git
+  location: https://github.com/tensorflow/haskell
--- a/tensorflow-nn/tests/NNTest.hs
+++ b/tensorflow-nn/tests/NNTest.hs
@ -0,0 +1,119 @@
+-- Copyright 2016 TensorFlow authors.
+--
+-- Licensed under the Apache License, Version 2.0 (the "License");
+-- you may not use this file except in compliance with the License.
+-- You may obtain a copy of the License at
+--
+--     http://www.apache.org/licenses/LICENSE-2.0
+--
+-- Unless required by applicable law or agreed to in writing, software
+-- distributed under the License is distributed on an "AS IS" BASIS,
+-- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+-- See the License for the specific language governing permissions and
+-- limitations under the License.
+
+{-# LANGUAGE OverloadedLists #-}
+{-# LANGUAGE OverloadedStrings #-}
+{-# LANGUAGE NoMonomorphismRestriction #-}
+{-# LANGUAGE FlexibleInstances #-}
+{-# LANGUAGE FlexibleContexts #-}
+
+module Main where
+
+import           Data.Maybe                         (fromMaybe)
+import           Google.Test                        (googleTest)
+import           Test.Framework.Providers.HUnit     (testCase)
+import           Test.HUnit                         ((@?))
+import           Test.HUnit.Lang                    (Assertion(..))
+import qualified Data.Vector                        as V
+import qualified TensorFlow.Build                   as TF
+import qualified TensorFlow.Gradient                as TF
+import qualified TensorFlow.NN                      as TF
+import qualified TensorFlow.Ops                     as TF
+import qualified TensorFlow.Session                 as TF
+import qualified TensorFlow.Tensor                  as TF
+import qualified TensorFlow.Types                   as TF
+
+-- | These tests are ported from:
+--
+--      <tensorflow>/tensorflow/python/ops/nn_xent_tests.py
+--
+-- This is the implementation we use to check the implementation we
+-- wrote in `TensorFlow.NN.sigmoidCrossEntropyWithLogits`.
+--
+sigmoidXentWithLogits :: Floating a => Ord a => [a] -> [a] -> [a]
+sigmoidXentWithLogits logits' targets' =
+    let sig  = map (\x -> 1 / (1 + exp (-x))) logits'
+        eps  = 0.0001
+        pred = map (\p -> min (max p eps) (1 - eps)) sig
+        xent y z = (-z) * (log y) - (1 - z) * log (1 - y)
+     in zipWith xent pred targets'
+
+
+data Inputs = Inputs {
+      logits  :: [Float]
+    , targets :: [Float]
+    }
+
+
+defInputs :: Inputs
+defInputs = Inputs {
+      logits    = [-100, -2, -2, 0, 2, 2,   2, 100]
+    , targets   = [   0,  0,  1, 0, 0, 1, 0.5,   1]
+    }
+
+
+assertAllClose :: V.Vector Float -> V.Vector Float -> Assertion
+assertAllClose xs ys = all (<= tol) (V.zipWith absDiff xs ys) @?
+    ("Difference > tolerance: \nxs: " ++ show xs ++ "\nys: " ++ show ys
+        ++ "\ntolerance: " ++ show tol)
+  where
+      absDiff x y = abs (x - y)
+      tol = 0.001 :: Float
+
+
+testLogisticOutput = testCase "testLogisticOutput" $ do
+    let inputs     = defInputs
+        vLogits    = TF.vector $ logits  inputs
+        vTargets   = TF.vector $ targets inputs
+        tfLoss     = TF.sigmoidCrossEntropyWithLogits vLogits vTargets
+        ourLoss    = V.fromList $ sigmoidXentWithLogits (logits inputs) (targets inputs)
+    
+    r <- run tfLoss
+    assertAllClose r ourLoss
+
+
+testLogisticOutputMultipleDim =
+        testCase "testLogisticOutputMultipleDim" $ do
+    let inputs   = defInputs 
+        shape    = [2, 2, 2]
+        vLogits  = TF.constant shape (logits  inputs)
+        vTargets = TF.constant shape (targets inputs)
+        tfLoss   = TF.sigmoidCrossEntropyWithLogits vLogits vTargets
+        ourLoss  = V.fromList $ sigmoidXentWithLogits (logits inputs) (targets inputs)
+    
+    r <- run tfLoss
+    assertAllClose r ourLoss
+
+
+testGradientAtZero = testCase "testGradientAtZero" $ do
+    let inputs   = defInputs { logits = [0, 0], targets = [0, 1] }
+        vLogits  = TF.vector $ logits  inputs
+        vTargets = TF.vector $ targets inputs
+        tfLoss   = TF.sigmoidCrossEntropyWithLogits vLogits vTargets
+    
+    r <- run $ do
+        l <- tfLoss
+        TF.gradients l [vLogits]
+
+    assertAllClose (head r) (V.fromList [0.5, -0.5])
+
+
+run = TF.runSession . TF.buildAnd TF.run
+
+
+main :: IO ()
+main = googleTest [ testLogisticOutput
+                  , testLogisticOutputMultipleDim
+                  , testGradientAtZero
+                  ]