-- Copyright 2016 TensorFlow authors.
--
-- Licensed under the Apache License, Version 2.0 (the "License");
-- you may not use this file except in compliance with the License.
-- You may obtain a copy of the License at
--
--     http://www.apache.org/licenses/LICENSE-2.0
--
-- Unless required by applicable law or agreed to in writing, software
-- distributed under the License is distributed on an "AS IS" BASIS,
-- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-- See the License for the specific language governing permissions and
-- limitations under the License.
|
|
|
{-# LANGUAGE ConstraintKinds #-}
|
|
|
|
{-# LANGUAGE DataKinds #-}
|
2016-11-29 06:15:09 +01:00
|
|
|
{-# LANGUAGE FlexibleContexts #-}
|
2016-10-24 21:26:42 +02:00
|
|
|
{-# LANGUAGE NoMonomorphismRestriction #-}
|
|
|
|
{-# LANGUAGE OverloadedStrings #-}
|
|
|
|
{-# LANGUAGE RankNTypes #-}
|
|
|
|
|
|
|
|
-- | Parallel lookups on the list of tensors.
|
|
|
|
module TensorFlow.EmbeddingOps where
|
|
|
|
|
|
|
|
import Control.Monad (zipWithM)
|
|
|
|
import Data.Int (Int32, Int64)
|
2017-04-07 00:10:33 +02:00
|
|
|
import TensorFlow.Build (MonadBuild)
|
2016-11-18 19:42:02 +01:00
|
|
|
import TensorFlow.Ops (shape, vector) -- Also Num instance for Tensor
|
2017-04-07 00:10:33 +02:00
|
|
|
import TensorFlow.Tensor (Tensor, Value, Rendered, colocateWith, render)
|
2016-10-24 21:26:42 +02:00
|
|
|
import TensorFlow.Types (OneOf, TensorType)
|
|
|
|
import qualified TensorFlow.GenOps.Core as CoreOps
|
|
|
|
|
|
|
|
-- | Looks up `ids` in a list of embedding tensors.
--
-- Performs parallel lookups on the list of tensors in `params`. It is
-- a generalization of `TF.gather`, in which `params` is interpreted
-- as a partitioning of a larger embedding tensor.
--
-- The partition strategy is "mod": each id is assigned to partition
-- `p = id % len(params)`. For instance, 13 ids are split across 5
-- partitions as:
-- `[[0, 5, 10], [1, 6, 11], [2, 7, 12], [3, 8], [4, 9]]`
--
-- The results of the lookup are concatenated into a dense tensor
-- with shape `shape(ids) + shape(params)[1:]`.
embeddingLookup :: forall a b v1 v2 m .
                   ( MonadBuild m
                   , Rendered (Tensor v1)
                   , TensorType a
                   , OneOf '[Int64, Int32] b
                   , Num b
                   )
                => [Tensor v1 a]
                -- ^ A list of tensors which can be concatenated along
                -- dimension 0. Each `Tensor` must be appropriately
                -- sized for `mod` partition strategy.
                -> Tensor v2 b
                -- ^ A `Tensor` with type `int32` or `int64`
                -- containing the ids to be looked up in `params`.
                -- The ids are required to have fewer than 2^31
                -- entries.
                -> m (Tensor Value a)
                -- ^ A dense tensor with shape `shape(ids) + shape(params)[1:]`.
-- Fast path: with a single shard there is nothing to partition.
embeddingLookup [single] ids =
    colocateWith single $ render (CoreOps.gather single ids)
embeddingLookup params@(first : _) ids = do
    -- One gather per shard, each colocated with the shard it reads.
    shardResults <- zipWithM
        (\shard ix -> colocateWith shard (render (CoreOps.gather shard ix)))
        params idsPerShard
    -- Stitch the per-shard rows back into the original (flat) id order.
    let flatResult = CoreOps.dynamicStitch positionsPerShard shardResults
    -- Shape restoration is not as optimal as it would be with client
    -- side shape tracking.
    shardShape <- colocateWith first (render (shape first))
    let trailingDims = CoreOps.slice shardShape (scalarVec 1) (scalarVec (-1))
        resultShape = CoreOps.concat 0 [shape ids, trailingDims]
    render (CoreOps.reshape flatResult resultShape)
  where
    -- Avoids genericLength here which would be evaluated by TF.
    -- NOTE: used at two types (scalar attribute and graph constant),
    -- which relies on NoMonomorphismRestriction.
    numShards = fromIntegral (length params)
    idsFlat = CoreOps.reshape ids (scalarVec (-1))
    -- Which shard each id lives in, under the "mod" strategy.
    shardAssignments = CoreOps.cast (idsFlat `CoreOps.mod` numShards)
    -- The row index of each id within its own shard.
    idsWithinShard = idsFlat `CoreOps.div` numShards
    flatPositions = CoreOps.range 0 (CoreOps.size idsFlat) 1
    -- Partition the ids (and, in parallel, their original flat
    -- positions) into numShards separate lists.
    idsPerShard = CoreOps.dynamicPartition numShards idsWithinShard shardAssignments
    positionsPerShard = CoreOps.dynamicPartition numShards flatPositions shardAssignments
    scalarVec i = vector [i :: Int32]
embeddingLookup [] _ = error "embeddingLookup requires params to be non empty"
|