···11+# Revision history for hmm-haskell
22+33+## 0.1.0.0 -- YYYY-mm-dd
44+55+* First version. Released on an unsuspecting world.
+202
LICENSE
···11+22+ Apache License
33+ Version 2.0, January 2004
44+ http://www.apache.org/licenses/
55+66+ TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
77+88+ 1. Definitions.
99+1010+ "License" shall mean the terms and conditions for use, reproduction,
1111+ and distribution as defined by Sections 1 through 9 of this document.
1212+1313+ "Licensor" shall mean the copyright owner or entity authorized by
1414+ the copyright owner that is granting the License.
1515+1616+ "Legal Entity" shall mean the union of the acting entity and all
1717+ other entities that control, are controlled by, or are under common
1818+ control with that entity. For the purposes of this definition,
1919+ "control" means (i) the power, direct or indirect, to cause the
2020+ direction or management of such entity, whether by contract or
2121+ otherwise, or (ii) ownership of fifty percent (50%) or more of the
2222+ outstanding shares, or (iii) beneficial ownership of such entity.
2323+2424+ "You" (or "Your") shall mean an individual or Legal Entity
2525+ exercising permissions granted by this License.
2626+2727+ "Source" form shall mean the preferred form for making modifications,
2828+ including but not limited to software source code, documentation
2929+ source, and configuration files.
3030+3131+ "Object" form shall mean any form resulting from mechanical
3232+ transformation or translation of a Source form, including but
3333+ not limited to compiled object code, generated documentation,
3434+ and conversions to other media types.
3535+3636+ "Work" shall mean the work of authorship, whether in Source or
3737+ Object form, made available under the License, as indicated by a
3838+ copyright notice that is included in or attached to the work
3939+ (an example is provided in the Appendix below).
4040+4141+ "Derivative Works" shall mean any work, whether in Source or Object
4242+ form, that is based on (or derived from) the Work and for which the
4343+ editorial revisions, annotations, elaborations, or other modifications
4444+ represent, as a whole, an original work of authorship. For the purposes
4545+ of this License, Derivative Works shall not include works that remain
4646+ separable from, or merely link (or bind by name) to the interfaces of,
4747+ the Work and Derivative Works thereof.
4848+4949+ "Contribution" shall mean any work of authorship, including
5050+ the original version of the Work and any modifications or additions
5151+ to that Work or Derivative Works thereof, that is intentionally
5252+ submitted to Licensor for inclusion in the Work by the copyright owner
5353+ or by an individual or Legal Entity authorized to submit on behalf of
5454+ the copyright owner. For the purposes of this definition, "submitted"
5555+ means any form of electronic, verbal, or written communication sent
5656+ to the Licensor or its representatives, including but not limited to
5757+ communication on electronic mailing lists, source code control systems,
5858+ and issue tracking systems that are managed by, or on behalf of, the
5959+ Licensor for the purpose of discussing and improving the Work, but
6060+ excluding communication that is conspicuously marked or otherwise
6161+ designated in writing by the copyright owner as "Not a Contribution."
6262+6363+ "Contributor" shall mean Licensor and any individual or Legal Entity
6464+ on behalf of whom a Contribution has been received by Licensor and
6565+ subsequently incorporated within the Work.
6666+6767+ 2. Grant of Copyright License. Subject to the terms and conditions of
6868+ this License, each Contributor hereby grants to You a perpetual,
6969+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
7070+ copyright license to reproduce, prepare Derivative Works of,
7171+ publicly display, publicly perform, sublicense, and distribute the
7272+ Work and such Derivative Works in Source or Object form.
7373+7474+ 3. Grant of Patent License. Subject to the terms and conditions of
7575+ this License, each Contributor hereby grants to You a perpetual,
7676+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
7777+ (except as stated in this section) patent license to make, have made,
7878+ use, offer to sell, sell, import, and otherwise transfer the Work,
7979+ where such license applies only to those patent claims licensable
8080+ by such Contributor that are necessarily infringed by their
8181+ Contribution(s) alone or by combination of their Contribution(s)
8282+ with the Work to which such Contribution(s) was submitted. If You
8383+ institute patent litigation against any entity (including a
8484+ cross-claim or counterclaim in a lawsuit) alleging that the Work
8585+ or a Contribution incorporated within the Work constitutes direct
8686+ or contributory patent infringement, then any patent licenses
8787+ granted to You under this License for that Work shall terminate
8888+ as of the date such litigation is filed.
8989+9090+ 4. Redistribution. You may reproduce and distribute copies of the
9191+ Work or Derivative Works thereof in any medium, with or without
9292+ modifications, and in Source or Object form, provided that You
9393+ meet the following conditions:
9494+9595+ (a) You must give any other recipients of the Work or
9696+ Derivative Works a copy of this License; and
9797+9898+ (b) You must cause any modified files to carry prominent notices
9999+ stating that You changed the files; and
100100+101101+ (c) You must retain, in the Source form of any Derivative Works
102102+ that You distribute, all copyright, patent, trademark, and
103103+ attribution notices from the Source form of the Work,
104104+ excluding those notices that do not pertain to any part of
105105+ the Derivative Works; and
106106+107107+ (d) If the Work includes a "NOTICE" text file as part of its
108108+ distribution, then any Derivative Works that You distribute must
109109+ include a readable copy of the attribution notices contained
110110+ within such NOTICE file, excluding those notices that do not
111111+ pertain to any part of the Derivative Works, in at least one
112112+ of the following places: within a NOTICE text file distributed
113113+ as part of the Derivative Works; within the Source form or
114114+ documentation, if provided along with the Derivative Works; or,
115115+ within a display generated by the Derivative Works, if and
116116+ wherever such third-party notices normally appear. The contents
117117+ of the NOTICE file are for informational purposes only and
118118+ do not modify the License. You may add Your own attribution
119119+ notices within Derivative Works that You distribute, alongside
120120+ or as an addendum to the NOTICE text from the Work, provided
121121+ that such additional attribution notices cannot be construed
122122+ as modifying the License.
123123+124124+ You may add Your own copyright statement to Your modifications and
125125+ may provide additional or different license terms and conditions
126126+ for use, reproduction, or distribution of Your modifications, or
127127+ for any such Derivative Works as a whole, provided Your use,
128128+ reproduction, and distribution of the Work otherwise complies with
129129+ the conditions stated in this License.
130130+131131+ 5. Submission of Contributions. Unless You explicitly state otherwise,
132132+ any Contribution intentionally submitted for inclusion in the Work
133133+ by You to the Licensor shall be under the terms and conditions of
134134+ this License, without any additional terms or conditions.
135135+ Notwithstanding the above, nothing herein shall supersede or modify
136136+ the terms of any separate license agreement you may have executed
137137+ with Licensor regarding such Contributions.
138138+139139+ 6. Trademarks. This License does not grant permission to use the trade
140140+ names, trademarks, service marks, or product names of the Licensor,
141141+ except as required for reasonable and customary use in describing the
142142+ origin of the Work and reproducing the content of the NOTICE file.
143143+144144+ 7. Disclaimer of Warranty. Unless required by applicable law or
145145+ agreed to in writing, Licensor provides the Work (and each
146146+ Contributor provides its Contributions) on an "AS IS" BASIS,
147147+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
148148+ implied, including, without limitation, any warranties or conditions
149149+ of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
150150+ PARTICULAR PURPOSE. You are solely responsible for determining the
151151+ appropriateness of using or redistributing the Work and assume any
152152+ risks associated with Your exercise of permissions under this License.
153153+154154+ 8. Limitation of Liability. In no event and under no legal theory,
155155+ whether in tort (including negligence), contract, or otherwise,
156156+ unless required by applicable law (such as deliberate and grossly
157157+ negligent acts) or agreed to in writing, shall any Contributor be
158158+ liable to You for damages, including any direct, indirect, special,
159159+ incidental, or consequential damages of any character arising as a
160160+ result of this License or out of the use or inability to use the
161161+ Work (including but not limited to damages for loss of goodwill,
162162+ work stoppage, computer failure or malfunction, or any and all
163163+ other commercial damages or losses), even if such Contributor
164164+ has been advised of the possibility of such damages.
165165+166166+ 9. Accepting Warranty or Additional Liability. While redistributing
167167+ the Work or Derivative Works thereof, You may choose to offer,
168168+ and charge a fee for, acceptance of support, warranty, indemnity,
169169+ or other liability obligations and/or rights consistent with this
170170+ License. However, in accepting such obligations, You may act only
171171+ on Your own behalf and on Your sole responsibility, not on behalf
172172+ of any other Contributor, and only if You agree to indemnify,
173173+ defend, and hold each Contributor harmless for any liability
174174+ incurred by, or claims asserted against, such Contributor by reason
175175+ of your accepting any such warranty or additional liability.
176176+177177+ END OF TERMS AND CONDITIONS
178178+179179+ APPENDIX: How to apply the Apache License to your work.
180180+181181+ To apply the Apache License to your work, attach the following
182182+ boilerplate notice, with the fields enclosed by brackets "[]"
183183+ replaced with your own identifying information. (Don't include
184184+ the brackets!) The text should be enclosed in the appropriate
185185+ comment syntax for the file format. We also recommend that a
186186+ file or class name and description of purpose be included on the
187187+ same "printed page" as the copyright notice for easier
188188+ identification within third-party archives.
189189+190190+ Copyright [yyyy] [name of copyright owner]
191191+192192+ Licensed under the Apache License, Version 2.0 (the "License");
193193+ you may not use this file except in compliance with the License.
194194+ You may obtain a copy of the License at
195195+196196+ http://www.apache.org/licenses/LICENSE-2.0
197197+198198+ Unless required by applicable law or agreed to in writing, software
199199+ distributed under the License is distributed on an "AS IS" BASIS,
200200+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
201201+ See the License for the specific language governing permissions and
202202+ limitations under the License.
+1
README.md
···11+Haskell implementation of Hidden Markov Models & related algorithms from AIMA book
···11+{-# LANGUAGE DataKinds #-}
22+{-# LANGUAGE KindSignatures #-}
33+{-# LANGUAGE ScopedTypeVariables #-}
44+{-# LANGUAGE TemplateHaskell #-}
55+{-# LANGUAGE TypeOperators #-}
66+module HMM where
77+88+-- import Prelude (undefined)
99+-- import System.IO (print)
1010+import Text.Printf (printf)
1111+1212+import Papa
1313+import GHC.TypeNats
1414+import Data.Proxy (Proxy(..))
1515+1616+import Control.Monad.State (State, runState)
1717+import Control.Monad.Trans.Maybe (MaybeT, runMaybeT)
1818+1919+import qualified Data.Vector as Vec
2020+2121+import Linear.V
2222+import Linear
2323+2424+import qualified Numeric.LinearAlgebra.Static as HM
2525+import qualified Numeric.LinearAlgebra as HMat
2626+-----------------------------------------------------------------------------------
2727+2828+-- | Type synonyms
2929+type R = Double
3030+type TransitionModel (s :: Nat) a = V s (V s a)
3131+type SensorDiagonal (s :: Nat) a = V s (V s a)
3232+type SensorModel (t :: Nat) (s :: Nat) a = V t (SensorDiagonal s a)
3333+type Message (s :: Nat) a = V s (V 1 a)
3434+type Distribution (s :: Nat) a = V s a
3535+3636+-- | Utility Functions
3737+3838+-- | Multiply each number by a constant such that the sum is 1.0
3939+4040+normalise :: (Fractional a, Foldable f, Functor f) => f a -> f a
4141+normalise xs | null xs = xs
4242+ | otherwise =
4343+ let
4444+ s = sum xs
4545+ in
4646+ (/ s) <$> xs
4747+4848+toHM :: (KnownNat s, KnownNat t) => V s (V t R) -> HM.L s t
4949+toHM = HM.matrix . foldMap (Vec.toList . toVector)
5050+5151+fromHM :: (KnownNat s, KnownNat t) => HM.L s t -> V s (V t R)
5252+fromHM m = V $ V <$> Vec.fromList (fmap Vec.fromList $ HMat.toLists $ HM.extract m)
5353+5454+inverse :: forall s. (KnownNat s) => V s (V s R) -> V s (V s R)
5555+inverse = fromHM . HM.inv . toHM
5656+5757+reverseV :: forall s a. (KnownNat s) => V s a -> V s a
5858+reverseV = V . Vec.fromList . Papa.reverse . toList
5959+6060+extract1 :: (KnownNat s) => V s (V 1 a) -> V s a
6161+extract1 = V . foldMap toVector
6262+6363+infix 8 !**!
6464+(!**!) :: (KnownNat m, KnownNat n) => V m (V n R) -> V m (V n R) -> V m (V n R)
6565+as !**! bs = fromHM $ toHM as * toHM bs
6666+6767+unitColumn :: forall s. KnownNat s => Message s R
6868+unitColumn = V $ Vec.replicate (fromIntegral $ natVal (Proxy :: Proxy s)) (toV $ V1 1.0)
6969+7070+7171+-- | Hidden Markov Models
7272+7373+data HMM (s :: Nat) (t :: Nat) a b = HMM {
7474+ -- prior distribution which is used as initial forward message
7575+ _prior :: Message s a,
7676+ -- transition model with `s` states as `sxs` matrix
7777+ _tModel :: TransitionModel s a,
7878+ -- evidence value vector, each index maps to the corresponding evidence values
7979+ _sDist :: V t b,
8080+ -- sensor model with `t` evidence values having `sxs` diagonal matrix capturing their ditributions for each state `s`
8181+ _sModel :: SensorModel t s a
8282+ } deriving (Show)
8383+makeLenses ''HMM
8484+8585+8686+-- | Smart HMM constructors
8787+8888+-- | Make HMM
8989+-- `mp :: Maybe (Message s a)` -- Prior distribution on the initial state, `P(X0)`. If nothing then considered `(0.5,0.5)`
9090+-- `xs :: TransitionModel s a` -- Transition Model as `sxs` matrix, `s` being the number of states
9191+-- `evs :: V t b` - evidence values vector map
9292+-- `es :: V t (V s a)` -- a `txs` matrix for each evidence value `t`, a vector capturing conditional probabilities for each state `s`
9393+mkHMM_ :: (KnownNat s, KnownNat t) => Maybe (Message s R) -> TransitionModel s R -> V t b -> V t (V s R) -> HMM s t R b
9494+mkHMM_ mp xs evs = let p = fromMaybe (V $ Vec.replicate (dim xs) 0.5) mp
9595+ in
9696+ HMM p xs evs . (scaled <$>)
9797+9898+-- | A default HMM where both transition model states and evidence variables have boolean support
9999+mkHMM :: KnownNat s => TransitionModel s R -> V 2 (V s R) -> HMM s 2 R Bool
100100+mkHMM ts = mkHMM_ Nothing ts (V $ Vec.fromList [True, False])
101101+102102+-- | A default HMM with one state variable having boolean support
103103+mkHMM1 :: V2 (V2 R) -> V2 (V2 R) -> HMM 2 2 R Bool
104104+mkHMM1 ts ss = let f = (_V #) . over mapped toV
105105+ in
106106+ uncurry mkHMM $ over both f (ts , ss)
107107+108108+sensorDiagonal :: (KnownNat s, KnownNat t, Eq b) => HMM s t a b -> b -> Maybe (SensorDiagonal s a)
109109+sensorDiagonal hmm e = findIndexOf (sDist.folded) (== e) hmm >>= (\i -> hmm ^? sModel . ix i)
110110+111111+-- | Fixed Lag Smoothing
112112+113113+-- | Persistent State
114114+data Persistent (s :: Nat) a b d= Persistent {
115115+ _t :: d,
116116+ _f_msg :: Message s a,
117117+ _b :: V s (V s a),
118118+ _e_td_t :: Vec.Vector b
119119+ } deriving (Show)
120120+makeLenses ''Persistent
121121+122122+-- | State to start with
123123+persistentInit :: forall s b d. (KnownNat s, Integral d) => Message s R -> Persistent s R b d
124124+persistentInit p = Persistent { _t = 1, _f_msg = p, _b = identity, _e_td_t = Vec.empty}
125125+126126+-- | Filtering message propagated forward
127127+forward :: (KnownNat s) => HMM s t R b -> SensorDiagonal s R -> Message s R -> Message s R
128128+forward hmm ot f = normalise (ot !*! Linear.transpose (hmm ^. tModel) !*! f)
129129+130130+-- | Smoothing message propagated backward
131131+backward :: (KnownNat s) => HMM s t R b -> SensorDiagonal s R -> Message s R -> Message s R
132132+backward hmm ok1 bk2 = (hmm ^. tModel) !*! ok1 !*! bk2
133133+134134+135135+-- | Online Algorithm for smoothing with a fixed time lag of `d` steps
136136+-- hmm -- HMM model
137137+-- d -- length of lag
138138+-- e -- evidence at time t
139139+fixedLagSmoothing :: forall s u b d. (KnownNat s, KnownNat u, Eq b, Integral d) => HMM s u R b -> d -> b -> MaybeT (State (Persistent s R b d)) (Distribution s R)
140140+fixedLagSmoothing hmm d e = do
141141+ e_td_t %= flip Vec.snoc e
142142+143143+ o_t <- uses e_td_t $ (^?! _Just) . sensorDiagonal hmm . Vec.last
144144+145145+ t' <- use t
146146+ if t' > d then
147147+ do
148148+ e_td_t %= Vec.drop 1
149149+ o_tmd <- uses e_td_t $ (^?! _Just) . sensorDiagonal hmm . Vec.head
150150+ f_msg %= forward hmm o_tmd
151151+ b %= \b' -> inverse o_tmd !*! inverse (hmm ^. tModel) !*! b' !*! (hmm ^. tModel) !*! o_t
152152+ t += 1
153153+154154+ (f'', b'') <- liftA2 (,) (use f_msg) (use b)
155155+156156+ return $ extract1 $ normalise (f'' !**! (b'' !*! unitColumn))
157157+ else
158158+ do
159159+ b %= \b' -> b' !*! (hmm ^. tModel) !*! o_t
160160+ t += 1
161161+ mzero
162162+163163+164164+-- | The forward–backward algorithm for smoothing: computing posterior prob- abilities of a sequence of states given a sequence of observations
165165+-- hmm - HMM model as a way to implement
166166+-- evs - list of evidences for each time step
167167+forwardBackward :: forall s t u b . (KnownNat t, KnownNat s, KnownNat u, Eq b) => HMM s u R b -> V t b -> V t (Distribution s R)
168168+forwardBackward hmm evs = let
169169+ -- forward messages
170170+ fv :: V (t + 1) (Message s R)
171171+ fv = V $ Vec.fromList $ foldl' (\m@(x:_) e -> forward hmm (sensorDiagonal hmm e ^?! _Just) x : m) [hmm ^. prior] evs
172172+ -- reifying the number of evidences
173173+ tNat = dim evs
174174+ -- getting rid of the prior message from the end of the list
175175+ fv_0 :: V t (Message s R)
176176+ fv_0 = V $ Vec.fromList $ fv ^.. taking tNat traversed
177177+ -- backward messages
178178+ bs :: V t (Message s R)
179179+ bs = V $ Vec.fromList $ foldl' (\m@(x:_) e -> backward hmm (sensorDiagonal hmm e ^?! _Just) x : m) [unitColumn] $ reverseV evs
180180+ in
181181+ -- smoothing probabilities in reverse order of the list of evidences
182182+ liftA2 (\f b' -> extract1 $ normalise $ f !**! b') fv_0 (reverseV bs)
183183+184184+-- | execution
185185+umbrellaHMM :: HMM 2 2 R Bool
186186+umbrellaHMM = mkHMM1 (V2 (V2 0.7 0.3) (V2 0.3 0.7)) (V2 (V2 0.9 0.2) (V2 0.1 0.8))
187187+188188+runFLSAlgo :: [Bool] -> [Maybe (Distribution 2 String)]
189189+runFLSAlgo bs = let hmm = mkHMM1 (V2 (V2 0.7 0.3) (V2 0.3 0.7)) (V2 (V2 0.9 0.2) (V2 0.1 0.8))
190190+ initState = persistentInit (V $ Vec.fromList [V $ Vec.singleton 0.5, V $ Vec.singleton 0.5]) :: Persistent 2 R Bool Integer
191191+ algo = fixedLagSmoothing hmm 1
192192+ a :: ([Maybe (Distribution 2 R)], Persistent 2 R Bool Integer)
193193+ a = foldl' (\(rs, s) x -> runState (runMaybeT $ algo x) s & _1 #%~ ((rs ++) . pure)) ([], initState) bs
194194+ in
195195+ (a ^. _1) & traverse.traverse.traverse %~ \(x :: R) -> printf "%.3f" x :: String
196196+197197+198198+runFBAlgo :: (KnownNat t) =>V t Bool -> [Distribution 2 R]
199199+runFBAlgo bs = toList $ forwardBackward umbrellaHMM bs