hmm_filter.html 38 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895
  1. <!DOCTYPE html>
  2. <html lang="en">
  3. <head>
  4. <meta charset="utf-8" />
  5. <meta name="viewport" content="width=device-width, initial-scale=1.0" />
  6. <title>HMM filtering (forwards algorithm) &#8212; State Space Models: A Modern Approach</title>
  7. <link href="../../_static/css/theme.css" rel="stylesheet">
  8. <link href="../../_static/css/index.ff1ffe594081f20da1ef19478df9384b.css" rel="stylesheet">
  9. <link rel="stylesheet"
  10. href="../../_static/vendor/fontawesome/5.13.0/css/all.min.css">
  11. <link rel="preload" as="font" type="font/woff2" crossorigin
  12. href="../../_static/vendor/fontawesome/5.13.0/webfonts/fa-solid-900.woff2">
  13. <link rel="preload" as="font" type="font/woff2" crossorigin
  14. href="../../_static/vendor/fontawesome/5.13.0/webfonts/fa-brands-400.woff2">
  15. <link rel="stylesheet" type="text/css" href="../../_static/pygments.css" />
  16. <link rel="stylesheet" type="text/css" href="../../_static/sphinx-book-theme.css?digest=c3fdc42140077d1ad13ad2f1588a4309" />
  17. <link rel="stylesheet" type="text/css" href="../../_static/togglebutton.css" />
  18. <link rel="stylesheet" type="text/css" href="../../_static/copybutton.css" />
  19. <link rel="stylesheet" type="text/css" href="../../_static/mystnb.css" />
  20. <link rel="stylesheet" type="text/css" href="../../_static/sphinx-thebe.css" />
  21. <link rel="stylesheet" type="text/css" href="../../_static/panels-main.c949a650a448cc0ae9fd3441c0e17fb0.css" />
  22. <link rel="stylesheet" type="text/css" href="../../_static/panels-variables.06eb56fa6e07937060861dad626602ad.css" />
  23. <link rel="preload" as="script" href="../../_static/js/index.be7d3bbb2ef33a8344ce.js">
  24. <script data-url_root="../../" id="documentation_options" src="../../_static/documentation_options.js"></script>
  25. <script src="../../_static/jquery.js"></script>
  26. <script src="../../_static/underscore.js"></script>
  27. <script src="../../_static/doctools.js"></script>
  28. <script src="../../_static/clipboard.min.js"></script>
  29. <script src="../../_static/copybutton.js"></script>
  30. <script>let toggleHintShow = 'Click to show';</script>
  31. <script>let toggleHintHide = 'Click to hide';</script>
  32. <script>let toggleOpenOnPrint = 'true';</script>
  33. <script src="../../_static/togglebutton.js"></script>
  34. <script>var togglebuttonSelector = '.toggle, .admonition.dropdown, .tag_hide_input div.cell_input, .tag_hide-input div.cell_input, .tag_hide_output div.cell_output, .tag_hide-output div.cell_output, .tag_hide_cell.cell, .tag_hide-cell.cell';</script>
  35. <script src="../../_static/sphinx-book-theme.d59cb220de22ca1c485ebbdc042f0030.js"></script>
  36. <script>const THEBE_JS_URL = "https://unpkg.com/thebe@0.8.2/lib/index.js"
  37. const thebe_selector = ".thebe,.cell"
  38. const thebe_selector_input = "pre"
  39. const thebe_selector_output = ".output, .cell_output"
  40. </script>
  41. <script async="async" src="../../_static/sphinx-thebe.js"></script>
  42. <!-- MathJax 3 configuration: v3 reads the lowercase "tex" block and its "macros" map; v2-style "TeX"/"Macros" keys are ignored. --><script>window.MathJax = {"tex": {"macros": {"N": "\\mathbb{N}", "floor": ["\\lfloor#1\\rfloor", 1], "bmat": ["\\left[\\begin{array}"], "emat": ["\\end{array}\\right]"]}}, "options": {"processHtmlClass": "tex2jax_process|mathjax_process|math|output_area"}}</script>
  43. <script defer="defer" src="https://cdn.jsdelivr.net/npm/mathjax@3/es5/tex-mml-chtml.js"></script>
  44. <link rel="index" title="Index" href="../../genindex.html" />
  45. <link rel="search" title="Search" href="../../search.html" />
  46. <link rel="next" title="HMM smoothing (forwards-backwards algorithm)" href="hmm_smoother.html" />
  47. <link rel="prev" title="Hidden Markov Models" href="hmm_index.html" />
  48. <meta name="viewport" content="width=device-width, initial-scale=1" />
  49. <meta name="docsearch:language" content="en">
  50. <!-- Google Analytics -->
  51. </head>
  52. <body data-spy="scroll" data-target="#bd-toc-nav" data-offset="80">
  53. <div class="container-fluid" id="banner"></div>
  54. <div class="container-xl">
  55. <div class="row">
  56. <div class="col-12 col-md-3 bd-sidebar site-navigation show" id="site-navigation">
  57. <div class="navbar-brand-box">
  58. <a class="navbar-brand text-wrap" href="../../index.html">
  59. <h1 class="site-logo" id="site-title">State Space Models: A Modern Approach</h1>
  60. </a>
  61. </div><form class="bd-search d-flex align-items-center" action="../../search.html" method="get">
  62. <i class="icon fas fa-search"></i>
  63. <input type="search" class="form-control" name="q" id="search-input" placeholder="Search this book..." aria-label="Search this book..." autocomplete="off" >
  64. </form><nav class="bd-links" id="bd-docs-nav" aria-label="Main">
  65. <div class="bd-toc-item active">
  66. <ul class="nav bd-sidenav">
  67. <li class="toctree-l1">
  68. <a class="reference internal" href="../../root.html">
  69. State Space Models: A Modern Approach
  70. </a>
  71. </li>
  72. </ul>
  73. <ul class="current nav bd-sidenav">
  74. <li class="toctree-l1">
  75. <a class="reference internal" href="../scratch.html">
  76. Scratchpad
  77. </a>
  78. </li>
  79. <li class="toctree-l1 has-children">
  80. <a class="reference internal" href="../ssm/ssm_index.html">
  81. State Space Models
  82. </a>
  83. <input class="toctree-checkbox" id="toctree-checkbox-1" name="toctree-checkbox-1" type="checkbox"/>
  84. <label for="toctree-checkbox-1">
  85. <i class="fas fa-chevron-down">
  86. </i>
  87. </label>
  88. <ul>
  89. <li class="toctree-l2">
  90. <a class="reference internal" href="../ssm/ssm_intro.html">
  91. What are State Space Models?
  92. </a>
  93. </li>
  94. <li class="toctree-l2">
  95. <a class="reference internal" href="../ssm/hmm.html">
  96. Hidden Markov Models
  97. </a>
  98. </li>
  99. <li class="toctree-l2">
  100. <a class="reference internal" href="../ssm/lds.html">
  101. Linear Gaussian SSMs
  102. </a>
  103. </li>
  104. <li class="toctree-l2">
  105. <a class="reference internal" href="../ssm/nlds.html">
  106. Nonlinear Gaussian SSMs
  107. </a>
  108. </li>
  109. <li class="toctree-l2">
  110. <a class="reference internal" href="../ssm/inference.html">
  111. Inferential goals
  112. </a>
  113. </li>
  114. </ul>
  115. </li>
  116. <li class="toctree-l1 current active has-children">
  117. <a class="reference internal" href="hmm_index.html">
  118. Hidden Markov Models
  119. </a>
  120. <input checked="" class="toctree-checkbox" id="toctree-checkbox-2" name="toctree-checkbox-2" type="checkbox"/>
  121. <label for="toctree-checkbox-2">
  122. <i class="fas fa-chevron-down">
  123. </i>
  124. </label>
  125. <ul class="current">
  126. <li class="toctree-l2 current active">
  127. <a class="current reference internal" href="#">
  128. HMM filtering (forwards algorithm)
  129. </a>
  130. </li>
  131. <li class="toctree-l2">
  132. <a class="reference internal" href="hmm_smoother.html">
  133. HMM smoothing (forwards-backwards algorithm)
  134. </a>
  135. </li>
  136. <li class="toctree-l2">
  137. <a class="reference internal" href="hmm_viterbi.html">
  138. Viterbi algorithm
  139. </a>
  140. </li>
  141. <li class="toctree-l2">
  142. <a class="reference internal" href="hmm_parallel.html">
  143. Parallel HMM smoothing
  144. </a>
  145. </li>
  146. <li class="toctree-l2">
  147. <a class="reference internal" href="hmm_sampling.html">
  148. Forwards-filtering backwards-sampling algorithm
  149. </a>
  150. </li>
  151. </ul>
  152. </li>
  153. <li class="toctree-l1 has-children">
  154. <a class="reference internal" href="../lgssm/lgssm_index.html">
  155. Linear-Gaussian SSMs
  156. </a>
  157. <input class="toctree-checkbox" id="toctree-checkbox-3" name="toctree-checkbox-3" type="checkbox"/>
  158. <label for="toctree-checkbox-3">
  159. <i class="fas fa-chevron-down">
  160. </i>
  161. </label>
  162. <ul>
  163. <li class="toctree-l2">
  164. <a class="reference internal" href="../lgssm/kalman_filter.html">
  165. Kalman filtering
  166. </a>
  167. </li>
  168. <li class="toctree-l2">
  169. <a class="reference internal" href="../lgssm/kalman_smoother.html">
  170. Kalman (RTS) smoother
  171. </a>
  172. </li>
  173. <li class="toctree-l2">
  174. <a class="reference internal" href="../lgssm/kalman_parallel.html">
  175. Parallel Kalman Smoother
  176. </a>
  177. </li>
  178. <li class="toctree-l2">
  179. <a class="reference internal" href="../lgssm/kalman_sampling.html">
  180. Forwards-filtering backwards sampling
  181. </a>
  182. </li>
  183. </ul>
  184. </li>
  185. <li class="toctree-l1 has-children">
  186. <a class="reference internal" href="../extended/extended_index.html">
  187. Extended (linearized) methods
  188. </a>
  189. <input class="toctree-checkbox" id="toctree-checkbox-4" name="toctree-checkbox-4" type="checkbox"/>
  190. <label for="toctree-checkbox-4">
  191. <i class="fas fa-chevron-down">
  192. </i>
  193. </label>
  194. <ul>
  195. <li class="toctree-l2">
  196. <a class="reference internal" href="../extended/extended_filter.html">
  197. Extended Kalman filtering
  198. </a>
  199. </li>
  200. <li class="toctree-l2">
  201. <a class="reference internal" href="../extended/extended_smoother.html">
  202. Extended Kalman smoother
  203. </a>
  204. </li>
  205. <li class="toctree-l2">
  206. <a class="reference internal" href="../extended/extended_parallel.html">
  207. Parallel extended Kalman smoothing
  208. </a>
  209. </li>
  210. </ul>
  211. </li>
  212. <li class="toctree-l1 has-children">
  213. <a class="reference internal" href="../unscented/unscented_index.html">
  214. Unscented methods
  215. </a>
  216. <input class="toctree-checkbox" id="toctree-checkbox-5" name="toctree-checkbox-5" type="checkbox"/>
  217. <label for="toctree-checkbox-5">
  218. <i class="fas fa-chevron-down">
  219. </i>
  220. </label>
  221. <ul>
  222. <li class="toctree-l2">
  223. <a class="reference internal" href="../unscented/unscented_filter.html">
  224. Unscented filtering
  225. </a>
  226. </li>
  227. <li class="toctree-l2">
  228. <a class="reference internal" href="../unscented/unscented_smoother.html">
  229. Unscented smoothing
  230. </a>
  231. </li>
  232. </ul>
  233. </li>
  234. <li class="toctree-l1">
  235. <a class="reference internal" href="../quadrature/quadrature_index.html">
  236. Quadrature and cubature methods
  237. </a>
  238. </li>
  239. <li class="toctree-l1">
  240. <a class="reference internal" href="../postlin/postlin_index.html">
  241. Posterior linearization
  242. </a>
  243. </li>
  244. <li class="toctree-l1">
  245. <a class="reference internal" href="../adf/adf_index.html">
  246. Assumed Density Filtering
  247. </a>
  248. </li>
  249. <li class="toctree-l1">
  250. <a class="reference internal" href="../vi/vi_index.html">
  251. Variational inference
  252. </a>
  253. </li>
  254. <li class="toctree-l1">
  255. <a class="reference internal" href="../pf/pf_index.html">
  256. Particle filtering
  257. </a>
  258. </li>
  259. <li class="toctree-l1">
  260. <a class="reference internal" href="../smc/smc_index.html">
  261. Sequential Monte Carlo
  262. </a>
  263. </li>
  264. <li class="toctree-l1">
  265. <a class="reference internal" href="../learning/learning_index.html">
  266. Offline parameter estimation (learning)
  267. </a>
  268. </li>
  269. <li class="toctree-l1">
  270. <a class="reference internal" href="../tracking/tracking_index.html">
  271. Multi-target tracking
  272. </a>
  273. </li>
  274. <li class="toctree-l1">
  275. <a class="reference internal" href="../ensemble/ensemble_index.html">
  276. Data assimilation using Ensemble Kalman filter
  277. </a>
  278. </li>
  279. <li class="toctree-l1">
  280. <a class="reference internal" href="../bnp/bnp_index.html">
  281. Bayesian non-parametric SSMs
  282. </a>
  283. </li>
  284. <li class="toctree-l1">
  285. <a class="reference internal" href="../changepoint/changepoint_index.html">
  286. Changepoint detection
  287. </a>
  288. </li>
  289. <li class="toctree-l1">
  290. <a class="reference internal" href="../timeseries/timeseries_index.html">
  291. Timeseries forecasting
  292. </a>
  293. </li>
  294. <li class="toctree-l1">
  295. <a class="reference internal" href="../gp/gp_index.html">
  296. Markovian Gaussian processes
  297. </a>
  298. </li>
  299. <li class="toctree-l1">
  300. <a class="reference internal" href="../ode/ode_index.html">
  301. Differential equations and SSMs
  302. </a>
  303. </li>
  304. <li class="toctree-l1">
  305. <a class="reference internal" href="../control/control_index.html">
  306. Optimal control
  307. </a>
  308. </li>
  309. <li class="toctree-l1">
  310. <a class="reference internal" href="../../bib.html">
  311. Bibliography
  312. </a>
  313. </li>
  314. </ul>
  315. </div>
  316. </nav> <!-- To handle the deprecated key -->
  317. <div class="navbar_extra_footer">
  318. Powered by <a href="https://jupyterbook.org">Jupyter Book</a>
  319. </div>
  320. </div>
  321. <main class="col py-md-3 pl-md-4 bd-content overflow-auto" role="main">
  322. <div class="topbar container-xl fixed-top">
  323. <div class="topbar-contents row">
  324. <div class="col-12 col-md-3 bd-topbar-whitespace site-navigation show"></div>
  325. <div class="col pl-md-4 topbar-main">
  326. <!-- Sidebar toggle button. Each attribute appears once (HTML keeps only the first of any repeated attribute); aria-controls names the sidebar element id="site-navigation" that data-target collapses. -->
  327. <button id="navbar-toggler" class="navbar-toggler ml-0" type="button" data-toggle="collapse"
  328. data-placement="bottom" data-target=".site-navigation" title="Toggle navigation"
  329. aria-expanded="true" aria-label="Toggle navigation" aria-controls="site-navigation">
  330. <i class="fas fa-bars"></i>
  331. <i class="fas fa-arrow-left"></i>
  332. <i class="fas fa-arrow-up"></i>
  333. </button>
  334. <div class="dropdown-buttons-trigger">
  335. <button id="dropdown-buttons-trigger" class="btn btn-secondary topbarbtn" aria-label="Download this page"><i
  336. class="fas fa-download"></i></button>
  337. <div class="dropdown-buttons">
  338. <!-- ipynb file if we had a myst markdown file -->
  339. <!-- Download raw file -->
  340. <a class="dropdown-buttons" href="../../_sources/chapters/hmm/hmm_filter.ipynb"><button type="button"
  341. class="btn btn-secondary topbarbtn" title="Download source file" data-toggle="tooltip"
  342. data-placement="left">.ipynb</button></a>
  343. <!-- Download PDF via print -->
  344. <button type="button" id="download-print" class="btn btn-secondary topbarbtn" title="Print to PDF"
  345. onclick="printPdf(this)" data-toggle="tooltip" data-placement="left">.pdf</button>
  346. </div>
  347. </div>
  348. <!-- Source interaction buttons -->
  349. <div class="dropdown-buttons-trigger">
  350. <button id="dropdown-buttons-trigger" class="btn btn-secondary topbarbtn"
  351. aria-label="Connect with source repository"><i class="fab fa-github"></i></button>
  352. <div class="dropdown-buttons sourcebuttons">
  353. <a class="repository-button"
  354. href="https://github.com/probml/ssm-book"><button type="button" class="btn btn-secondary topbarbtn"
  355. data-toggle="tooltip" data-placement="left" title="Source repository"><i
  356. class="fab fa-github"></i>repository</button></a>
  357. <a class="issues-button"
  358. href="https://github.com/probml/ssm-book/issues/new?title=Issue%20on%20page%20%2Fchapters/hmm/hmm_filter.html&body=Your%20issue%20content%20here."><button
  359. type="button" class="btn btn-secondary topbarbtn" data-toggle="tooltip" data-placement="left"
  360. title="Open an issue"><i class="fas fa-lightbulb"></i>open issue</button></a>
  361. </div>
  362. </div>
  363. <!-- Full screen (wrap in <a> to have style consistency -->
  364. <a class="full-screen-button"><button type="button" class="btn btn-secondary topbarbtn" data-toggle="tooltip"
  365. data-placement="bottom" onclick="toggleFullScreen()" aria-label="Fullscreen mode"
  366. title="Fullscreen mode"><i
  367. class="fas fa-expand"></i></button></a>
  368. <!-- Launch buttons -->
  369. <div class="dropdown-buttons-trigger">
  370. <button id="dropdown-buttons-trigger" class="btn btn-secondary topbarbtn"
  371. aria-label="Launch interactive content"><i class="fas fa-rocket"></i></button>
  372. <div class="dropdown-buttons">
  373. <a class="binder-button" href="https://mybinder.org/v2/gh/probml/ssm-book/main?urlpath=tree/chapters/hmm/hmm_filter.ipynb"><button type="button"
  374. class="btn btn-secondary topbarbtn" title="Launch Binder" data-toggle="tooltip"
  375. data-placement="left"><img class="binder-button-logo"
  376. src="../../_static/images/logo_binder.svg"
  377. alt="Interact on binder">Binder</button></a>
  378. <a class="colab-button" href="https://colab.research.google.com/github/probml/ssm-book/blob/main/chapters/hmm/hmm_filter.ipynb"><button type="button" class="btn btn-secondary topbarbtn"
  379. title="Launch Colab" data-toggle="tooltip" data-placement="left"><img class="colab-button-logo"
  380. src="../../_static/images/logo_colab.png"
  381. alt="Interact on Colab">Colab</button></a>
  382. </div>
  383. </div>
  384. </div>
  385. <!-- Table of contents -->
  386. <div class="d-none d-md-block col-md-2 bd-toc show noprint">
  387. </div>
  388. </div>
  389. </div>
  390. <div id="main-content" class="row">
  391. <div class="col-12 col-md-9 pl-md-3 pr-md-0">
  392. <!-- Table of contents that is only displayed when printing the page -->
  393. <div id="jb-print-docs-body" class="onlyprint">
  394. <h1>HMM filtering (forwards algorithm)</h1>
  395. <!-- Table of contents -->
  396. <div id="print-main-content">
  397. <div id="jb-print-toc">
  398. </div>
  399. </div>
  400. </div>
  401. <div>
  402. <div class="math notranslate nohighlight">
  403. \[ \begin{align}\begin{aligned}\newcommand{\defeq}{\triangleq}
  404. \newcommand{\trans}{{\mkern-1.5mu\mathsf{T}}}
  405. \newcommand{\transpose}[1]{{#1}^{\trans}}\\\newcommand{\inv}[1]{{#1}^{-1}}
  406. \DeclareMathOperator{\dotstar}{\odot}\\
  407. \newcommand\floor[1]{\lfloor#1\rfloor}\\\newcommand{\real}{\mathbb{R}}\\% Numbers
  408. \newcommand{\vzero}{\boldsymbol{0}}
  409. \newcommand{\vone}{\boldsymbol{1}}\\% Greek https://www.latex-tutorial.com/symbols/greek-alphabet/
  410. \newcommand{\valpha}{\boldsymbol{\alpha}}
  411. \newcommand{\vbeta}{\boldsymbol{\beta}}
  412. \newcommand{\vchi}{\boldsymbol{\chi}}
  413. \newcommand{\vdelta}{\boldsymbol{\delta}}
  414. \newcommand{\vDelta}{\boldsymbol{\Delta}}
  415. \newcommand{\vepsilon}{\boldsymbol{\epsilon}}
  416. \newcommand{\vzeta}{\boldsymbol{\zeta}}
  417. \newcommand{\vXi}{\boldsymbol{\Xi}}
  418. \newcommand{\vell}{\boldsymbol{\ell}}
  419. \newcommand{\veta}{\boldsymbol{\eta}}
  420. %\newcommand{\vEta}{\boldsymbol{\Eta}}
  421. \newcommand{\vgamma}{\boldsymbol{\gamma}}
  422. \newcommand{\vGamma}{\boldsymbol{\Gamma}}
  423. \newcommand{\vmu}{\boldsymbol{\mu}}
  424. \newcommand{\vmut}{\boldsymbol{\tilde{\mu}}}
  425. \newcommand{\vnu}{\boldsymbol{\nu}}
  426. \newcommand{\vkappa}{\boldsymbol{\kappa}}
  427. \newcommand{\vlambda}{\boldsymbol{\lambda}}
  428. \newcommand{\vLambda}{\boldsymbol{\Lambda}}
  429. \newcommand{\vLambdaBar}{\overline{\vLambda}}
  430. %\newcommand{\vnu}{\boldsymbol{\nu}}
  431. \newcommand{\vomega}{\boldsymbol{\omega}}
  432. \newcommand{\vOmega}{\boldsymbol{\Omega}}
  433. \newcommand{\vphi}{\boldsymbol{\phi}}
  434. \newcommand{\vvarphi}{\boldsymbol{\varphi}}
  435. \newcommand{\vPhi}{\boldsymbol{\Phi}}
  436. \newcommand{\vpi}{\boldsymbol{\pi}}
  437. \newcommand{\vPi}{\boldsymbol{\Pi}}
  438. \newcommand{\vpsi}{\boldsymbol{\psi}}
  439. \newcommand{\vPsi}{\boldsymbol{\Psi}}
  440. \newcommand{\vrho}{\boldsymbol{\rho}}
  441. \newcommand{\vtheta}{\boldsymbol{\theta}}
  442. \newcommand{\vthetat}{\boldsymbol{\tilde{\theta}}}
  443. \newcommand{\vTheta}{\boldsymbol{\Theta}}
  444. \newcommand{\vsigma}{\boldsymbol{\sigma}}
  445. \newcommand{\vSigma}{\boldsymbol{\Sigma}}
  446. \newcommand{\vSigmat}{\boldsymbol{\tilde{\Sigma}}}
  447. \newcommand{\vsigmoid}{\vsigma}
  448. \newcommand{\vtau}{\boldsymbol{\tau}}
  449. \newcommand{\vxi}{\boldsymbol{\xi}}\\
  450. % Lower Roman (Vectors)
  451. \newcommand{\va}{\mathbf{a}}
  452. \newcommand{\vb}{\mathbf{b}}
  453. \newcommand{\vBt}{\mathbf{\tilde{B}}}
  454. \newcommand{\vc}{\mathbf{c}}
  455. \newcommand{\vct}{\mathbf{\tilde{c}}}
  456. \newcommand{\vd}{\mathbf{d}}
  457. \newcommand{\ve}{\mathbf{e}}
  458. \newcommand{\vf}{\mathbf{f}}
  459. \newcommand{\vg}{\mathbf{g}}
  460. \newcommand{\vh}{\mathbf{h}}
  461. %\newcommand{\myvh}{\mathbf{h}}
  462. \newcommand{\vi}{\mathbf{i}}
  463. \newcommand{\vj}{\mathbf{j}}
  464. \newcommand{\vk}{\mathbf{k}}
  465. \newcommand{\vl}{\mathbf{l}}
  466. \newcommand{\vm}{\mathbf{m}}
  467. \newcommand{\vn}{\mathbf{n}}
  468. \newcommand{\vo}{\mathbf{o}}
  469. \newcommand{\vp}{\mathbf{p}}
  470. \newcommand{\vq}{\mathbf{q}}
  471. \newcommand{\vr}{\mathbf{r}}
  472. \newcommand{\vs}{\mathbf{s}}
  473. \newcommand{\vt}{\mathbf{t}}
  474. \newcommand{\vu}{\mathbf{u}}
  475. \newcommand{\vv}{\mathbf{v}}
  476. \newcommand{\vw}{\mathbf{w}}
  477. \newcommand{\vws}{\vw_s}
  478. \newcommand{\vwt}{\mathbf{\tilde{w}}}
  479. \newcommand{\vWt}{\mathbf{\tilde{W}}}
  480. \newcommand{\vwh}{\hat{\vw}}
  481. \newcommand{\vx}{\mathbf{x}}
  482. %\newcommand{\vx}{\mathbf{x}}
  483. \newcommand{\vxt}{\mathbf{\tilde{x}}}
  484. \newcommand{\vy}{\mathbf{y}}
  485. \newcommand{\vyt}{\mathbf{\tilde{y}}}
  486. \newcommand{\vz}{\mathbf{z}}
  487. %\newcommand{\vzt}{\mathbf{\tilde{z}}}\\
  488. % Upper Roman (Matrices)
  489. \newcommand{\vA}{\mathbf{A}}
  490. \newcommand{\vB}{\mathbf{B}}
  491. \newcommand{\vC}{\mathbf{C}}
  492. \newcommand{\vD}{\mathbf{D}}
  493. \newcommand{\vE}{\mathbf{E}}
  494. \newcommand{\vF}{\mathbf{F}}
  495. \newcommand{\vG}{\mathbf{G}}
  496. \newcommand{\vH}{\mathbf{H}}
  497. \newcommand{\vI}{\mathbf{I}}
  498. \newcommand{\vJ}{\mathbf{J}}
  499. \newcommand{\vK}{\mathbf{K}}
  500. \newcommand{\vL}{\mathbf{L}}
  501. \newcommand{\vM}{\mathbf{M}}
  502. \newcommand{\vMt}{\mathbf{\tilde{M}}}
  503. \newcommand{\vN}{\mathbf{N}}
  504. \newcommand{\vO}{\mathbf{O}}
  505. \newcommand{\vP}{\mathbf{P}}
  506. \newcommand{\vQ}{\mathbf{Q}}
  507. \newcommand{\vR}{\mathbf{R}}
  508. \newcommand{\vS}{\mathbf{S}}
  509. \newcommand{\vT}{\mathbf{T}}
  510. \newcommand{\vU}{\mathbf{U}}
  511. \newcommand{\vV}{\mathbf{V}}
  512. \newcommand{\vW}{\mathbf{W}}
  513. \newcommand{\vX}{\mathbf{X}}
  514. %\newcommand{\vXs}{\vX_{\vs}}
  515. \newcommand{\vXs}{\vX_{s}}
  516. \newcommand{\vXt}{\mathbf{\tilde{X}}}
  517. \newcommand{\vY}{\mathbf{Y}}
  518. \newcommand{\vZ}{\mathbf{Z}}
  519. \newcommand{\vZt}{\mathbf{\tilde{Z}}}
  520. \newcommand{\vzt}{\mathbf{\tilde{z}}}\\
  521. %%%%
  522. \newcommand{\hidden}{\vz}
  523. \newcommand{\hid}{\hidden}
  524. \newcommand{\observed}{\vy}
  525. \newcommand{\obs}{\observed}
  526. \newcommand{\inputs}{\vu}
  527. \newcommand{\input}{\inputs}\\\newcommand{\hmmTrans}{\vA}
  528. \newcommand{\hmmObs}{\vB}
  529. \newcommand{\hmmInit}{\vpi}\\
  530. \newcommand{\ldsDyn}{\vA}
  531. \newcommand{\ldsObs}{\vC}
  532. \newcommand{\ldsDynIn}{\vB}
  533. \newcommand{\ldsObsIn}{\vD}
  534. \newcommand{\ldsDynNoise}{\vQ}
  535. \newcommand{\ldsObsNoise}{\vR}\\\newcommand{\ssmDynFn}{f}
  536. \newcommand{\ssmObsFn}{h}\\
  537. %%%
  538. \newcommand{\gauss}{\mathcal{N}}\\\newcommand{\diag}{\mathrm{diag}}\end{aligned}\end{align} \]</div>
  539. <div class="cell docutils container">
  540. <div class="cell_input docutils container">
  541. <div class="highlight-ipython3 notranslate"><div class="highlight"><pre><span></span><span class="c1"># meta-data does not work yet in VScode</span>
  542. <span class="c1"># https://github.com/microsoft/vscode-jupyter/issues/1121</span>
  543. <span class="p">{</span>
  544. <span class="s2">&quot;tags&quot;</span><span class="p">:</span> <span class="p">[</span>
  545. <span class="s2">&quot;hide-cell&quot;</span>
  546. <span class="p">]</span>
  547. <span class="p">}</span>
  548. <span class="c1">### Install necessary libraries</span>
  549. <span class="k">try</span><span class="p">:</span>
  550. <span class="kn">import</span> <span class="nn">jax</span>
  551. <span class="k">except</span><span class="p">:</span>
  552. <span class="c1"># For cuda version, see https://github.com/google/jax#installation</span>
  553. <span class="o">%</span><span class="k">pip</span> install --upgrade &quot;jax[cpu]&quot;
  554. <span class="kn">import</span> <span class="nn">jax</span>
  555. <span class="k">try</span><span class="p">:</span>
  556. <span class="kn">import</span> <span class="nn">distrax</span>
  557. <span class="k">except</span><span class="p">:</span>
  558. <span class="o">%</span><span class="k">pip</span> install --upgrade distrax
  559. <span class="kn">import</span> <span class="nn">distrax</span>
  560. <span class="k">try</span><span class="p">:</span>
  561. <span class="kn">import</span> <span class="nn">jsl</span>
  562. <span class="k">except</span><span class="p">:</span>
  563. <span class="o">%</span><span class="k">pip</span> install git+https://github.com/probml/jsl
  564. <span class="kn">import</span> <span class="nn">jsl</span>
  565. <span class="c1">#try:</span>
  566. <span class="c1"># import ssm_jax</span>
  567. <span class="c1">##except:</span>
  568. <span class="c1"># %pip install git+https://github.com/probml/ssm-jax</span>
  569. <span class="c1"># import ssm_jax</span>
  570. <span class="k">try</span><span class="p">:</span>
  571. <span class="kn">import</span> <span class="nn">rich</span>
  572. <span class="k">except</span><span class="p">:</span>
  573. <span class="o">%</span><span class="k">pip</span> install rich
  574. <span class="kn">import</span> <span class="nn">rich</span>
  575. </pre></div>
  576. </div>
  577. </div>
  578. </div>
  579. <div class="cell docutils container">
  580. <div class="cell_input docutils container">
  581. <div class="highlight-ipython3 notranslate"><div class="highlight"><pre><span></span><span class="p">{</span>
  582. <span class="s2">&quot;tags&quot;</span><span class="p">:</span> <span class="p">[</span>
  583. <span class="s2">&quot;hide-cell&quot;</span>
  584. <span class="p">]</span>
  585. <span class="p">}</span>
  586. <span class="c1">### Import standard libraries</span>
  587. <span class="kn">import</span> <span class="nn">abc</span>
  588. <span class="kn">from</span> <span class="nn">dataclasses</span> <span class="kn">import</span> <span class="n">dataclass</span>
  589. <span class="kn">import</span> <span class="nn">functools</span>
  590. <span class="kn">import</span> <span class="nn">itertools</span>
  591. <span class="kn">from</span> <span class="nn">typing</span> <span class="kn">import</span> <span class="n">Any</span><span class="p">,</span> <span class="n">Callable</span><span class="p">,</span> <span class="n">NamedTuple</span><span class="p">,</span> <span class="n">Optional</span><span class="p">,</span> <span class="n">Union</span><span class="p">,</span> <span class="n">Tuple</span>
  592. <span class="kn">import</span> <span class="nn">matplotlib.pyplot</span> <span class="k">as</span> <span class="nn">plt</span>
  593. <span class="kn">import</span> <span class="nn">numpy</span> <span class="k">as</span> <span class="nn">np</span>
  594. <span class="kn">import</span> <span class="nn">jax</span>
  595. <span class="kn">import</span> <span class="nn">jax.numpy</span> <span class="k">as</span> <span class="nn">jnp</span>
  596. <span class="kn">from</span> <span class="nn">jax</span> <span class="kn">import</span> <span class="n">lax</span><span class="p">,</span> <span class="n">vmap</span><span class="p">,</span> <span class="n">jit</span><span class="p">,</span> <span class="n">grad</span>
  597. <span class="kn">from</span> <span class="nn">jax.scipy.special</span> <span class="kn">import</span> <span class="n">logit</span>
  598. <span class="kn">from</span> <span class="nn">jax.nn</span> <span class="kn">import</span> <span class="n">softmax</span>
  599. <span class="kn">from</span> <span class="nn">functools</span> <span class="kn">import</span> <span class="n">partial</span>
  600. <span class="kn">from</span> <span class="nn">jax.random</span> <span class="kn">import</span> <span class="n">PRNGKey</span><span class="p">,</span> <span class="n">split</span>
  601. <span class="kn">import</span> <span class="nn">inspect</span>
  602. <span class="kn">import</span> <span class="nn">inspect</span> <span class="k">as</span> <span class="nn">py_inspect</span>
  603. <span class="kn">import</span> <span class="nn">rich</span>
  604. <span class="kn">from</span> <span class="nn">rich</span> <span class="kn">import</span> <span class="n">inspect</span> <span class="k">as</span> <span class="n">r_inspect</span>
  605. <span class="kn">from</span> <span class="nn">rich</span> <span class="kn">import</span> <span class="nb">print</span> <span class="k">as</span> <span class="n">r_print</span>
  606. <span class="k">def</span> <span class="nf">print_source</span><span class="p">(</span><span class="n">fname</span><span class="p">):</span>
  607. <span class="n">r_print</span><span class="p">(</span><span class="n">py_inspect</span><span class="o">.</span><span class="n">getsource</span><span class="p">(</span><span class="n">fname</span><span class="p">))</span>
  608. </pre></div>
  609. </div>
  610. </div>
  611. </div>
  612. <div class="tex2jax_ignore mathjax_ignore section" id="hmm-filtering-forwards-algorithm">
  613. <span id="sec-forwards"></span><h1>HMM filtering (forwards algorithm)<a class="headerlink" href="#hmm-filtering-forwards-algorithm" title="Permalink to this headline">¶</a></h1>
  614. <p>The <strong>Bayes filter</strong> is an algorithm for recursively computing
  615. the belief state
  616. <span class="math notranslate nohighlight">\(p(\hidden_t|\obs_{1:t})\)</span> given
  617. the prior belief from the previous step,
  618. <span class="math notranslate nohighlight">\(p(\hidden_{t-1}|\obs_{1:t-1})\)</span>,
  619. the new observation <span class="math notranslate nohighlight">\(\obs_t\)</span>,
  620. and the model.
  621. This can be done using <strong>sequential Bayesian updating</strong>.
  622. For a dynamical model, this reduces to the
  623. <strong>predict-update</strong> cycle described below.</p>
  624. <p>The <strong>prediction step</strong> is just the <strong>Chapman-Kolmogorov equation</strong>:</p>
  625. <div class="math notranslate nohighlight">
  626. \[p(\hidden_t|\obs_{1:t-1})
  627. = \int p(\hidden_t|\hidden_{t-1}) p(\hidden_{t-1}|\obs_{1:t-1}) d\hidden_{t-1}\]</div>
  628. <p>The prediction step computes
  629. the one-step-ahead predictive distribution
  630. for the latent state, which converts
  631. the posterior from the previous time step into the prior
  632. for the current step.</p>
  633. <p>The <strong>update step</strong>
  634. is just Bayes rule:</p>
  635. <div class="math notranslate nohighlight">
  636. \[p(\hidden_t|\obs_{1:t}) = \frac{1}{Z_t}
  637. p(\obs_t|\hidden_t) p(\hidden_t|\obs_{1:t-1})\]</div>
  638. <p>where the normalization constant is</p>
  639. <div class="math notranslate nohighlight">
  640. \[Z_t = \int p(\obs_t|\hidden_t) p(\hidden_t|\obs_{1:t-1}) d\hidden_{t}
  641. = p(\obs_t|\obs_{1:t-1})\]</div>
  642. <p>When the latent states <span class="math notranslate nohighlight">\(\hidden_t\)</span> are discrete, as in an HMM,
  643. the above integrals become sums.
  644. In particular, suppose we define
  645. the belief state as <span class="math notranslate nohighlight">\(\alpha_t(j) \defeq p(\hidden_t=j|\obs_{1:t})\)</span>,
  646. the local evidence as <span class="math notranslate nohighlight">\(\lambda_t(j) \defeq p(\obs_t|\hidden_t=j)\)</span>,
  647. and the transition matrix
  648. <span class="math notranslate nohighlight">\(A(i,j) = p(\hidden_t=j|\hidden_{t-1}=i)\)</span>.
  649. Then the predict step becomes</p>
  650. <div class="math notranslate nohighlight" id="equation-eqn-predictivehmm">
  651. <span class="eqno">(19)<a class="headerlink" href="#equation-eqn-predictivehmm" title="Permalink to this equation">¶</a></span>\[\alpha_{t|t-1}(j) \defeq p(\hidden_t=j|\obs_{1:t-1})
  652. = \sum_i \alpha_{t-1}(i) A(i,j)\]</div>
  653. <p>and the update step becomes</p>
  654. <div class="math notranslate nohighlight" id="equation-eqn-fwdseqn">
  655. <span class="eqno">(20)<a class="headerlink" href="#equation-eqn-fwdseqn" title="Permalink to this equation">¶</a></span>\[\alpha_t(j)
  656. = \frac{1}{Z_t} \lambda_t(j) \alpha_{t|t-1}(j)
  657. = \frac{1}{Z_t} \lambda_t(j) \left[\sum_i \alpha_{t-1}(i) A(i,j) \right]\]</div>
  658. <p>where
  659. the normalization constant for each time step is given by</p>
  660. <div class="math notranslate nohighlight" id="equation-eqn-hmmz">
  661. <span class="eqno">(21)<a class="headerlink" href="#equation-eqn-hmmz" title="Permalink to this equation">¶</a></span>\[\begin{split}\begin{align}
  662. Z_t \defeq p(\obs_t|\obs_{1:t-1})
  663. &amp;= \sum_{j=1}^K p(\obs_t|\hidden_t=j) p(\hidden_t=j|\obs_{1:t-1}) \\
  664. &amp;= \sum_{j=1}^K \lambda_t(j) \alpha_{t|t-1}(j)
  665. \end{align}\end{split}\]</div>
  666. <p>Since all the quantities are finite length vectors and matrices,
  667. we can write the update equation
  668. in matrix-vector notation as follows:</p>
  669. <div class="math notranslate nohighlight">
  670. \[\valpha_t =\text{normalize}\left(
  671. \vlambda_t \dotstar (\vA^{\trans} \valpha_{t-1}) \right)
  672. \label{eqn:fwdsAlgoMatrixForm}\]</div>
  673. <p>where <span class="math notranslate nohighlight">\(\dotstar\)</span> represents
  674. elementwise vector multiplication,
  675. and the <span class="math notranslate nohighlight">\(\text{normalize}\)</span> function just ensures its argument sums to one.</p>
  676. <p>In the section on casino HMM inference (<code>sec:casino-inference</code>),
  677. we illustrate
  678. filtering for the casino HMM,
  679. applied to a random sequence <span class="math notranslate nohighlight">\(\obs_{1:T}\)</span> of length <span class="math notranslate nohighlight">\(T=300\)</span>.
  680. In blue, we plot the probability that the die is in the loaded (vs fair) state,
  681. based on the evidence seen so far.
  682. The gray bars indicate time intervals during which the generative
  683. process actually switched to the loaded die.
  684. We see that the probability generally increases in the right places.</p>
  685. <p>Here is a JAX implementation of the forwards algorithm.</p>
  686. <div class="cell docutils container">
  687. <div class="cell_input docutils container">
  688. <div class="highlight-ipython3 notranslate"><div class="highlight"><pre><span></span><span class="kn">import</span> <span class="nn">jsl.hmm.hmm_lib</span> <span class="k">as</span> <span class="nn">hmm_lib</span>
  689. <span class="n">print_source</span><span class="p">(</span><span class="n">hmm_lib</span><span class="o">.</span><span class="n">hmm_forwards_jax</span><span class="p">)</span>
  690. <span class="c1">#https://github.com/probml/JSL/blob/main/jsl/hmm/hmm_lib.py#L189</span>
  691. </pre></div>
  692. </div>
  693. </div>
  694. <div class="cell_output docutils container">
  695. <div class="output text_html"><pre style="white-space:pre;overflow-x:auto;line-height:normal;font-family:Menlo,'DejaVu Sans Mono',consolas,'Courier New',monospace">@jit
  696. def hmm_forwards_jax<span style="font-weight: bold">(</span>params, obs_seq, <span style="color: #808000; text-decoration-color: #808000">length</span>=<span style="color: #800080; text-decoration-color: #800080; font-style: italic">None</span><span style="font-weight: bold">)</span>:
  697. <span style="color: #008000; text-decoration-color: #008000">''</span>'
  698. Calculates a belief state
  699. Parameters
  700. ----------
  701. params : HMMJax
  702. Hidden Markov Model
  703. obs_seq: array<span style="font-weight: bold">(</span>seq_len<span style="font-weight: bold">)</span>
  704. History of observable events
  705. Returns
  706. -------
  707. * float
  708. The loglikelihood giving log<span style="font-weight: bold">(</span>p<span style="font-weight: bold">(</span>x|model<span style="font-weight: bold">))</span>
  709. * array<span style="font-weight: bold">(</span>seq_len, n_hidden<span style="font-weight: bold">)</span> :
  710. All alpha values found for each sample
  711. <span style="color: #008000; text-decoration-color: #008000">''</span>'
  712. seq_len = len<span style="font-weight: bold">(</span>obs_seq<span style="font-weight: bold">)</span>
  713. if length is <span style="color: #800080; text-decoration-color: #800080; font-style: italic">None</span>:
  714. length = seq_len
  715. trans_mat, obs_mat, init_dist = params.trans_mat, params.obs_mat, params.init_dist
  716. trans_mat = jnp.array<span style="font-weight: bold">(</span>trans_mat<span style="font-weight: bold">)</span>
  717. obs_mat = jnp.array<span style="font-weight: bold">(</span>obs_mat<span style="font-weight: bold">)</span>
  718. init_dist = jnp.array<span style="font-weight: bold">(</span>init_dist<span style="font-weight: bold">)</span>
  719. n_states, n_obs = obs_mat.shape
  720. def scan_fn<span style="font-weight: bold">(</span>carry, t<span style="font-weight: bold">)</span>:
  721. <span style="font-weight: bold">(</span>alpha_prev, log_ll_prev<span style="font-weight: bold">)</span> = carry
  722. alpha_n = jnp.where<span style="font-weight: bold">(</span>t &lt; length,
  723. obs_mat<span style="font-weight: bold">[</span>:, obs_seq<span style="font-weight: bold">[</span>t<span style="font-weight: bold">]]</span> * <span style="font-weight: bold">(</span>alpha_prev<span style="font-weight: bold">[</span>:, <span style="color: #800080; text-decoration-color: #800080; font-style: italic">None</span><span style="font-weight: bold">]</span> *
  724. trans_mat<span style="font-weight: bold">)</span>.sum<span style="font-weight: bold">(</span><span style="color: #808000; text-decoration-color: #808000">axis</span>=<span style="color: #000080; text-decoration-color: #000080; font-weight: bold">0</span><span style="font-weight: bold">)</span>,
  725. jnp.zeros_like<span style="font-weight: bold">(</span>alpha_prev<span style="font-weight: bold">))</span>
  726. alpha_n, cn = normalize<span style="font-weight: bold">(</span>alpha_n<span style="font-weight: bold">)</span>
  727. carry = <span style="font-weight: bold">(</span>alpha_n, jnp.log<span style="font-weight: bold">(</span>cn<span style="font-weight: bold">)</span> + log_ll_prev<span style="font-weight: bold">)</span>
  728. return carry, alpha_n
  729. # initial belief state
  730. alpha_0, c0 = normalize<span style="font-weight: bold">(</span>init_dist * obs_mat<span style="font-weight: bold">[</span>:, obs_seq<span style="font-weight: bold">[</span><span style="color: #000080; text-decoration-color: #000080; font-weight: bold">0</span><span style="font-weight: bold">]])</span>
  731. # setup scan loop
  732. init_state = <span style="font-weight: bold">(</span>alpha_0, jnp.log<span style="font-weight: bold">(</span>c0<span style="font-weight: bold">))</span>
  733. ts = jnp.arange<span style="font-weight: bold">(</span><span style="color: #000080; text-decoration-color: #000080; font-weight: bold">1</span>, seq_len<span style="font-weight: bold">)</span>
  734. carry, alpha_hist = lax.scan<span style="font-weight: bold">(</span>scan_fn, init_state, ts<span style="font-weight: bold">)</span>
  735. # post-process
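  736. alpha_hist = jnp.vstack<span style="font-weight: bold">([</span>alpha_0.reshape<span style="font-weight: bold">(</span><span style="color: #000080; text-decoration-color: #000080; font-weight: bold">1</span>, n_states<span style="font-weight: bold">)</span>, alpha_hist<span style="font-weight: bold">])</span>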
  737. <span style="font-weight: bold">(</span>alpha_final, log_ll<span style="font-weight: bold">)</span> = carry
  738. return log_ll, alpha_hist
  739. </pre>
  740. </div></div>
  741. </div>
  742. </div>
  743. <script type="text/x-thebe-config">
  744. {
  745. requestKernel: true,
  746. binderOptions: {
  747. repo: "binder-examples/jupyter-stacks-datascience",
  748. ref: "master",
  749. },
  750. codeMirrorConfig: {
  751. theme: "abcdef",
  752. mode: "python"
  753. },
  754. kernelOptions: {
  755. kernelName: "python3",
  756. path: "./chapters/hmm"
  757. },
  758. predefinedOutput: true
  759. }
  760. </script>
  761. <script>kernelName = 'python3'</script>
  762. </div>
  763. <!-- Previous / next buttons -->
  764. <div class='prev-next-area'>
  765. <a class='left-prev' id="prev-link" href="hmm_index.html" title="previous page">
  766. <i class="fas fa-angle-left"></i>
  767. <div class="prev-next-info">
  768. <p class="prev-next-subtitle">previous</p>
  769. <p class="prev-next-title">Hidden Markov Models</p>
  770. </div>
  771. </a>
  772. <a class='right-next' id="next-link" href="hmm_smoother.html" title="next page">
  773. <div class="prev-next-info">
  774. <p class="prev-next-subtitle">next</p>
  775. <p class="prev-next-title">HMM smoothing (forwards-backwards algorithm)</p>
  776. </div>
  777. <i class="fas fa-angle-right"></i>
  778. </a>
  779. </div>
  780. </div>
  781. </div>
  782. <footer class="footer">
  783. <p>
  784. By Kevin Murphy, Scott Linderman, et al.<br/>
  785. &copy; Copyright 2021.<br/>
  786. </p>
  787. </footer>
  788. </main>
  789. </div>
  790. </div>
  791. <script src="../../_static/js/index.be7d3bbb2ef33a8344ce.js"></script>
  792. </body>
  793. </html>